lunahr committed on
Commit
fee0a19
1 Parent(s): c42ddb0

updated usernames

Browse files
Files changed (1) hide show
  1. README.md +9 -9
README.md CHANGED
@@ -13,7 +13,7 @@ tags:
13
  base_model: meta-llama/Llama-3.2-3B-Instruct
14
  datasets:
15
  - KingNish/reasoning-base-20k
16
- - piotr25691/thea-name-overrides
17
  model-index:
18
  - name: thea-c-3b-25r
19
  results:
@@ -30,7 +30,7 @@ model-index:
30
  value: 74.02
31
  name: strict accuracy
32
  source:
33
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
34
  name: Open LLM Leaderboard
35
  - task:
36
  type: text-generation
@@ -45,7 +45,7 @@ model-index:
45
  value: 22.77
46
  name: normalized accuracy
47
  source:
48
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
49
  name: Open LLM Leaderboard
50
  - task:
51
  type: text-generation
@@ -60,7 +60,7 @@ model-index:
60
  value: 13.37
61
  name: exact match
62
  source:
63
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
64
  name: Open LLM Leaderboard
65
  - task:
66
  type: text-generation
@@ -75,7 +75,7 @@ model-index:
75
  value: 2.01
76
  name: acc_norm
77
  source:
78
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
79
  name: Open LLM Leaderboard
80
  - task:
81
  type: text-generation
@@ -90,7 +90,7 @@ model-index:
90
  value: 1.27
91
  name: acc_norm
92
  source:
93
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
94
  name: Open LLM Leaderboard
95
  - task:
96
  type: text-generation
@@ -107,7 +107,7 @@ model-index:
107
  value: 24.2
108
  name: accuracy
109
  source:
110
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
111
  name: Open LLM Leaderboard
112
  ---
113
 
@@ -123,7 +123,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
123
  MAX_REASONING_TOKENS = 1024
124
  MAX_RESPONSE_TOKENS = 512
125
 
126
- model_name = "piotr25691/thea-3b-25r"
127
 
128
  model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto")
129
  tokenizer = AutoTokenizer.from_pretrained(model_name)
@@ -151,7 +151,7 @@ response_output = tokenizer.decode(response_ids[0, response_inputs.input_ids.sha
151
  print("ANSWER: " + response_output)
152
  ```
153
 
154
- - **Trained by:** [Piotr Zalewski](https://huggingface.co/piotr25691)
155
  - **License:** llama3.2
156
  - **Finetuned from model:** [meta-llama/Llama-3.2-3B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct)
157
  - **Dataset used:** [KingNish/reasoning-base-20k](https://huggingface.co/datasets/KingNish/reasoning-base-20k)
 
13
  base_model: meta-llama/Llama-3.2-3B-Instruct
14
  datasets:
15
  - KingNish/reasoning-base-20k
16
+ - lunahr/thea-name-overrides
17
  model-index:
18
  - name: thea-c-3b-25r
19
  results:
 
30
  value: 74.02
31
  name: strict accuracy
32
  source:
33
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
34
  name: Open LLM Leaderboard
35
  - task:
36
  type: text-generation
 
45
  value: 22.77
46
  name: normalized accuracy
47
  source:
48
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
49
  name: Open LLM Leaderboard
50
  - task:
51
  type: text-generation
 
60
  value: 13.37
61
  name: exact match
62
  source:
63
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
64
  name: Open LLM Leaderboard
65
  - task:
66
  type: text-generation
 
75
  value: 2.01
76
  name: acc_norm
77
  source:
78
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
79
  name: Open LLM Leaderboard
80
  - task:
81
  type: text-generation
 
90
  value: 1.27
91
  name: acc_norm
92
  source:
93
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
94
  name: Open LLM Leaderboard
95
  - task:
96
  type: text-generation
 
107
  value: 24.2
108
  name: accuracy
109
  source:
110
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
111
  name: Open LLM Leaderboard
112
  ---
113
 
 
123
  MAX_REASONING_TOKENS = 1024
124
  MAX_RESPONSE_TOKENS = 512
125
 
126
+ model_name = "lunahr/thea-3b-25r"
127
 
128
  model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto")
129
  tokenizer = AutoTokenizer.from_pretrained(model_name)
 
151
  print("ANSWER: " + response_output)
152
  ```
153
 
154
+ - **Trained by:** [Piotr Zalewski](https://huggingface.co/lunahr)
155
  - **License:** llama3.2
156
  - **Finetuned from model:** [meta-llama/Llama-3.2-3B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct)
157
  - **Dataset used:** [KingNish/reasoning-base-20k](https://huggingface.co/datasets/KingNish/reasoning-base-20k)