lunahr/thea-c-3b-25r

@@ -13,7 +13,7 @@ tags:
 base_model: meta-llama/Llama-3.2-3B-Instruct
 datasets:
 - KingNish/reasoning-base-20k
-- piotr25691/thea-name-overrides
 model-index:
 - name: thea-c-3b-25r
   results:
@@ -30,7 +30,7 @@ model-index:
       value: 74.02
       name: strict accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -45,7 +45,7 @@ model-index:
       value: 22.77
       name: normalized accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -60,7 +60,7 @@ model-index:
       value: 13.37
       name: exact match
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -75,7 +75,7 @@ model-index:
       value: 2.01
       name: acc_norm
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -90,7 +90,7 @@ model-index:
       value: 1.27
       name: acc_norm
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -107,7 +107,7 @@ model-index:
       value: 24.2
       name: accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=piotr25691/thea-c-3b-25r
       name: Open LLM Leaderboard
 ---
@@ -123,7 +123,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 MAX_REASONING_TOKENS = 1024
 MAX_RESPONSE_TOKENS = 512
-model_name = "piotr25691/thea-3b-25r"
 model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained(model_name)
@@ -151,7 +151,7 @@ response_output = tokenizer.decode(response_ids[0, response_inputs.input_ids.sha
 print("ANSWER: " + response_output)
 ```
-- **Trained by:** [Piotr Zalewski](https://huggingface.co/piotr25691)
 - **License:** llama3.2
 - **Finetuned from model:** [meta-llama/Llama-3.2-3B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct)
 - **Dataset used:** [KingNish/reasoning-base-20k](https://huggingface.co/datasets/KingNish/reasoning-base-20k)

 base_model: meta-llama/Llama-3.2-3B-Instruct
 datasets:
 - KingNish/reasoning-base-20k
+- lunahr/thea-name-overrides
 model-index:
 - name: thea-c-3b-25r
   results:
       value: 74.02
       name: strict accuracy
     source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 22.77
       name: normalized accuracy
     source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 13.37
       name: exact match
     source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 2.01
       name: acc_norm
     source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 1.27
       name: acc_norm
     source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 24.2
       name: accuracy
     source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=lunahr/thea-c-3b-25r
       name: Open LLM Leaderboard
 ---
 MAX_REASONING_TOKENS = 1024
 MAX_RESPONSE_TOKENS = 512
+model_name = "lunahr/thea-c-3b-25r"
 model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained(model_name)
 print("ANSWER: " + response_output)
 ```
+- **Trained by:** [Piotr Zalewski](https://huggingface.co/lunahr)
 - **License:** llama3.2
 - **Finetuned from model:** [meta-llama/Llama-3.2-3B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct)
 - **Dataset used:** [KingNish/reasoning-base-20k](https://huggingface.co/datasets/KingNish/reasoning-base-20k)