Update README.md
Browse files
README.md
CHANGED
@@ -126,7 +126,18 @@ This is a large language model with 12 billion parameters, created by merging mu
|
|
126 |
- **Paper [optional]:** N/A
|
127 |
- **Demo [optional]:** N/A
|
128 |
|
129 |
-
##
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
130 |
|
131 |
### Direct Use
|
132 |
|
@@ -171,16 +182,5 @@ inputs = tokenizer(prompt, return_tensors="pt")
|
|
171 |
outputs = model.generate(**inputs.to("cuda"), max_new_tokens=100)
|
172 |
result = tokenizer.batch_decode(outputs, skip_special_tokens=True)
|
173 |
print(result)
|
174 |
-
# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
|
175 |
-
Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_Xclbr7__caliburn-12b)
|
176 |
|
177 |
-
| Metric |Value|
|
178 |
-
|-------------------|----:|
|
179 |
-
|Avg. |22.68|
|
180 |
-
|IFEval (0-Shot) |35.76|
|
181 |
-
|BBH (3-Shot) |35.64|
|
182 |
-
|MATH Lvl 5 (4-Shot)| 9.67|
|
183 |
-
|GPQA (0-shot) |11.52|
|
184 |
-
|MuSR (0-shot) |13.78|
|
185 |
-
|MMLU-PRO (5-shot) |29.72|
|
186 |
|
|
|
126 |
- **Paper [optional]:** N/A
|
127 |
- **Demo [optional]:** N/A
|
128 |
|
129 |
+
## [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
|
130 |
+
Detailed per-benchmark results are available in the [Open LLM Leaderboard details dataset](https://huggingface.co/datasets/open-llm-leaderboard/details_Xclbr7__caliburn-12b)
|
131 |
+
|
132 |
+
| Metric |Value|
|
133 |
+
|-------------------|----:|
|
134 |
+
|Avg. |22.68|
|
135 |
+
|IFEval (0-Shot) |35.76|
|
136 |
+
|BBH (3-Shot) |35.64|
|
137 |
+
|MATH Lvl 5 (4-Shot)| 9.67|
|
138 |
+
|GPQA (0-shot) |11.52|
|
139 |
+
|MuSR (0-shot) |13.78|
|
140 |
+
|MMLU-PRO (5-shot) |29.72|
|
141 |
|
142 |
### Direct Use
|
143 |
|
|
|
182 |
outputs = model.generate(**inputs.to("cuda"), max_new_tokens=100)
|
183 |
result = tokenizer.batch_decode(outputs, skip_special_tokens=True)
|
184 |
print(result)
|
|
|
|
|
185 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
186 |
|