Update README.md
Browse files
README.md
CHANGED
@@ -21,9 +21,9 @@ model-index:
|
|
21 |
- name: GSM8k (0-Shot)
|
22 |
type: GSM8k (0-Shot)
|
23 |
value: 17%
|
24 |
-
|
25 |
-
|
26 |
-
|
27 |
co2_eq_emissions:
|
28 |
emissions: 7100
|
29 |
source: "https://mlco2.github.io/impact#compute"
|
@@ -44,7 +44,7 @@ It has been trained using [TRL](https://github.com/huggingface/trl).
|
|
44 |
| Model | GSM8k 0-Shot | GSM8k Few-Shot |
|
45 |
|------------------------------------------|------------------|-------------------|
|
46 |
| Mistral-7B-v0.1 | 10% | 41% |
|
47 |
-
| Qwen2.5-1.5B-Thinking | 17% |
|
48 |
|
49 |
## Training procedure
|
50 |
|
|
|
21 |
- name: GSM8k (0-Shot)
|
22 |
type: GSM8k (0-Shot)
|
23 |
value: 17%
|
24 |
+
- name: GSM8k (Few-Shot)
|
25 |
+
type: GSM8k (Few-Shot)
|
26 |
+
value: 64.2%
|
27 |
co2_eq_emissions:
|
28 |
emissions: 7100
|
29 |
source: "https://mlco2.github.io/impact#compute"
|
|
|
44 |
| Model | GSM8k 0-Shot | GSM8k Few-Shot |
|
45 |
|------------------------------------------|------------------|-------------------|
|
46 |
| Mistral-7B-v0.1 | 10% | 41% |
|
47 |
+
| Qwen2.5-1.5B-Thinking | 17% | 64.2% |
|
48 |
|
49 |
## Training procedure
|
50 |
|