csabakecskemeti committed on
Commit
f01ec6b
1 Parent(s): e058427

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +51 -0
README.md CHANGED
@@ -11,6 +11,56 @@ tags:
11
  model-index:
12
  - name: analytical_reasoning_r16a32_unsloth-Llama-3.2-3B-Instruct-bnb-4bit
13
  results:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  - task:
15
  type: text-generation
16
  dataset:
@@ -25,6 +75,7 @@ model-index:
25
  type: acc_norm
26
  value: 0.6793
27
  verified: false
 
28
  ---
29
 
30
  ![image/png](https://cdn-uploads.huggingface.co/production/uploads/64e6d37e02dee9bcb9d9fa18/X4WG8AnMFqJuWkRvA0CrW.png)
 
11
  model-index:
12
  - name: analytical_reasoning_r16a32_unsloth-Llama-3.2-3B-Instruct-bnb-4bit
13
  results:
14
+ - task:
15
+ type: text-generation
16
+ dataset:
17
+ type: lm-evaluation-harness
18
+ name: bbh
19
+ metrics:
20
+ - name: acc_norm
21
+ type: acc_norm
22
+ value: 0.4168
23
+ verified: false
24
+ - task:
25
+ type: text-generation
26
+ dataset:
27
+ type: lm-evaluation-harness
28
+ name: gpqa
29
+ metrics:
30
+ - name: acc_norm
31
+ type: acc_norm
32
+ value: 0.2691
33
+ verified: false
34
+ - task:
35
+ type: text-generation
36
+ dataset:
37
+ type: lm-evaluation-harness
38
+ name: math
39
+ metrics:
40
+ - name: exact_match
41
+ type: exact_match
42
+ value: 0.0867
43
+ verified: false
44
+ - task:
45
+ type: text-generation
46
+ dataset:
47
+ type: lm-evaluation-harness
48
+ name: mmlu
49
+ metrics:
50
+ - name: acc_norm
51
+ type: acc_norm
52
+ value: 0.2822
53
+ verified: false
54
+ - task:
55
+ type: text-generation
56
+ dataset:
57
+ type: lm-evaluation-harness
58
+ name: musr
59
+ metrics:
60
+ - name: acc_norm
61
+ type: acc_norm
62
+ value: 0.3648
63
+ verified: false
64
  - task:
65
  type: text-generation
66
  dataset:
 
75
  type: acc_norm
76
  value: 0.6793
77
  verified: false
78
+
79
  ---
80
 
81
  ![image/png](https://cdn-uploads.huggingface.co/production/uploads/64e6d37e02dee9bcb9d9fa18/X4WG8AnMFqJuWkRvA0CrW.png)