melaseddik committed on
Commit
bad033a
1 Parent(s): f8fb5e2

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +67 -0
README.md CHANGED
@@ -167,6 +167,73 @@ print(tokenizer.decode(outputs[0]))
167
  </table>
168
 
169
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
170
  # Citation
171
 
172
 
 
167
  </table>
168
 
169
 
170
+ <table border="1" style="width: 100%; text-align: center;">
171
+ <colgroup>
172
+ <col style="width: 10%;">
173
+ <col style="width: 10%;">
174
+ <col style="width: 7%;">
175
+ <col style="width: 7%;">
176
+ <col style="width: 7%;">
177
+ <col style="background-color: rgba(128, 0, 128, 0.5); width: 7%;">
178
+ <col style="width: 7%;">
179
+ <col style="width: 7%;">
180
+ <col style="width: 7%;">
181
+ <col style="background-color: rgba(128, 0, 128, 0.5); width: 7%;">
182
+ </colgroup>
183
+ <thead>
184
+ <tr>
185
+ <th>Category</th>
186
+ <th>Benchmark</th>
187
+ <th>Llama3.1-8B</th>
188
+ <th>Qwen2-7B</th>
189
+ <th>Qwen2.5-7B</th>
190
+ <th>Falcon3-7B-Base</th>
191
+ <th>Gemma2-9B</th>
192
+ <th>Yi1.5-9B</th>
193
+ <th>Mistral-NeMo-12B</th>
194
+ <th>Falcon3-10B-Base</th>
195
+ </tr>
196
+ </thead>
197
+ <tbody>
198
+ <tr>
199
+ <td rowspan="3">General</td>
200
+ <td>MMLU (5-shot)</td>
201
+ <td>65.2</td>
202
+ <td>70.4</td>
203
+ <td>74.2</td>
204
+ <td>67.5</td>
205
+ <td>0</td>
206
+ <td>69.6</td>
207
+ <td>68.8</td>
208
+ <td>73.1</td>
209
+ </tr>
210
+ <tr>
211
+ <td>MMLU-PRO (5-shot)</td>
212
+ <td>32.7</td>
213
+ <td>42.1</td>
214
+ <td>43.5</td>
215
+ <td>39.2</td>
216
+ <td>0</td>
217
+ <td>39.3</td>
218
+ <td>34.7</td>
219
+ <td>42.5</td>
220
+ </tr>
221
+ <tr>
222
+ <td>IFEval</td>
223
+ <td>12.0</td>
224
+ <td>30.6</td>
225
+ <td>33.9</td>
226
+ <td>34.3</td>
227
+ <td>0</td>
228
+ <td>29.1</td>
229
+ <td>16.1</td>
230
+ <td>36.4</td>
231
+ </tr>
232
+ <!-- Continue with other rows similarly -->
233
+ </tbody>
234
+ </table>
235
+
236
+
237
  # Citation
238
 
239