Commit
•
09b4560
1
Parent(s):
c0ff2ac
Update README.md (#1)
Browse files
- Update README.md (459f47ac7da56daed1cff088464d710f563c75dc)
Co-authored-by: Karna <karnakar@users.noreply.huggingface.co>
README.md
CHANGED
@@ -111,24 +111,24 @@ We report in the following table our internal pipeline benchmarks:
|
|
111 |
<tbody>
|
112 |
<tr>
|
113 |
<td>MMLU</td>
|
114 |
-
<td>43.
|
115 |
-
<td>42.
|
116 |
-
<td>
|
117 |
-
<td>43.
|
118 |
</tr>
|
119 |
<tr>
|
120 |
<td>MMLU-PRO</td>
|
121 |
-
<td>18.
|
122 |
-
<td>17.
|
123 |
-
<td>17.
|
124 |
-
<td>18.
|
125 |
</tr>
|
126 |
<tr>
|
127 |
<td>IFEval</td>
|
128 |
-
<td>54.
|
129 |
-
<td>51.
|
130 |
-
<td>51.
|
131 |
-
<td>56.
|
132 |
</tr>
|
133 |
</tbody>
|
134 |
</table>
|
|
|
111 |
<tbody>
|
112 |
<tr>
|
113 |
<td>MMLU</td>
|
114 |
+
<td>43.6</td>
|
115 |
+
<td>42.6</td>
|
116 |
+
<td>43.0</td>
|
117 |
+
<td>43.5</td>
|
118 |
</tr>
|
119 |
<tr>
|
120 |
<td>MMLU-PRO</td>
|
121 |
+
<td>18.5</td>
|
122 |
+
<td>17.7</td>
|
123 |
+
<td>17.3</td>
|
124 |
+
<td>18.5</td>
|
125 |
</tr>
|
126 |
<tr>
|
127 |
<td>IFEval</td>
|
128 |
+
<td>54.9</td>
|
129 |
+
<td>51.4</td>
|
130 |
+
<td>51.2</td>
|
131 |
+
<td>56.1</td>
|
132 |
</tr>
|
133 |
</tbody>
|
134 |
</table>
|