alexmarques
committed on
Commit
•
6ef48df
1
Parent(s):
c265f0f
Update README.md
Browse files
README.md
CHANGED
@@ -202,9 +202,9 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
202 |
</td>
|
203 |
<td>78.06
|
204 |
</td>
|
205 |
-
<td>77.
|
206 |
</td>
|
207 |
-
<td>99.
|
208 |
</td>
|
209 |
</tr>
|
210 |
<tr>
|
@@ -212,9 +212,9 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
212 |
</td>
|
213 |
<td>54.48
|
214 |
</td>
|
215 |
-
<td>54.
|
216 |
</td>
|
217 |
-
<td>99.
|
218 |
</td>
|
219 |
</tr>
|
220 |
<tr>
|
@@ -222,7 +222,7 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
222 |
</td>
|
223 |
<td><strong>74.05</strong>
|
224 |
</td>
|
225 |
-
<td><strong>74.
|
226 |
</td>
|
227 |
<td><strong>100.0%</strong>
|
228 |
</td>
|
|
|
202 |
</td>
|
203 |
<td>78.06
|
204 |
</td>
|
205 |
+
<td>77.51
|
206 |
</td>
|
207 |
+
<td>99.3%
|
208 |
</td>
|
209 |
</tr>
|
210 |
<tr>
|
|
|
212 |
</td>
|
213 |
<td>54.48
|
214 |
</td>
|
215 |
+
<td>54.41
|
216 |
</td>
|
217 |
+
<td>99.9%
|
218 |
</td>
|
219 |
</tr>
|
220 |
<tr>
|
|
|
222 |
</td>
|
223 |
<td><strong>74.05</strong>
|
224 |
</td>
|
225 |
+
<td><strong>74.06</strong>
|
226 |
</td>
|
227 |
<td><strong>100.0%</strong>
|
228 |
</td>
|