alexmarques
committed on
Commit
•
e8aa908
1
Parent(s):
cc8251c
Update README.md
Browse files
README.md
CHANGED
@@ -172,11 +172,11 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
172 |
<tr>
|
173 |
<td>MMLU (CoT, 0-shot)
|
174 |
</td>
|
175 |
-
<td>88.
|
176 |
</td>
|
177 |
<td>88.23
|
178 |
</td>
|
179 |
-
<td>100.
|
180 |
</td>
|
181 |
</tr>
|
182 |
<tr>
|
@@ -232,7 +232,7 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
232 |
<tr>
|
233 |
<td><strong>Average</strong>
|
234 |
</td>
|
235 |
-
<td><strong>86.
|
236 |
</td>
|
237 |
<td><strong>86.89</strong>
|
238 |
</td>
|
|
|
172 |
<tr>
|
173 |
<td>MMLU (CoT, 0-shot)
|
174 |
</td>
|
175 |
+
<td>88.26
|
176 |
</td>
|
177 |
<td>88.23
|
178 |
</td>
|
179 |
+
<td>100.0%
|
180 |
</td>
|
181 |
</tr>
|
182 |
<tr>
|
|
|
232 |
<tr>
|
233 |
<td><strong>Average</strong>
|
234 |
</td>
|
235 |
+
<td><strong>86.75</strong>
|
236 |
</td>
|
237 |
<td><strong>86.89</strong>
|
238 |
</td>
|