+metrics: hellaswag
Browse files
README.md
CHANGED
@@ -9,4 +9,6 @@ language:
|
|
9 |
|arc_challenge|Yaml |none | 25|acc |0.1775|± |0.0112|
|
10 |
| | |none | 25|acc_norm|0.2133|± |0.0120|
|
11 |
|truthfulqa_mc2|Yaml |none | 0|acc |0.4457|± |0.0152|
|
12 |
-
|winogrande|Yaml |none | 5|acc |0.5154|± | 0.014|
|
|
|
|
|
|
9 |
|arc_challenge|Yaml |none | 25|acc |0.1775|± |0.0112|
|
10 |
| | |none | 25|acc_norm|0.2133|± |0.0120|
|
11 |
|truthfulqa_mc2|Yaml |none | 0|acc |0.4457|± |0.0152|
|
12 |
+
|winogrande|Yaml |none | 5|acc |0.5154|± | 0.014|
|
13 |
+
|hellaswag|Yaml |none | 10|acc |0.2832|± |0.0045|
|
14 |
+
| | |none | 10|acc_norm|0.3024|± |0.0046|
|