Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
pminervini
committed on
Commit
•
e7827c3
1
Parent(s):
fb52440
update
Browse files
- src/backend/envs.py +0 -1
- src/leaderboard/read_evals.py +1 -1
src/backend/envs.py
CHANGED
@@ -58,7 +58,6 @@ class Tasks(Enum):
     task20 = Task("race", "acc", "RACE", 0)
 
 
-
 EVAL_REQUESTS_PATH_BACKEND = os.path.join(CACHE_PATH, "eval-queue-bk")
 EVAL_RESULTS_PATH_BACKEND = os.path.join(CACHE_PATH, "eval-results-bk")
 
src/leaderboard/read_evals.py
CHANGED
@@ -93,7 +93,7 @@ class EvalResult:
 
 if to_add is True:
     multiplier = 100.0
-    if 'rouge' in metric:
+    if 'rouge' in metric and 'truthful' not in benchmark:
         multiplier = 1.0
     if 'squad' in benchmark:
         multiplier = 1.0