Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Update src/leaderboard/read_evals.py
Browse files
src/leaderboard/read_evals.py
CHANGED
@@ -77,7 +77,6 @@ class EvalResult:
|
|
77 |
task_value = task.value
|
78 |
if task_value.metric in scores:
|
79 |
results[task_value.benchmark] = Decimal(scores[task_value.metric])
|
80 |
-
print(f"Debug: {task_value.benchmark} = {results[task_value.benchmark]}")
|
81 |
|
82 |
|
83 |
return self(
|
@@ -128,7 +127,8 @@ class EvalResult:
|
|
128 |
}
|
129 |
|
130 |
for task in Tasks:
|
131 |
-
|
|
|
132 |
print(f"Debug: {task_value.col_name} = {self.results.get(task_value.benchmark, 'Not Found')}")
|
133 |
|
134 |
return data_dict
|
|
|
77 |
task_value = task.value
|
78 |
if task_value.metric in scores:
|
79 |
results[task_value.benchmark] = Decimal(scores[task_value.metric])
|
|
|
80 |
|
81 |
|
82 |
return self(
|
|
|
127 |
}
|
128 |
|
129 |
for task in Tasks:
|
130 |
+
task_value = task.value
|
131 |
+
data_dict[task_value.col_name] = self.results.get(task_value.benchmark, None)
|
132 |
print(f"Debug: {task_value.col_name} = {self.results.get(task_value.benchmark, 'Not Found')}")
|
133 |
|
134 |
return data_dict
|