Spaces:
Sleeping
Sleeping
Graheet committed on
Commit ·
17c3cb4
1
Parent(s): 567645a
Clamp task score strictly within (0, 1) for evaluator compliance
Browse files
grader.py
CHANGED
|
@@ -137,7 +137,8 @@ def grade_task_result(
|
|
| 137 |
+ 0.15 * uncertainty_accuracy
|
| 138 |
+ 0.15 * consistency_score
|
| 139 |
)
|
| 140 |
-
|
|
|
|
| 141 |
|
| 142 |
|
| 143 |
def task_failure_messages(
|
|
|
|
| 137 |
+ 0.15 * uncertainty_accuracy
|
| 138 |
+ 0.15 * consistency_score
|
| 139 |
)
|
| 140 |
+
eps = 1e-6
|
| 141 |
+
return max(eps, min(1.0 - eps, task_score))
|
| 142 |
|
| 143 |
|
| 144 |
def task_failure_messages(
|