Graheet committed on
Commit
17c3cb4
·
1 Parent(s): 567645a

Clamp task score strictly within (0, 1) for evaluator compliance

Browse files
Files changed (1) hide show
  1. grader.py +2 -1
grader.py CHANGED
@@ -137,7 +137,8 @@ def grade_task_result(
137
  + 0.15 * uncertainty_accuracy
138
  + 0.15 * consistency_score
139
  )
140
- return max(0.0, min(1.0, task_score))
 
141
 
142
 
143
  def task_failure_messages(
 
137
  + 0.15 * uncertainty_accuracy
138
  + 0.15 * consistency_score
139
  )
140
+ eps = 1e-6
141
+ return max(eps, min(1.0 - eps, task_score))
142
 
143
 
144
  def task_failure_messages(