DEVessi committed on
Commit
b761978
·
verified ·
1 Parent(s): 516d2c6

Upload folder using huggingface_hub

Browse files
inference.py CHANGED
@@ -177,10 +177,10 @@ def main():
177
  })
178
 
179
  final_score = getattr(obs, 'grader_score', 0.0)
180
- if getattr(obs, 'grader_score', 0.0) >= 1.0 or getattr(obs, 'done', False) or (hasattr(result, 'done') and result.done):
181
  break
182
 
183
- success_str = "true" if final_score >= 1.0 else "false"
184
  rewards_str = ",".join(rewards) if rewards else "0.00"
185
  print(f"[END] success={success_str} steps={steps_taken} score={final_score:.2f} rewards={rewards_str}", flush=True)
186
  except Exception as e:
 
177
  })
178
 
179
  final_score = getattr(obs, 'grader_score', 0.0)
180
+ if getattr(obs, 'grader_score', 0.0) >= 0.99 or getattr(obs, 'done', False) or (hasattr(result, 'done') and result.done):
181
  break
182
 
183
+ success_str = "true" if final_score >= 0.99 else "false"
184
  rewards_str = ",".join(rewards) if rewards else "0.00"
185
  print(f"[END] success={success_str} steps={steps_taken} score={final_score:.2f} rewards={rewards_str}", flush=True)
186
  except Exception as e:
server/devops_sandbox_environment.py CHANGED
@@ -434,6 +434,7 @@ class DevOpsSandbox(Environment):
434
  raw_target = 1.0
435
 
436
  final_score = min(1.0, score / raw_target)
437
- final_score = round(min(max(final_score, 0.0), 1.0), 2)
 
438
 
439
  return (final_score, " | ".join(feedback_parts))
 
434
  raw_target = 1.0
435
 
436
  final_score = min(1.0, score / raw_target)
437
+ # Cap strictly within (0, 1) per Phase 2 Validator requirements
438
+ final_score = round(min(max(final_score, 0.01), 0.99), 2)
439
 
440
  return (final_score, " | ".join(feedback_parts))