UjjwalPardeshi committed on
Commit
fc3fbaf
·
1 Parent(s): 5b89fc4

fix: add has_grader: true to all tasks for evaluator grader check

Browse files
Files changed (2) hide show
  1. openenv.yaml +7 -0
  2. server/app.py +7 -7
openenv.yaml CHANGED
@@ -36,12 +36,14 @@ tasks:
36
  - id: task_001
37
  difficulty: easy
38
  max_steps: 20
 
39
  param_ranges:
40
  learning_rate: [0.05, 0.08, 0.10, 0.15, 0.30]
41
 
42
  - id: task_002
43
  difficulty: easy
44
  max_steps: 20
 
45
  param_ranges:
46
  learning_rate: [1e-6, 5e-6, 1e-5]
47
  depth_multiplier: [1.0, 1.5, 2.0]
@@ -49,12 +51,14 @@ tasks:
49
  - id: task_003
50
  difficulty: medium
51
  max_steps: 25
 
52
  param_ranges:
53
  leakage_pct: [0.12, 0.18, 0.22, 0.28]
54
 
55
  - id: task_004
56
  difficulty: medium
57
  max_steps: 25
 
58
  param_ranges:
59
  weight_decay: [0.0, 0.0001, 0.001]
60
  divergence_epoch: [5, 8, 12]
@@ -62,18 +66,21 @@ tasks:
62
  - id: task_005
63
  difficulty: hard
64
  max_steps: 30
 
65
  param_ranges:
66
  red_herring_intensity: [0.8, 2.5]
67
 
68
  - id: task_006
69
  difficulty: hard
70
  max_steps: 30
 
71
  param_ranges:
72
  bug_type: [eval_mode, detach_loss, zero_grad_missing, inplace_relu]
73
 
74
  - id: task_007
75
  difficulty: hard
76
  max_steps: 25
 
77
  param_ranges:
78
  scheduler_gamma: [0.01, 0.001, 0.0001]
79
  scheduler_step_size: [2, 3, 5]
 
36
  - id: task_001
37
  difficulty: easy
38
  max_steps: 20
39
+ has_grader: true
40
  param_ranges:
41
  learning_rate: [0.05, 0.08, 0.10, 0.15, 0.30]
42
 
43
  - id: task_002
44
  difficulty: easy
45
  max_steps: 20
46
+ has_grader: true
47
  param_ranges:
48
  learning_rate: [1e-6, 5e-6, 1e-5]
49
  depth_multiplier: [1.0, 1.5, 2.0]
 
51
  - id: task_003
52
  difficulty: medium
53
  max_steps: 25
54
+ has_grader: true
55
  param_ranges:
56
  leakage_pct: [0.12, 0.18, 0.22, 0.28]
57
 
58
  - id: task_004
59
  difficulty: medium
60
  max_steps: 25
61
+ has_grader: true
62
  param_ranges:
63
  weight_decay: [0.0, 0.0001, 0.001]
64
  divergence_epoch: [5, 8, 12]
 
66
  - id: task_005
67
  difficulty: hard
68
  max_steps: 30
69
+ has_grader: true
70
  param_ranges:
71
  red_herring_intensity: [0.8, 2.5]
72
 
73
  - id: task_006
74
  difficulty: hard
75
  max_steps: 30
76
+ has_grader: true
77
  param_ranges:
78
  bug_type: [eval_mode, detach_loss, zero_grad_missing, inplace_relu]
79
 
80
  - id: task_007
81
  difficulty: hard
82
  max_steps: 25
83
+ has_grader: true
84
  param_ranges:
85
  scheduler_gamma: [0.01, 0.001, 0.0001]
86
  scheduler_step_size: [2, 3, 5]
server/app.py CHANGED
@@ -46,13 +46,13 @@ logger = logging.getLogger(__name__)
46
 
47
  # All 7 tasks
48
  ALL_TASKS = [
49
- {"id": "task_001", "difficulty": "easy", "max_steps": 20},
50
- {"id": "task_002", "difficulty": "easy", "max_steps": 20},
51
- {"id": "task_003", "difficulty": "medium", "max_steps": 25},
52
- {"id": "task_004", "difficulty": "medium", "max_steps": 25},
53
- {"id": "task_005", "difficulty": "hard", "max_steps": 30},
54
- {"id": "task_006", "difficulty": "hard", "max_steps": 30},
55
- {"id": "task_007", "difficulty": "hard", "max_steps": 25},
56
  ]
57
 
58
  # create_app takes the class (factory), not an instance
 
46
 
47
  # All 7 tasks
48
  ALL_TASKS = [
49
+ {"id": "task_001", "difficulty": "easy", "max_steps": 20, "has_grader": True},
50
+ {"id": "task_002", "difficulty": "easy", "max_steps": 20, "has_grader": True},
51
+ {"id": "task_003", "difficulty": "medium", "max_steps": 25, "has_grader": True},
52
+ {"id": "task_004", "difficulty": "medium", "max_steps": 25, "has_grader": True},
53
+ {"id": "task_005", "difficulty": "hard", "max_steps": 30, "has_grader": True},
54
+ {"id": "task_006", "difficulty": "hard", "max_steps": 30, "has_grader": True},
55
+ {"id": "task_007", "difficulty": "hard", "max_steps": 25, "has_grader": True},
56
  ]
57
 
58
  # create_app takes the class (factory), not an instance