UjjwalPardeshi committed on
Commit ·
fc3fbaf
1
Parent(s): 5b89fc4
fix: add has_grader: true to all tasks for evaluator grader check
Browse files
- openenv.yaml +7 -0
- server/app.py +7 -7
openenv.yaml
CHANGED
|
@@ -36,12 +36,14 @@ tasks:
|
|
| 36 |
- id: task_001
|
| 37 |
difficulty: easy
|
| 38 |
max_steps: 20
|
|
|
|
| 39 |
param_ranges:
|
| 40 |
learning_rate: [0.05, 0.08, 0.10, 0.15, 0.30]
|
| 41 |
|
| 42 |
- id: task_002
|
| 43 |
difficulty: easy
|
| 44 |
max_steps: 20
|
|
|
|
| 45 |
param_ranges:
|
| 46 |
learning_rate: [1e-6, 5e-6, 1e-5]
|
| 47 |
depth_multiplier: [1.0, 1.5, 2.0]
|
|
@@ -49,12 +51,14 @@ tasks:
|
|
| 49 |
- id: task_003
|
| 50 |
difficulty: medium
|
| 51 |
max_steps: 25
|
|
|
|
| 52 |
param_ranges:
|
| 53 |
leakage_pct: [0.12, 0.18, 0.22, 0.28]
|
| 54 |
|
| 55 |
- id: task_004
|
| 56 |
difficulty: medium
|
| 57 |
max_steps: 25
|
|
|
|
| 58 |
param_ranges:
|
| 59 |
weight_decay: [0.0, 0.0001, 0.001]
|
| 60 |
divergence_epoch: [5, 8, 12]
|
|
@@ -62,18 +66,21 @@ tasks:
|
|
| 62 |
- id: task_005
|
| 63 |
difficulty: hard
|
| 64 |
max_steps: 30
|
|
|
|
| 65 |
param_ranges:
|
| 66 |
red_herring_intensity: [0.8, 2.5]
|
| 67 |
|
| 68 |
- id: task_006
|
| 69 |
difficulty: hard
|
| 70 |
max_steps: 30
|
|
|
|
| 71 |
param_ranges:
|
| 72 |
bug_type: [eval_mode, detach_loss, zero_grad_missing, inplace_relu]
|
| 73 |
|
| 74 |
- id: task_007
|
| 75 |
difficulty: hard
|
| 76 |
max_steps: 25
|
|
|
|
| 77 |
param_ranges:
|
| 78 |
scheduler_gamma: [0.01, 0.001, 0.0001]
|
| 79 |
scheduler_step_size: [2, 3, 5]
|
|
|
|
| 36 |
- id: task_001
|
| 37 |
difficulty: easy
|
| 38 |
max_steps: 20
|
| 39 |
+
has_grader: true
|
| 40 |
param_ranges:
|
| 41 |
learning_rate: [0.05, 0.08, 0.10, 0.15, 0.30]
|
| 42 |
|
| 43 |
- id: task_002
|
| 44 |
difficulty: easy
|
| 45 |
max_steps: 20
|
| 46 |
+
has_grader: true
|
| 47 |
param_ranges:
|
| 48 |
learning_rate: [1e-6, 5e-6, 1e-5]
|
| 49 |
depth_multiplier: [1.0, 1.5, 2.0]
|
|
|
|
| 51 |
- id: task_003
|
| 52 |
difficulty: medium
|
| 53 |
max_steps: 25
|
| 54 |
+
has_grader: true
|
| 55 |
param_ranges:
|
| 56 |
leakage_pct: [0.12, 0.18, 0.22, 0.28]
|
| 57 |
|
| 58 |
- id: task_004
|
| 59 |
difficulty: medium
|
| 60 |
max_steps: 25
|
| 61 |
+
has_grader: true
|
| 62 |
param_ranges:
|
| 63 |
weight_decay: [0.0, 0.0001, 0.001]
|
| 64 |
divergence_epoch: [5, 8, 12]
|
|
|
|
| 66 |
- id: task_005
|
| 67 |
difficulty: hard
|
| 68 |
max_steps: 30
|
| 69 |
+
has_grader: true
|
| 70 |
param_ranges:
|
| 71 |
red_herring_intensity: [0.8, 2.5]
|
| 72 |
|
| 73 |
- id: task_006
|
| 74 |
difficulty: hard
|
| 75 |
max_steps: 30
|
| 76 |
+
has_grader: true
|
| 77 |
param_ranges:
|
| 78 |
bug_type: [eval_mode, detach_loss, zero_grad_missing, inplace_relu]
|
| 79 |
|
| 80 |
- id: task_007
|
| 81 |
difficulty: hard
|
| 82 |
max_steps: 25
|
| 83 |
+
has_grader: true
|
| 84 |
param_ranges:
|
| 85 |
scheduler_gamma: [0.01, 0.001, 0.0001]
|
| 86 |
scheduler_step_size: [2, 3, 5]
|
server/app.py
CHANGED
|
@@ -46,13 +46,13 @@ logger = logging.getLogger(__name__)
|
|
| 46 |
|
| 47 |
# All 7 tasks
|
| 48 |
ALL_TASKS = [
|
| 49 |
-
{"id": "task_001", "difficulty": "easy", "max_steps": 20},
|
| 50 |
-
{"id": "task_002", "difficulty": "easy", "max_steps": 20},
|
| 51 |
-
{"id": "task_003", "difficulty": "medium", "max_steps": 25},
|
| 52 |
-
{"id": "task_004", "difficulty": "medium", "max_steps": 25},
|
| 53 |
-
{"id": "task_005", "difficulty": "hard", "max_steps": 30},
|
| 54 |
-
{"id": "task_006", "difficulty": "hard", "max_steps": 30},
|
| 55 |
-
{"id": "task_007", "difficulty": "hard", "max_steps": 25},
|
| 56 |
]
|
| 57 |
|
| 58 |
# create_app takes the class (factory), not an instance
|
|
|
|
| 46 |
|
| 47 |
# All 7 tasks
|
| 48 |
ALL_TASKS = [
|
| 49 |
+
{"id": "task_001", "difficulty": "easy", "max_steps": 20, "has_grader": True},
|
| 50 |
+
{"id": "task_002", "difficulty": "easy", "max_steps": 20, "has_grader": True},
|
| 51 |
+
{"id": "task_003", "difficulty": "medium", "max_steps": 25, "has_grader": True},
|
| 52 |
+
{"id": "task_004", "difficulty": "medium", "max_steps": 25, "has_grader": True},
|
| 53 |
+
{"id": "task_005", "difficulty": "hard", "max_steps": 30, "has_grader": True},
|
| 54 |
+
{"id": "task_006", "difficulty": "hard", "max_steps": 30, "has_grader": True},
|
| 55 |
+
{"id": "task_007", "difficulty": "hard", "max_steps": 25, "has_grader": True},
|
| 56 |
]
|
| 57 |
|
| 58 |
# create_app takes the class (factory), not an instance
|