Spaces:

K446
/

Opengrid

Running

K446 committed 13 days ago

Commit

8a02303

1 Parent(s): 5ba53f6

feat: curriculum training + Karnataka scenarios + repo cleanup

- Add Karnataka scenario variants (easy/medium/hard) with same 15-bus topology
but different operating conditions (renewables, load, line capacity)
- Add curriculum training mode (--curriculum flag) that chains through
karnataka_easy -> medium -> hard -> full with checkpoint transfer
- Restructure repo: docs/ for documentation, scripts/ for utilities
- Clean up generated blobs (codebase_summary.md, inference_output.txt)
- Frontend: dynamic task groups (Procedural green, Karnataka gold)
- Map: no tiles for procedural grids (dark canvas), locked bounds for Karnataka
- Fix zone names: generic for procedural, KPTCL-specific for Karnataka
- Fix Raichur TPS GPS coordinates (16.36, 77.34)
- All 7 training pipeline checks pass

Files changed (14) hide show

.gitignore +4 -9
changes.md → docs/changes.md +0 -0
inference.py +3 -1
open-grid logo.png +3 -0
run_training.py +2 -2
scripts/generate_code_md.py +92 -0
scripts/get_scores.py +37 -0
scripts/verify_training.py +161 -0
src/scenarios.py +113 -0
src/tasks.py +23 -14
static/app.js +96 -26
static/index.html +57 -53
static/style.css +199 -70
training/train_grpo.py +99 -6

.gitignore CHANGED Viewed

@@ -13,14 +13,12 @@ build/
 # Generated / temporary files
 inference_output.txt
 codebase_summary.md
-generate_code_md.py
 uv.lock
-# Reference docs (not part of submission)
-guide.md
-detailed judging criteria.md
-ui_skill.md
-project-spec.md
 pyrightconfig.json
 # Training outputs (large files — push separately or add to HF)
@@ -31,6 +29,3 @@ training/outputs/
 # OS files
 Thumbs.db
 .DS_Store
-# Duplicate test file (tests/ directory has the real one)
-test_multiagent.py

 # Generated / temporary files
 inference_output.txt
 codebase_summary.md
 uv.lock
+# Reference docs (moved to docs/ — not part of submission)
+docs/guide.md
+docs/detailed_judging_criteria.md
+docs/project-spec.md
 pyrightconfig.json
 # Training outputs (large files — push separately or add to HF)
 # OS files
 Thumbs.db
 .DS_Store

changes.md → docs/changes.md RENAMED Viewed

File without changes

inference.py CHANGED Viewed

@@ -48,7 +48,9 @@ BENCHMARK = "OpenGrid"
 MAX_STEPS = 100
 SUCCESS_SCORE_THRESHOLD = 0.5
-TASKS = ["task_easy", "task_medium", "task_hard", "task_karnataka"]
 SYSTEM_PROMPT_SINGLE = """You are a Power Grid Controller AI. Your goal is to maintain grid stability.

 MAX_STEPS = 100
 SUCCESS_SCORE_THRESHOLD = 0.5
+TASKS = ["task_easy", "task_medium", "task_hard",
+         "karnataka_easy", "karnataka_medium", "karnataka_hard",
+         "task_karnataka"]
 SYSTEM_PROMPT_SINGLE = """You are a Power Grid Controller AI. Your goal is to maintain grid stability.

open-grid logo.png ADDED Viewed

Git LFS Details

SHA256: 7c5b33163678b884123740782fbaab4bafba3d02e4a2a36ec1ae4e138af31915
Pointer size: 129 Bytes
Size of remote file: 1.37 kB

run_training.py CHANGED Viewed

@@ -79,7 +79,7 @@ def run_grpo_training():
         return json.dumps({"bus_adjustments": [], "topology_actions": []})
     baseline_results = {}
-    for task_id in ["task_easy", "task_medium", "task_karnataka"]:
         if task_id not in TASKS:
             continue
         config = TASKS[task_id]
@@ -238,7 +238,7 @@ def run_grpo_training():
         return tokenizer.decode(outputs[0][inputs['input_ids'].shape[1]:], skip_special_tokens=True)
     trained_results = {}
-    for task_id in ["task_easy", "task_medium", "task_karnataka"]:
         if task_id not in TASKS:
             continue
         config = TASKS[task_id]

         return json.dumps({"bus_adjustments": [], "topology_actions": []})
     baseline_results = {}
+    for task_id in ["task_easy", "task_medium", "karnataka_easy", "karnataka_medium", "karnataka_hard", "task_karnataka"]:
         if task_id not in TASKS:
             continue
         config = TASKS[task_id]
         return tokenizer.decode(outputs[0][inputs['input_ids'].shape[1]:], skip_special_tokens=True)
     trained_results = {}
+    for task_id in ["task_easy", "task_medium", "karnataka_easy", "karnataka_medium", "karnataka_hard", "task_karnataka"]:
         if task_id not in TASKS:
             continue
         config = TASKS[task_id]

scripts/generate_code_md.py ADDED Viewed

	@@ -0,0 +1,92 @@

+import os
+def generate_tree(dir_path, ignore_dirs=None, prefix=""):
+    """Return a box-drawing text tree of the entries under ``dir_path``.
+    Args:
+        dir_path: Directory to list.
+        ignore_dirs: Entry names to leave out. The match is by name only, so
+            a file with one of these names is hidden as well. Defaults to
+            common VCS / virtualenv / build folder names.
+        prefix: Indentation inherited from the parent level; top-level callers
+            leave it at the default.
+    Returns:
+        One line per entry, each terminated by a newline. Returns "" when the
+        directory cannot be listed (PermissionError) or has no visible entries.
+    """
+    if ignore_dirs is None:
+        ignore_dirs = {'.git', '__pycache__', 'venv', '.venv', 'env', 'node_modules', '.idea', '.vscode', 'build', 'dist'}
+    try:
+        entries = sorted(os.listdir(dir_path))
+    except PermissionError:
+        return ""
+    entries = [name for name in entries if name not in ignore_dirs]
+    # Collect pieces and join once instead of growing a string with +=.
+    chunks = []
+    last_index = len(entries) - 1
+    for index, name in enumerate(entries):
+        path = os.path.join(dir_path, name)
+        if index == last_index:
+            branch, child_prefix = "└── ", prefix + "    "
+        else:
+            branch, child_prefix = "├── ", prefix + "│   "
+        chunks.append(f"{prefix}{branch}{name}\n")
+        # Symlinked directories are listed but not entered: following them
+        # recurses without bound on a link cycle, and the os.walk() call in
+        # generate_markdown() does not follow them either.
+        if os.path.isdir(path) and not os.path.islink(path):
+            chunks.append(generate_tree(path, ignore_dirs, child_prefix))
+    return "".join(chunks)
+def generate_markdown(output_file="codebase_summary.md", source_dir=".", ignore_dirs=None, ignore_exts=None):
+    """Write a markdown summary of ``source_dir``: a folder tree, then every file's content.
+    Args:
+        output_file: Path of the markdown file to (over)write.
+        source_dir: Root directory to summarise.
+        ignore_dirs: Directory names to skip. Defaults to common VCS /
+            virtualenv / build folder names.
+        ignore_exts: Lower-case file extensions (with the dot) to skip.
+            Defaults to common binary and media extensions.
+    Files that cannot be decoded as UTF-8 or cannot be read get a one-line
+    placeholder inside their code fence instead of aborting the run.
+    """
+    if ignore_dirs is None:
+        ignore_dirs = {'.git', '__pycache__', 'venv', '.venv', 'env', 'node_modules', '.idea', '.vscode', 'build', 'dist'}
+    # Common binary and non-text files to ignore
+    if ignore_exts is None:
+        ignore_exts = {'.pyc', '.pyo', '.pyd', '.so', '.dll', '.exe', '.bin',
+                       '.png', '.jpg', '.jpeg', '.gif', '.ico', '.pdf',
+                       '.zip', '.tar', '.gz', '.mp4', '.mp3', '.sqlite3'}
+    # Resolve once so the output can be recognised even when output_file is a
+    # path rather than a bare file name.
+    output_abs = os.path.abspath(output_file)
+    script_name = os.path.basename(__file__)
+    print(f"Generating {output_file}...")
+    with open(output_file, 'w', encoding='utf-8') as outfile:
+        outfile.write("# Codebase Structure\n\n")
+        outfile.write("```text\n")
+        outfile.write(f"{os.path.basename(os.path.abspath(source_dir))}/\n")
+        outfile.write(generate_tree(source_dir, ignore_dirs))
+        outfile.write("```\n\n")
+        outfile.write("# Code Files\n\n")
+        for root, dirs, files in os.walk(source_dir):
+            # Modify dirs in-place to skip ignored directories in os.walk
+            dirs[:] = [d for d in dirs if d not in ignore_dirs]
+            for file in files:
+                ext = os.path.splitext(file)[1].lower()
+                file_path = os.path.join(root, file)
+                # Skip binary files, images, this script, and the output file
+                # itself. The name check is kept for backward compatibility;
+                # the absolute-path check covers output_file given as a path.
+                is_output = file == output_file or os.path.abspath(file_path) == output_abs
+                if ext in ignore_exts or is_output or file == script_name:
+                    continue
+                rel_path = os.path.relpath(file_path, source_dir)
+                outfile.write(f"## `{rel_path}`\n\n")
+                # Determine language for markdown block
+                lang = ext[1:] if ext else "text"
+                if lang == "txt":
+                    lang = "text"
+                outfile.write(f"```{lang}\n")
+                try:
+                    with open(file_path, 'r', encoding='utf-8') as infile:
+                        content = infile.read()
+                        outfile.write(content)
+                        # Ensure there is a newline at the end of the content before closing the code block
+                        if content and not content.endswith('\n'):
+                            outfile.write('\n')
+                except UnicodeDecodeError:
+                    outfile.write("// File appears to be binary or has an unsupported encoding and could not be read.\n")
+                except Exception as e:
+                    # Best effort: record the failure in the summary and keep going.
+                    outfile.write(f"// Error reading file: {e}\n")
+                outfile.write("```\n\n")
+    print(f"Successfully generated {output_file}!")
+if __name__ == "__main__":
+    generate_markdown()

scripts/get_scores.py ADDED Viewed

	@@ -0,0 +1,37 @@

+"""Evaluate heuristic baseline on all tasks and print scores."""
+import copy
+import json
+import sys
+from src.tasks import TASKS
+from src.grader import RobustnessGrader
+from src.baseline import heuristic_policy
+def main(n_episodes: int = 10):
+    """Score the heuristic baseline on every registered task.
+    Each task config is deep-copied before it is handed to the grader. A task
+    that raises is reported and stored as ``{"error": <message>}`` so the
+    remaining tasks are still evaluated.
+    Args:
+        n_episodes: Episodes passed to ``RobustnessGrader.evaluate_policy``.
+    Returns:
+        Dict keyed by task id holding either the grader result or the error entry.
+    """
+    scores = {}
+    for task_id in TASKS:
+        task_cfg = TASKS[task_id]
+        try:
+            outcome = RobustnessGrader(copy.deepcopy(task_cfg)).evaluate_policy(
+                heuristic_policy, n_episodes=n_episodes
+            )
+            scores[task_id] = outcome
+            print(f"{task_id}:")
+            for metric, value in outcome.items():
+                print(f"  {metric}: {value}")
+            print()
+        except Exception as exc:
+            scores[task_id] = {"error": str(exc)}
+            print(f"{task_id}: FAILED — {exc}\n")
+    return scores
+if __name__ == "__main__":
+    episodes = int(sys.argv[1]) if len(sys.argv) > 1 else 10
+    main(n_episodes=episodes)

scripts/verify_training.py ADDED Viewed

	@@ -0,0 +1,161 @@

+"""
+Comprehensive training pipeline verification.
+Tests: scenarios, reward functions, policies, GRPO integration, safety.
+"""
+import json
+import copy
+import sys
+sys.path.insert(0, ".")
+from src.tasks import TASKS, get_task
+from src.environment import OpenGridEnv
+from src.models import GridAction, GridObservation
+from src.grader import RobustnessGrader
+from src.baseline import heuristic_policy
+from src.safety import SafetyLayer
+print("=" * 60)
+print("  COMPREHENSIVE TRAINING PIPELINE VERIFICATION")
+print("=" * 60)
+# Failure messages from every check are accumulated here; the summary at the
+# end of the script reports them and sets the exit status.
+errors = []
+# --- 1. Scenario loading ---
+# Every id below must be registered in TASKS; a missing id is recorded as an
+# error, a present one has its size and zone names printed.
+print("\n[1/7] Scenario Loading...")
+expected_tasks = ["task_easy", "task_medium", "task_hard",
+                  "task_karnataka", "karnataka_easy", "karnataka_medium", "karnataka_hard"]
+for tid in expected_tasks:
+    if tid not in TASKS:
+        errors.append(f"Missing task: {tid}")
+        print(f"  FAIL: {tid} not in TASKS")
+    else:
+        cfg = TASKS[tid]
+        print(f"  OK: {tid} - {cfg['num_buses']}b/{cfg['num_agents']}a zones={cfg['zone_names']}")
+# --- 2. Environment step for each scenario ---
+# Builds an environment per task, resets it and takes one step with an empty
+# action (no bus adjustments, no topology actions). Any exception is recorded
+# in `errors` rather than raised, so the remaining tasks are still exercised.
+print("\n[2/7] Environment Step Test...")
+for tid in expected_tasks:
+    try:
+        cfg = get_task(tid)
+        env = OpenGridEnv(cfg)
+        obs = env.reset()
+        action = GridAction.model_validate_json(
+            json.dumps({"bus_adjustments": [], "topology_actions": []})
+        )
+        obs2, reward, done, info = env.step(action)
+        freq = obs2.grid_frequency
+        r = reward.value
+        print(f"  OK: {tid} - freq={freq:.2f}Hz reward={r:.2f}")
+    except Exception as e:
+        errors.append(f"Env step failed for {tid}: {e}")
+        print(f"  FAIL: {tid} - {e}")
+# --- 3. Reward function (GRPO) test ---
+print("\n[3/7] GRPO Reward Function Test...")
+# NOTE: this import sits outside the try block below, so a failure to import
+# training.train_grpo aborts the script instead of being recorded in `errors`.
+from training.train_grpo import compute_grpo_reward_env
+# Three completions: one with a bus adjustment, one empty action, and one that
+# is not JSON at all (presumably to exercise the malformed-output path -
+# confirm against compute_grpo_reward_env).
+test_completions = [
+    '{"bus_adjustments": [{"bus_id": 0, "delta": 5.0}], "topology_actions": []}',
+    '{"bus_adjustments": [], "topology_actions": []}',
+    'not valid json',
+]
+# One observation per completion, each with empty bus/line lists.
+test_observations = [
+    {"grid_frequency": 49.5, "buses": [], "lines": []},
+    {"grid_frequency": 50.0, "buses": [], "lines": []},
+    {"grid_frequency": 48.0, "buses": [], "lines": []},
+]
+try:
+    cfg = get_task("karnataka_easy")
+    rewards = compute_grpo_reward_env(test_completions, test_observations, cfg, horizon=1)
+    for i, r in enumerate(rewards):
+        print(f"  Completion {i}: reward={r:.3f}")
+    print(f"  OK: GRPO rewards computed for {len(rewards)} completions")
+except Exception as e:
+    errors.append(f"GRPO reward failed: {e}")
+    print(f"  FAIL: {e}")
+# --- 4. Karnataka Difficulty Gradient Test ---
+# Runs up to 5 empty-action steps on each Karnataka variant and sums the
+# rewards, stopping early if the episode reports done.
+print("\n[4/7] Karnataka Difficulty Gradient Test...")
+ka_rewards = {}
+for tid in ["karnataka_easy", "karnataka_medium", "karnataka_hard"]:
+    try:
+        cfg = get_task(tid)
+        env = OpenGridEnv(cfg)
+        obs = env.reset()
+        total_r = 0
+        for step_i in range(5):
+            action = GridAction.model_validate_json(
+                json.dumps({"bus_adjustments": [], "topology_actions": []})
+            )
+            obs, reward, done, info = env.step(action)
+            total_r += reward.value
+            if done:
+                break
+        ka_rewards[tid] = total_r
+        print(f"  {tid}: 5-step reward={total_r:.2f}")
+    except Exception as e:
+        errors.append(f"Ka difficulty test failed for {tid}: {e}")
+        print(f"  FAIL: {tid} - {e}")
+# The comparison only runs when all three variants produced a total. A
+# reversed gradient prints a warning but is NOT added to `errors`, so it
+# does not fail the run.
+if len(ka_rewards) == 3:
+    # Easy should generally give higher or equal rewards than hard
+    if ka_rewards["karnataka_easy"] >= ka_rewards["karnataka_hard"]:
+        print(f"  OK: Difficulty gradient correct (easy >= hard)")
+    else:
+        print(f"  WARN: easy ({ka_rewards['karnataka_easy']:.2f}) < hard ({ka_rewards['karnataka_hard']:.2f}) - may vary by seed")
+# --- 5. Heuristic policy test ---
+# Drives heuristic_policy for up to 10 steps on three representative tasks,
+# feeding each new observation back into the policy. The accumulated reward is
+# printed for information only; an exception is the only failure condition.
+print("\n[5/7] Heuristic Policy Test...")
+for tid in ["task_easy", "karnataka_easy", "task_karnataka"]:
+    try:
+        cfg = get_task(tid)
+        env = OpenGridEnv(cfg)
+        obs = env.reset()
+        total_r = 0
+        for step_i in range(10):
+            action = heuristic_policy(obs)
+            obs, reward, done, info = env.step(action)
+            total_r += reward.value
+            if done:
+                break
+        print(f"  OK: {tid} - 10-step heuristic reward={total_r:.2f}")
+    except Exception as e:
+        errors.append(f"Heuristic policy failed for {tid}: {e}")
+        print(f"  FAIL: {tid} - {e}")
+# --- 6. Safety layer test ---
+# Submits a single large adjustment (delta=100.0 on bus 0) to the safety layer
+# together with a synthetic state built from the task config: each bus at its
+# base_p / init_soc (0 when absent), every line connected with zero flow.
+# The report fields are printed but not asserted; only an exception fails.
+print("\n[6/7] Safety Layer Test...")
+for tid in ["task_easy", "karnataka_easy", "karnataka_hard"]:
+    try:
+        cfg = get_task(tid)
+        layer = SafetyLayer(cfg)
+        action = GridAction.model_validate_json(
+            json.dumps({"bus_adjustments": [{"bus_id": 0, "delta": 100.0}], "topology_actions": []})
+        )
+        bus_state = [{"id": b["id"], "p": b.get("base_p", 0), "soc": b.get("init_soc", 0)} for b in cfg["buses"]]
+        line_state = [{"id": l["id"], "connected": True, "flow": 0} for l in cfg["lines"]]
+        safe_action, report = layer.validate_and_correct(0, action, line_state, bus_state, {})
+        print(f"  OK: {tid} - corrected={report.was_corrected}, n1_violations={report.n1_violations_detected}")
+    except Exception as e:
+        errors.append(f"Safety layer failed for {tid}: {e}")
+        print(f"  FAIL: {tid} - {e}")
+# --- 7. Curriculum order test ---
+# Every stage named in CURRICULUM_ORDER must be a registered task id.
+print("\n[7/7] Curriculum Order Test...")
+# NOTE: imported outside any try block, so an import failure aborts the script
+# rather than being recorded in `errors`.
+from training.train_grpo import CURRICULUM_ORDER
+for tid in CURRICULUM_ORDER:
+    if tid in TASKS:
+        print(f"  OK: {tid} available")
+    else:
+        errors.append(f"Curriculum task missing: {tid}")
+        print(f"  FAIL: {tid} not in TASKS")
+# --- Summary ---
+# Prints either the list of recorded failures or the success line, framed by
+# a rule above and below, then exits with status 1 when anything failed.
+print("\n" + "=" * 60)
+if errors:
+    print(f"  FAILED: {len(errors)} errors")
+    for e in errors:
+        print(f"    - {e}")
+else:
+    print("  ALL CHECKS PASSED - Training pipeline ready")
+print("=" * 60)
+# Exit only after the closing rule has been printed; exiting inside the
+# branch above left the failure report without its closing rule.
+if errors:
+    sys.exit(1)

src/scenarios.py ADDED Viewed

	@@ -0,0 +1,113 @@

+"""
+Karnataka Grid Scenarios
+========================
+Generates difficulty variants of the Karnataka 15-bus grid.
+Same topology (KPTCL transmission map), different operating conditions.
+Scenarios vary:
+- Renewable penetration (solar/wind max_p)
+- Load magnitude (base_p multiplier)
+- Line capacity (tighter or relaxed limits)
+- Battery capacity
+"""
+import copy
+from typing import Dict
+from src.tasks import generate_karnataka_task
+__all__ = ['generate_karnataka_scenario', 'KARNATAKA_SCENARIOS']
+# Difficulty profiles: multipliers applied to the base Karnataka grid.
+# Keys read by generate_karnataka_scenario():
+#   renewable_multiplier         -> max_p of solar/wind buses
+#   load_multiplier              -> base_p of load buses (also drives slack sizing)
+#   line_capacity_multiplier     -> capacity of every line
+#   battery_capacity_multiplier  -> max_p and capacity of battery buses
+#   max_steps                    -> copied to the task's "max_steps"
+#   description                  -> copied to the task's "scenario_description"
+_DIFFICULTY_PROFILES = {
+    "easy": {
+        "description": "Low renewables, light load, relaxed lines",
+        "renewable_multiplier": 0.3,      # Solar/wind max_p scaled down
+        "load_multiplier": 0.6,           # Loads are lighter
+        "line_capacity_multiplier": 1.5,  # Lines can carry more
+        "battery_capacity_multiplier": 1.5,  # More storage headroom
+        "max_steps": 50,
+    },
+    "medium": {
+        "description": "Moderate renewables, normal load, standard lines",
+        "renewable_multiplier": 0.7,
+        "load_multiplier": 1.0,
+        "line_capacity_multiplier": 1.0,
+        "battery_capacity_multiplier": 1.0,
+        "max_steps": 50,
+    },
+    "hard": {
+        "description": "High renewables, peak demand, tight lines",
+        "renewable_multiplier": 1.3,      # More volatile supply
+        "load_multiplier": 1.4,           # Peak demand
+        "line_capacity_multiplier": 0.75, # Congested corridors
+        "battery_capacity_multiplier": 0.7,  # Less storage
+        "max_steps": 50,
+    },
+}
+def generate_karnataka_scenario(difficulty: str, seed: int = 808) -> Dict:
+    """Generate a Karnataka grid scenario at a given difficulty level.
+    The base topology (15 buses, 18 lines, 4 zones) is identical across
+    all difficulties. Only the operating conditions change:
+    - Renewable generation capacity (solar/wind max_p)
+    - Load demand (base_p on load buses)
+    - Transmission line capacity
+    - Battery storage (max_p and capacity; init_soc is reset to half of the
+      scaled capacity)
+    - Slack bus limits (max_p is 80% of the scaled total load with a floor
+      of 200; min_p is its negative)
+    This enables curriculum learning on a consistent grid structure.
+    Args:
+        difficulty: A key of ``_DIFFICULTY_PROFILES``.
+        seed: Forwarded to ``generate_karnataka_task``.
+    Returns:
+        The task dict produced by ``generate_karnataka_task`` with the profile's
+        multipliers applied and ``id``, ``difficulty``, ``max_steps`` and
+        ``scenario_description`` overwritten.
+    Raises:
+        ValueError: If ``difficulty`` is not a known profile.
+    """
+    if difficulty not in _DIFFICULTY_PROFILES:
+        raise ValueError(
+            f"Unknown difficulty '{difficulty}'. "
+            f"Available: {list(_DIFFICULTY_PROFILES.keys())}"
+        )
+    profile = _DIFFICULTY_PROFILES[difficulty]
+    base = generate_karnataka_task(seed=seed)
+    load_multiplier = profile["load_multiplier"]
+    # Size the slack bus from the untouched base loads BEFORE any bus is
+    # modified. Doing this inside the loop below was only correct while the
+    # slack bus preceded every load bus; with any other ordering the loads
+    # would already be scaled and the multiplier would be applied twice.
+    scaled_total_load = sum(
+        b["base_p"] * load_multiplier for b in base["buses"] if b["type"] == "load"
+    )
+    slack_limit = max(200, round(scaled_total_load * 0.8, 1))
+    # Apply multipliers to buses
+    for bus in base["buses"]:
+        bus_type = bus["type"]
+        if bus_type in ("solar", "wind"):
+            bus["max_p"] = round(bus["max_p"] * profile["renewable_multiplier"], 1)
+        elif bus_type == "load":
+            bus["base_p"] = round(bus["base_p"] * load_multiplier, 1)
+        elif bus_type == "battery":
+            bus["max_p"] = round(bus["max_p"] * profile["battery_capacity_multiplier"], 1)
+            bus["capacity"] = round(bus["capacity"] * profile["battery_capacity_multiplier"], 1)
+            bus["init_soc"] = round(bus["capacity"] * 0.5, 1)
+        elif bus_type == "slack":
+            # Scale slack to cover the adjusted load
+            bus["max_p"] = slack_limit
+            bus["min_p"] = -slack_limit
+    # Apply line capacity multiplier
+    for line in base["lines"]:
+        line["capacity"] = round(line["capacity"] * profile["line_capacity_multiplier"], 1)
+    # Update metadata
+    base["id"] = f"karnataka_{difficulty}"
+    base["difficulty"] = f"karnataka_{difficulty}"
+    base["max_steps"] = profile["max_steps"]
+    base["scenario_description"] = profile["description"]
+    return base
+# Pre-built scenario configs, keyed "karnataka_<difficulty>". Built once at
+# import time with the default seed of generate_karnataka_scenario().
+# NOTE(review): src.tasks imports this name at the bottom of its module while
+# this module imports generate_karnataka_task from src.tasks. Importing
+# src.scenarios before src.tasks therefore looks like it would hit a partially
+# initialised module - confirm the supported import order.
+KARNATAKA_SCENARIOS = {
+    f"karnataka_{diff}": generate_karnataka_scenario(diff)
+    for diff in _DIFFICULTY_PROFILES
+}

src/tasks.py CHANGED Viewed

@@ -18,18 +18,20 @@ from typing import Dict, List, Tuple
 __all__ = ['generate_procedural_grid', 'generate_karnataka_task', 'TASKS', 'get_task']
-# KPTCL-inspired zone names
 def _get_zone_names(num_agents: int) -> List[str]:
-    """Get human-readable zone names for a given agent count."""
-    base_names = [
-        "Bengaluru_Region", "Mysuru_Region", "Kalburagi_Region",
-        "Belagavi_Region", "Mangaluru_Region",
-    ]
-    if num_agents <= len(base_names):
-        return base_names[:num_agents]
     return [f"Zone_{i}" for i in range(num_agents)]
 def _partition_into_zones(G: nx.Graph, num_agents: int) -> Dict[int, int]:
     """Partition graph nodes into balanced, connected zones.
@@ -283,13 +285,13 @@ def generate_karnataka_task(seed: int = 808) -> Dict:
     KPTCL transmission map. Nodes have real GPS coordinates for GIS rendering.
     """
     nodes = [
-        {"id": 0, "name": "Raichur_TPS", "type": "slack", "lat": 16.20, "lon": 77.36, "max_p": 200, "base_p": 0},
         {"id": 1, "name": "Kalaburagi", "type": "load", "lat": 17.33, "lon": 76.83, "max_p": 0, "base_p": 40},
         {"id": 2, "name": "Belagavi", "type": "load", "lat": 15.85, "lon": 74.50, "max_p": 0, "base_p": 35},
-        {"id": 3, "name": "Hubballi", "type": "load", "lat": 15.36, "lon": 75.13, "max_p": 0, "base_p": 45},
         {"id": 4, "name": "Ballari_TPS", "type": "generator", "lat": 15.14, "lon": 76.92, "max_p": 150, "base_p": 0},
         {"id": 5, "name": "Chitradurga_Wind", "type": "wind", "lat": 14.23, "lon": 76.40, "max_p": 80, "base_p": 0},
-        {"id": 6, "name": "Pavagada_Solar", "type": "solar", "lat": 14.10, "lon": 77.27, "max_p": 120, "base_p": 0},
         {"id": 7, "name": "Sharavathi_Hydro", "type": "generator", "lat": 14.18, "lon": 74.83, "max_p": 100, "base_p": 0},
         {"id": 8, "name": "Shivamogga", "type": "load", "lat": 13.93, "lon": 75.57, "max_p": 0, "base_p": 30},
         {"id": 9, "name": "Mangaluru", "type": "load", "lat": 12.87, "lon": 74.88, "max_p": 0, "base_p": 50},
@@ -350,7 +352,7 @@ def generate_karnataka_task(seed: int = 808) -> Dict:
         "difficulty": "karnataka",
         "num_agents": 4,
         "zone_assignments": zone_assignments,
-        "zone_names": ["Kalaburagi_Region", "Hubballi_Region", "Mysuru_Region", "Bengaluru_Region"],
         "zone_bus_ids": zone_bus_ids,
         "internal_lines": internal_lines,
         "boundary_lines": boundary_lines,
@@ -380,5 +382,12 @@ TASKS = {
     "task_easy": generate_procedural_grid("easy", seed=101),
     "task_medium": generate_procedural_grid("medium", seed=102),
     "task_hard": generate_procedural_grid("hard", seed=103),
-    "task_karnataka": generate_karnataka_task()
-}

 __all__ = ['generate_procedural_grid', 'generate_karnataka_task', 'TASKS', 'get_task']
+# Generic zone names for procedural grids
 def _get_zone_names(num_agents: int) -> List[str]:
+    """Get human-readable zone names for a given agent count (generic).
+    Up to five agents get Greek-letter names ("Zone_Alpha", ...); larger
+    counts fall back to numbered names ("Zone_0", "Zone_1", ...).
+    """
+    generic = ["Zone_Alpha", "Zone_Beta", "Zone_Gamma", "Zone_Delta", "Zone_Epsilon"]
+    if num_agents <= len(generic):
+        return generic[:num_agents]
     return [f"Zone_{i}" for i in range(num_agents)]
+# KPTCL-specific zone names (only for Karnataka tasks)
+def _get_karnataka_zone_names() -> List[str]:
+    """Return the four fixed region names used as zone names for the Karnataka grid."""
+    return ["Kalaburagi_Region", "Hubballi_Region", "Mysuru_Region", "Bengaluru_Region"]
 def _partition_into_zones(G: nx.Graph, num_agents: int) -> Dict[int, int]:
     """Partition graph nodes into balanced, connected zones.
     KPTCL transmission map. Nodes have real GPS coordinates for GIS rendering.
     """
     nodes = [
+        {"id": 0, "name": "Raichur_TPS", "type": "slack", "lat": 16.36, "lon": 77.34, "max_p": 200, "base_p": 0},
         {"id": 1, "name": "Kalaburagi", "type": "load", "lat": 17.33, "lon": 76.83, "max_p": 0, "base_p": 40},
         {"id": 2, "name": "Belagavi", "type": "load", "lat": 15.85, "lon": 74.50, "max_p": 0, "base_p": 35},
+        {"id": 3, "name": "Hubballi", "type": "load", "lat": 15.36, "lon": 75.12, "max_p": 0, "base_p": 45},
         {"id": 4, "name": "Ballari_TPS", "type": "generator", "lat": 15.14, "lon": 76.92, "max_p": 150, "base_p": 0},
         {"id": 5, "name": "Chitradurga_Wind", "type": "wind", "lat": 14.23, "lon": 76.40, "max_p": 80, "base_p": 0},
+        {"id": 6, "name": "Pavagada_Solar", "type": "solar", "lat": 14.10, "lon": 77.28, "max_p": 120, "base_p": 0},
         {"id": 7, "name": "Sharavathi_Hydro", "type": "generator", "lat": 14.18, "lon": 74.83, "max_p": 100, "base_p": 0},
         {"id": 8, "name": "Shivamogga", "type": "load", "lat": 13.93, "lon": 75.57, "max_p": 0, "base_p": 30},
         {"id": 9, "name": "Mangaluru", "type": "load", "lat": 12.87, "lon": 74.88, "max_p": 0, "base_p": 50},
         "difficulty": "karnataka",
         "num_agents": 4,
         "zone_assignments": zone_assignments,
+        "zone_names": _get_karnataka_zone_names(),
         "zone_bus_ids": zone_bus_ids,
         "internal_lines": internal_lines,
         "boundary_lines": boundary_lines,
     "task_easy": generate_procedural_grid("easy", seed=101),
     "task_medium": generate_procedural_grid("medium", seed=102),
     "task_hard": generate_procedural_grid("hard", seed=103),
+    "task_karnataka": generate_karnataka_task(),
+}
+# Register Karnataka scenario variants (same topology, different difficulty)
+# The import is placed after TASKS on purpose: src.scenarios itself imports
+# generate_karnataka_task from this module, so that name must already exist.
+from src.scenarios import KARNATAKA_SCENARIOS, generate_karnataka_scenario  # noqa: E402
+for _sid, _cfg in KARNATAKA_SCENARIOS.items():
+    TASKS[_sid] = _cfg
+    # The difficulty is bound as a default argument so each generator keeps its
+    # own value instead of the loop variable's final one.
+    _TASK_GENERATORS[_sid] = (lambda d=_sid.replace("karnataka_", ""): generate_karnataka_scenario(d))

static/app.js CHANGED Viewed

@@ -15,17 +15,52 @@ let state = {
 };
 // --- Init ---
-document.addEventListener('DOMContentLoaded', () => {
-    document.querySelectorAll('.task-btn').forEach(btn => {
         btn.addEventListener('click', () => {
             document.querySelectorAll('.task-btn').forEach(b => b.classList.remove('active'));
             btn.classList.add('active');
-            state.task = btn.dataset.task;
         });
     });
     fetch(`${API}/tasks`).then(r=>r.json()).then(d=>{
         d.forEach(t => state.taskConfigs[t.id] = t);
-        resetEpisode(); // reset only after configs are loaded
         setTimeout(() => document.getElementById('loading').classList.add('hidden'), 800);
     });
 });
@@ -358,29 +393,41 @@ function initLeafletMap() {
     const container = document.getElementById('gridMap');
     if (leafletMap) return;
-    // Karnataka bounds
-    const kaBounds = [[11.5, 73.5], [18.5, 79.0]];
-    leafletMap = L.map(container, {
-        center: [14.5, 76.5],
-        zoom: 7,
         zoomControl: true,
         attributionControl: false,
-        minZoom: 5,
         maxZoom: 15,
         preferCanvas: true,
-    });
-    // Dark tile layer for SCADA aesthetic
-    L.tileLayer('https://{s}.basemaps.cartocdn.com/dark_all/{z}/{x}/{y}{r}.png', {
-        subdomains: 'abcd',
-        maxZoom: 19,
-    }).addTo(leafletMap);
-    // Attribution (small, bottom-right)
-    L.control.attribution({position: 'bottomright', prefix: false})
-        .addAttribution('© <a href="https://carto.com/">CARTO</a>')
-        .addTo(leafletMap);
     // Layer groups for easy clearing
     mapLayers.lines = L.layerGroup().addTo(leafletMap);
@@ -390,7 +437,7 @@ function initLeafletMap() {
     // Fix Leaflet size after container is fully rendered
     setTimeout(() => {
         leafletMap.invalidateSize();
-        leafletMap.fitBounds(kaBounds, { padding: [20, 20] });
     }, 200);
 }
@@ -464,17 +511,40 @@ function updateGridMap() {
             if (!from || !to) return;
             const lc = !l.connected ? '#4a5568' : l.rho > 1 ? '#ff1744' : l.rho > 0.8 ? '#ff9100' : '#e91e63';
-            const w = !l.connected ? 1.5 : l.rho > 0.8 ? 5 : 3;
             const polyline = L.polyline(
                 [[from.lat, from.lon], [to.lat, to.lon]],
-                { color: lc, weight: w, dashArray: l.connected ? '10 5' : '4 4', opacity: 0.9 }
             );
-            if (l.connected && Math.abs(l.flow) > 0.5) {
-                polyline.bindTooltip(`${l.id}: ${l.flow.toFixed(0)} MW (${(l.rho*100).toFixed(0)}%)`, {
-                    permanent: false, className: 'leaflet-tooltip-dark'
                 });
             }
             mapLayers.lines.addLayer(polyline);
         });
     }

 };
 // --- Init ---
+// True when the task id contains "karnataka" (e.g. "task_karnataka",
+// "karnataka_easy"). Used for button styling and for choosing the map mode.
+function isKarnatakaTask(taskId) {
+    return taskId.includes('karnataka');
+}
+// Rebuilds the task selector from the task list returned by the API.
+// Each task becomes a button placed in either the procedural or the Karnataka
+// container. Clicking a button selects the task, tears down the Leaflet map so
+// it is re-created with the right bounds, and resets the episode.
+function buildTaskButtons(tasks) {
+    const procContainer = document.getElementById('proceduralTasks');
+    const kaContainer = document.getElementById('karnatakaTasks');
+    procContainer.innerHTML = '';
+    kaContainer.innerHTML = '';
+    // Display-friendly names
+    const nameMap = {
+        'task_easy': 'Easy', 'task_medium': 'Medium', 'task_hard': 'Hard',
+        'task_karnataka': 'Full ★',
+        'karnataka_easy': 'Easy', 'karnataka_medium': 'Medium', 'karnataka_hard': 'Hard',
+    };
+    tasks.forEach(t => {
+        const btn = document.createElement('button');
+        btn.className = 'task-btn' + (t.id === state.task ? ' active' : '');
+        if (isKarnatakaTask(t.id)) btn.classList.add('ka');
+        btn.dataset.task = t.id;
+        const label = nameMap[t.id] || t.id.replace('task_','').replace('karnataka_','');
+        btn.innerHTML = `<span class="task-name">${label}</span><span class="task-info">${t.num_buses}b · ${t.num_agents}a</span>`;
         btn.addEventListener('click', () => {
             document.querySelectorAll('.task-btn').forEach(b => b.classList.remove('active'));
             btn.classList.add('active');
+            state.task = t.id;
+            // Destroy map so it reinitializes with correct bounds
+            if (leafletMap) { leafletMap.remove(); leafletMap = null; mapLayers = {lines:null,nodes:null,badges:null}; }
+            mapFitted = false;
+            resetEpisode();
         });
+        // Group with the same predicate that assigns the 'ka' class and picks
+        // the map mode, so a button's group always matches how it behaves.
+        if (!isKarnatakaTask(t.id)) {
+            procContainer.appendChild(btn);
+        } else {
+            kaContainer.appendChild(btn);
+        }
     });
+}
+// On page load: fetch the task list, cache each config by id, build the task
+// buttons, start an episode, then hide the loading overlay after 800 ms.
+// NOTE(review): there is no .catch() on the fetch chain, so a failed request
+// appears to leave the loading overlay visible - confirm intended behaviour.
+document.addEventListener('DOMContentLoaded', () => {
     fetch(`${API}/tasks`).then(r=>r.json()).then(d=>{
         d.forEach(t => state.taskConfigs[t.id] = t);
+        buildTaskButtons(d);
+        resetEpisode();
         setTimeout(() => document.getElementById('loading').classList.add('hidden'), 800);
     });
 });
     const container = document.getElementById('gridMap');
     if (leafletMap) return;
+    const isKa = isKarnatakaTask(state.task);
+    // Karnataka bounds: tight crop around the state
+    const kaBounds = [[11.5, 73.8], [18.5, 79.0]];
+    const mapOpts = {
+        center: isKa ? [14.5, 76.5] : [15, 76],
+        zoom: isKa ? 7 : 6,
         zoomControl: true,
         attributionControl: false,
+        minZoom: isKa ? 6 : 3,
         maxZoom: 15,
         preferCanvas: true,
+    };
+    // Lock panning for Karnataka tasks
+    if (isKa) {
+        mapOpts.maxBounds = L.latLngBounds(kaBounds).pad(0.15);
+        mapOpts.maxBoundsViscosity = 1.0;
+    }
+    leafletMap = L.map(container, mapOpts);
+    if (isKa) {
+        // Real map tiles for Karnataka tasks
+        L.tileLayer('https://{s}.basemaps.cartocdn.com/dark_all/{z}/{x}/{y}{r}.png', {
+            subdomains: 'abcd',
+            maxZoom: 19,
+        }).addTo(leafletMap);
+        L.control.attribution({position: 'bottomright', prefix: false})
+            .addAttribution('© <a href="https://carto.com/">CARTO</a>')
+            .addTo(leafletMap);
+        leafletMap.fitBounds(kaBounds, { padding: [20, 20] });
+    }
+    // Procedural grids: no tiles — plain dark background via CSS
     // Layer groups for easy clearing
     mapLayers.lines = L.layerGroup().addTo(leafletMap);
     // Fix Leaflet size after container is fully rendered
     setTimeout(() => {
         leafletMap.invalidateSize();
+        if (isKa) leafletMap.fitBounds(kaBounds, { padding: [20, 20] });
     }, 200);
 }
             if (!from || !to) return;
             const lc = !l.connected ? '#4a5568' : l.rho > 1 ? '#ff1744' : l.rho > 0.8 ? '#ff9100' : '#e91e63';
+            const w = !l.connected ? 2 : l.rho > 1 ? 6 : l.rho > 0.8 ? 5 : 3.5;
+            // Glow layer for overloaded/congested lines
+            if (l.connected && l.rho > 0.8) {
+                const glow = L.polyline(
+                    [[from.lat, from.lon], [to.lat, to.lon]],
+                    { color: lc, weight: w + 6, opacity: 0.15, dashArray: null, interactive: false }
+                );
+                mapLayers.lines.addLayer(glow);
+            }
             const polyline = L.polyline(
                 [[from.lat, from.lon], [to.lat, to.lon]],
+                { color: lc, weight: w, dashArray: l.connected ? '12 6' : '4 6', opacity: 0.95 }
             );
+            // Show tooltip with flow info
+            const flowStr = l.connected ? `${l.flow.toFixed(0)} MW · ${(l.rho*100).toFixed(0)}% load` : 'Disconnected';
+            polyline.bindTooltip(`<b>${l.id}</b><br>${flowStr}`, {
+                permanent: false, className: 'leaflet-tooltip-dark', direction: 'center'
+            });
+            // Permanent label for high-flow lines
+            if (l.connected && Math.abs(l.flow) > 10) {
+                const midLat = (from.lat + to.lat) / 2;
+                const midLon = (from.lon + to.lon) / 2;
+                const flowLabel = L.divIcon({
+                    className: 'line-flow-label',
+                    html: `<span style="color:${lc};text-shadow:0 0 4px #000,0 0 8px #000;font-size:9px;font-family:'JetBrains Mono',monospace;font-weight:600;white-space:nowrap;">${Math.abs(l.flow).toFixed(0)}MW</span>`,
+                    iconSize: [40, 12],
+                    iconAnchor: [20, 6],
                 });
+                L.marker([midLat, midLon], { icon: flowLabel, interactive: false }).addTo(mapLayers.lines);
             }
             mapLayers.lines.addLayer(polyline);
         });
     }

static/index.html CHANGED Viewed

@@ -66,6 +66,46 @@
         </div>
     </header>
     <!-- ===== LEFT PANEL ===== -->
     <aside class="left-panel">
@@ -128,25 +168,7 @@
         <!-- Exception Log -->
         <div class="card" style="flex:1; display:flex; flex-direction:column; overflow:hidden;">
             <div class="card-title" style="color: var(--status-warning);">Exception Log</div>
-            <div class="alarm-log" id="alarmLog">
-                <!-- Populated by JS -->
-            </div>
-        </div>
-        <!-- Task Selector -->
-        <div class="card" style="flex-shrink:0;">
-            <div class="card-title">Task &amp; Controls</div>
-            <div class="task-selector" id="taskSelector">
-                <button class="task-btn" data-task="task_easy">Easy</button>
-                <button class="task-btn" data-task="task_medium">Medium</button>
-                <button class="task-btn" data-task="task_hard">Hard</button>
-                <button class="task-btn active" data-task="task_karnataka" style="color: #ffeb3b; border-color: rgba(255,235,59,0.3);">Karnataka</button>
-            </div>
-            <div class="controls-row" style="margin-top: var(--gap-sm);">
-                <button class="ctrl-btn active" id="btnReset" onclick="resetEpisode()">Reset</button>
-                <button class="ctrl-btn" id="btnStep" onclick="stepEpisode()">Step</button>
-                <button class="ctrl-btn" id="btnAutoRun" onclick="toggleAutoRun()">Auto</button>
-            </div>
         </div>
     </aside>
@@ -154,6 +176,19 @@
     <!-- ===== CENTER PANEL (Grid Map) ===== -->
     <main class="center-panel" id="centerPanel">
         <div class="grid-map" id="gridMap"></div>
         <div class="bus-tooltip" id="busTooltip">
             <div class="tt-title" id="ttTitle">Bus 0</div>
             <div class="tt-row"><span>Type</span><span class="tt-val" id="ttType">--</span></div>
@@ -162,60 +197,29 @@
         </div>
     </main>
-    <!-- ===== RIGHT PANEL (Agent Monitor) ===== -->
     <aside class="right-panel">
         <div class="card">
             <div class="card-title">Agent Leaderboard</div>
-            <ul class="leaderboard" id="leaderboard">
-                <!-- Populated by JS -->
-            </ul>
-        </div>
-        <div id="agentCards">
-            <!-- Populated by JS -->
         </div>
     </aside>
     <!-- ===== BOTTOM PANEL ===== -->
     <footer class="bottom-panel">
-        <!-- Reward History Chart -->
         <div class="bottom-card">
             <div class="card-title">Reward History</div>
             <div class="chart-area" id="rewardChart"></div>
         </div>
-        <!-- Frequency Trend -->
         <div class="bottom-card">
             <div class="card-title">Frequency Trend</div>
             <div class="chart-area" id="freqChart"></div>
         </div>
-        <!-- Generation Mix -->
         <div class="bottom-card">
             <div class="card-title">Generation Mix</div>
             <div class="chart-area" id="genMixChart"></div>
         </div>
-        <!-- Episode Score -->
-        <div class="bottom-card">
-            <div class="card-title">Episode Score</div>
-            <div class="coord-score" style="flex:1; display:flex; flex-direction:column; justify-content:center;">
-                <div class="big-value" id="episodeScore" style="color: var(--chart-reward); font-size: 36px;">--</div>
-                <div style="font-size:10px; color: var(--text-secondary); margin-top:4px;">Grader Score</div>
-                <div style="font-size:11px; margin-top:8px;">
-                    <span style="color: var(--text-secondary);">Steps:</span>
-                    <span id="totalSteps" style="font-family: 'JetBrains Mono'; font-weight:600;">0</span>
-                    <span style="color: var(--text-secondary); margin-left:8px;">Blackout:</span>
-                    <span id="blackoutStatus" style="font-family: 'JetBrains Mono'; font-weight:600; color: var(--status-normal);">No</span>
-                </div>
-            </div>
-            <div class="controls-row">
-                <button class="ctrl-btn" onclick="getGrade()">Grade</button>
-                <button class="ctrl-btn danger" onclick="resetEpisode()">New Episode</button>
-            </div>
-        </div>
     </footer>
 </div>

         </div>
     </header>
+    <!-- ===== TOOLBAR ===== -->
+    <div class="toolbar">
+        <div class="toolbar-section">
+            <span class="toolbar-label">PROCEDURAL</span>
+            <div class="task-group" id="proceduralTasks">
+                <!-- Populated by JS -->
+            </div>
+        </div>
+        <div class="toolbar-divider"></div>
+        <div class="toolbar-section">
+            <span class="toolbar-label">KARNATAKA</span>
+            <div class="task-group" id="karnatakaTasks">
+                <!-- Populated by JS -->
+            </div>
+        </div>
+        <div class="toolbar-divider"></div>
+        <div class="toolbar-section">
+            <span class="toolbar-label">CONTROLS</span>
+            <div class="controls-row">
+                <button class="ctrl-btn accent" id="btnReset" onclick="resetEpisode()">⟳ Reset</button>
+                <button class="ctrl-btn" id="btnStep" onclick="stepEpisode()">▶ Step</button>
+                <button class="ctrl-btn" id="btnAutoRun" onclick="toggleAutoRun()">⏩ Auto</button>
+                <button class="ctrl-btn" onclick="getGrade()">★ Grade</button>
+            </div>
+        </div>
+        <div class="toolbar-divider"></div>
+        <div class="toolbar-section">
+            <span class="toolbar-label">SCORE</span>
+            <div class="toolbar-score" id="episodeScore">--</div>
+        </div>
+        <div class="toolbar-section" style="margin-left:auto;">
+            <span class="toolbar-label">STEPS</span>
+            <span class="toolbar-value" id="totalSteps">0</span>
+        </div>
+        <div class="toolbar-section">
+            <span class="toolbar-label">BLACKOUT</span>
+            <span class="toolbar-value" id="blackoutStatus" style="color: var(--status-normal);">No</span>
+        </div>
+    </div>
     <!-- ===== LEFT PANEL ===== -->
     <aside class="left-panel">
         <!-- Exception Log -->
         <div class="card" style="flex:1; display:flex; flex-direction:column; overflow:hidden;">
             <div class="card-title" style="color: var(--status-warning);">Exception Log</div>
+            <div class="alarm-log" id="alarmLog"></div>
         </div>
     </aside>
     <!-- ===== CENTER PANEL (Grid Map) ===== -->
     <main class="center-panel" id="centerPanel">
         <div class="grid-map" id="gridMap"></div>
+        <!-- Map legend -->
+        <div class="map-legend">
+            <div class="legend-title">Legend</div>
+            <div class="legend-item"><span class="legend-dot" style="background:#00e5a0;"></span> Slack</div>
+            <div class="legend-item"><span class="legend-dot" style="background:#f5a623;"></span> Generator</div>
+            <div class="legend-item"><span class="legend-dot" style="background:#e94560;"></span> Load</div>
+            <div class="legend-item"><span class="legend-dot" style="background:#4a90d9;"></span> Battery</div>
+            <div class="legend-item"><span class="legend-dot" style="background:#ffeb3b;"></span> Solar</div>
+            <div class="legend-item"><span class="legend-dot" style="background:#64ffda;"></span> Wind</div>
+            <div class="legend-line"><span class="legend-line-sample normal"></span> Normal</div>
+            <div class="legend-line"><span class="legend-line-sample warn"></span> Congested</div>
+            <div class="legend-line"><span class="legend-line-sample crit"></span> Overloaded</div>
+        </div>
         <div class="bus-tooltip" id="busTooltip">
             <div class="tt-title" id="ttTitle">Bus 0</div>
             <div class="tt-row"><span>Type</span><span class="tt-val" id="ttType">--</span></div>
         </div>
     </main>
+    <!-- ===== RIGHT PANEL ===== -->
     <aside class="right-panel">
         <div class="card">
             <div class="card-title">Agent Leaderboard</div>
+            <ul class="leaderboard" id="leaderboard"></ul>
         </div>
+        <div id="agentCards"></div>
     </aside>
     <!-- ===== BOTTOM PANEL ===== -->
     <footer class="bottom-panel">
         <div class="bottom-card">
             <div class="card-title">Reward History</div>
             <div class="chart-area" id="rewardChart"></div>
         </div>
         <div class="bottom-card">
             <div class="card-title">Frequency Trend</div>
             <div class="chart-area" id="freqChart"></div>
         </div>
         <div class="bottom-card">
             <div class="card-title">Generation Mix</div>
             <div class="chart-area" id="genMixChart"></div>
         </div>
     </footer>
 </div>

static/style.css CHANGED Viewed

@@ -89,10 +89,11 @@ body::before {
 /* ---------- Layout ---------- */
 .control-room {
     display: grid;
-    grid-template-rows: 52px 1fr 180px;
-    grid-template-columns: 260px 1fr 300px;
     grid-template-areas:
         "header  header  header"
         "left    center  right"
         "bottom  bottom  bottom";
     height: 100vh;
@@ -100,6 +101,190 @@ body::before {
     background: rgba(255,255,255,0.04);
 }
 /* ---------- Header ---------- */
 .header {
     grid-area: header;
@@ -667,7 +852,7 @@ body::before {
     grid-area: bottom;
     background: var(--bg-secondary);
     display: grid;
-    grid-template-columns: 2fr 1fr 1fr 1fr;
     gap: 1px;
     border-top: 1px solid rgba(255,255,255,0.05);
 }
@@ -695,73 +880,6 @@ body::before {
     flex: 1;
 }
-/* Controls */
-.controls-row {
-    display: flex;
-    gap: var(--gap-sm);
-    margin-top: var(--gap-sm);
-}
-.ctrl-btn {
-    flex: 1;
-    padding: 6px 10px;
-    background: rgba(255,255,255,0.04);
-    border: 1px solid rgba(255,255,255,0.1);
-    border-radius: var(--radius-sm);
-    color: var(--text-primary);
-    font-family: 'Inter', sans-serif;
-    font-size: 11px;
-    font-weight: 500;
-    cursor: pointer;
-    transition: all 0.2s;
-    text-align: center;
-}
-.ctrl-btn:hover {
-    background: rgba(0,229,160,0.1);
-    border-color: rgba(0,229,160,0.3);
-}
-.ctrl-btn.active {
-    background: rgba(0,229,160,0.15);
-    border-color: var(--status-normal);
-    color: var(--status-normal);
-}
-.ctrl-btn.danger {
-    border-color: rgba(255,61,61,0.3);
-}
-.ctrl-btn.danger:hover {
-    background: rgba(255,61,61,0.1);
-    border-color: rgba(255,61,61,0.5);
-    color: var(--status-critical);
-}
-/* Task selector */
-.task-selector {
-    display: flex;
-    gap: 4px;
-}
-.task-btn {
-    flex: 1;
-    padding: 4px 8px;
-    background: rgba(255,255,255,0.03);
-    border: 1px solid rgba(255,255,255,0.08);
-    border-radius: var(--radius-sm);
-    color: var(--text-secondary);
-    font-size: 10px;
-    font-weight: 500;
-    cursor: pointer;
-    transition: all 0.2s;
-    text-transform: uppercase;
-    letter-spacing: 0.5px;
-}
-.task-btn:hover { border-color: rgba(0,229,160,0.3); color: var(--text-primary); }
-.task-btn.active { background: rgba(0,229,160,0.1); border-color: var(--status-normal); color: var(--status-normal); }
 /* Leaderboard */
 .leaderboard {
     list-style: none;
@@ -933,3 +1051,14 @@ body::before {
 .leaflet-control-attribution a {
     color: #666 !important;
 }

 /* ---------- Layout ---------- */
 .control-room {
     display: grid;
+    grid-template-rows: 48px 44px 1fr 160px;
+    grid-template-columns: 240px 1fr 280px;
     grid-template-areas:
         "header  header  header"
+        "toolbar toolbar toolbar"
         "left    center  right"
         "bottom  bottom  bottom";
     height: 100vh;
     background: rgba(255,255,255,0.04);
 }
+/* ---------- Toolbar ---------- */
+.toolbar {
+    grid-area: toolbar;
+    background: linear-gradient(90deg, #0d1225, #111a33);
+    display: flex;
+    align-items: center;
+    padding: 0 var(--gap-md);
+    gap: var(--gap-md);
+    border-bottom: 1px solid rgba(0,229,160,0.1);
+    z-index: 10;
+    overflow-x: auto;
+}
+.toolbar-section {
+    display: flex;
+    align-items: center;
+    gap: 8px;
+    flex-shrink: 0;
+}
+.toolbar-label {
+    font-size: 9px;
+    font-weight: 600;
+    text-transform: uppercase;
+    letter-spacing: 1.2px;
+    color: var(--text-muted);
+    white-space: nowrap;
+}
+.toolbar-divider {
+    width: 1px;
+    height: 24px;
+    background: rgba(255,255,255,0.08);
+    flex-shrink: 0;
+}
+.toolbar-score {
+    font-family: 'JetBrains Mono', monospace;
+    font-size: 18px;
+    font-weight: 700;
+    color: var(--chart-reward);
+}
+.toolbar-value {
+    font-family: 'JetBrains Mono', monospace;
+    font-size: 13px;
+    font-weight: 600;
+    color: var(--text-primary);
+}
+/* Task buttons (toolbar version) */
+.task-selector {
+    display: flex;
+    gap: 4px;
+}
+.task-btn {
+    display: flex;
+    flex-direction: column;
+    align-items: center;
+    padding: 4px 10px;
+    background: rgba(255,255,255,0.03);
+    border: 1px solid rgba(255,255,255,0.08);
+    border-radius: var(--radius-sm);
+    color: var(--text-secondary);
+    font-size: 11px;
+    font-weight: 600;
+    cursor: pointer;
+    transition: all 0.2s;
+    text-transform: uppercase;
+    letter-spacing: 0.5px;
+    line-height: 1.2;
+}
+.task-btn .task-name { font-size: 11px; }
+.task-btn .task-info {
+    font-size: 8px;
+    font-weight: 400;
+    color: var(--text-muted);
+    letter-spacing: 0;
+    text-transform: none;
+    white-space: nowrap;
+}
+.task-btn:hover { border-color: rgba(0,229,160,0.3); color: var(--text-primary); }
+.task-btn.active {
+    background: rgba(0,229,160,0.12);
+    border-color: var(--status-normal);
+    color: var(--status-normal);
+}
+.task-btn.active .task-info { color: rgba(0,229,160,0.6); }
+/* Karnataka scenario gold accent */
+.task-btn.ka:hover { border-color: rgba(255,235,59,0.4); color: #ffeb3b; }
+.task-btn.ka.active {
+    background: rgba(255,235,59,0.1);
+    border-color: #ffeb3b;
+    color: #ffeb3b;
+}
+.task-btn.ka.active .task-info { color: rgba(255,235,59,0.5); }
+/* Task group container */
+.task-group {
+    display: flex;
+    gap: 4px;
+}
+/* Controls in toolbar */
+.controls-row {
+    display: flex;
+    gap: 4px;
+}
+.ctrl-btn {
+    padding: 5px 12px;
+    background: rgba(255,255,255,0.04);
+    border: 1px solid rgba(255,255,255,0.1);
+    border-radius: var(--radius-sm);
+    color: var(--text-primary);
+    font-family: 'Inter', sans-serif;
+    font-size: 11px;
+    font-weight: 500;
+    cursor: pointer;
+    transition: all 0.2s;
+    text-align: center;
+    white-space: nowrap;
+}
+.ctrl-btn:hover {
+    background: rgba(0,229,160,0.1);
+    border-color: rgba(0,229,160,0.3);
+}
+.ctrl-btn.accent {
+    background: rgba(0,229,160,0.12);
+    border-color: rgba(0,229,160,0.3);
+    color: var(--status-normal);
+}
+.ctrl-btn.active {
+    background: rgba(0,229,160,0.2);
+    border-color: var(--status-normal);
+    color: var(--status-normal);
+    box-shadow: 0 0 8px rgba(0,229,160,0.15);
+}
+.ctrl-btn.danger { border-color: rgba(255,61,61,0.3); }
+.ctrl-btn.danger:hover {
+    background: rgba(255,61,61,0.1);
+    border-color: rgba(255,61,61,0.5);
+    color: var(--status-critical);
+}
+/* ---------- Map Legend ---------- */
+/* Floating legend pinned to the bottom-left corner of the map panel.
+   NOTE(review): relies on the containing panel being a positioned ancestor
+   (position: relative/absolute) — confirm on .center-panel. */
+.map-legend {
+    position: absolute;
+    bottom: 12px;
+    left: 12px;
+    background: rgba(10,14,26,0.92);
+    border: 1px solid rgba(255,255,255,0.1);
+    border-radius: var(--radius-md);
+    padding: 8px 12px;
+    z-index: 5;
+    /* Prefixed form first: older Safari/WebKit only honours -webkit-backdrop-filter. */
+    -webkit-backdrop-filter: blur(8px);
+    backdrop-filter: blur(8px);
+    font-size: 10px;
+}
+.legend-title {
+    font-size: 9px;
+    font-weight: 600;
+    text-transform: uppercase;
+    letter-spacing: 1px;
+    color: var(--text-muted);
+    margin-bottom: 4px;
+}
+.legend-item, .legend-line {
+    display: flex;
+    align-items: center;
+    gap: 6px;
+    padding: 1px 0;
+    color: var(--text-secondary);
+}
+.legend-dot {
+    width: 8px;
+    height: 8px;
+    border-radius: 50%;
+    flex-shrink: 0;
+}
+.legend-line-sample {
+    width: 20px;
+    height: 3px;
+    border-radius: 2px;
+    flex-shrink: 0;
+}
+.legend-line-sample.normal { background: #e91e63; }
+.legend-line-sample.warn { background: #ff9100; }
+.legend-line-sample.crit { background: #ff1744; box-shadow: 0 0 6px rgba(255,23,68,0.5); }
 /* ---------- Header ---------- */
 .header {
     grid-area: header;
     grid-area: bottom;
     background: var(--bg-secondary);
     display: grid;
+    grid-template-columns: 2fr 1fr 1fr;
     gap: 1px;
     border-top: 1px solid rgba(255,255,255,0.05);
 }
     flex: 1;
 }
 /* Leaderboard */
 .leaderboard {
     list-style: none;
 .leaflet-control-attribution a {
     color: #666 !important;
 }
+.line-flow-label {
+    background: none !important;
+    border: none !important;
+    text-align: center;
+}
+/* Dark background for procedural grids (no map tiles) */
+.leaflet-container {
+    background: #0a0e1a !important;
+}

training/train_grpo.py CHANGED Viewed

@@ -786,6 +786,94 @@ def run_test_mode():
     print("="*60)
 # ============================================================================
 # Main
 # ============================================================================
@@ -795,7 +883,7 @@ def main():
     parser.add_argument("--model", default="Qwen/Qwen2.5-1.5B-Instruct",
                         help="HuggingFace model name or path")
     parser.add_argument("--task", default="task_easy", choices=list(TASKS.keys()),
-                        help="Which task to train on")
     parser.add_argument("--epochs", type=int, default=3, help="Number of training epochs")
     parser.add_argument("--batch-size", type=int, default=2, help="Batch size per device")
     parser.add_argument("--num-prompts", type=int, default=50,
@@ -806,6 +894,10 @@ def main():
                         help="Use Unsloth for 4-bit quantized training")
     parser.add_argument("--test-mode", action="store_true",
                         help="Run pipeline verification without GPU")
     args = parser.parse_args()
@@ -816,11 +908,12 @@ def main():
     # Create output directory
     Path(args.output_dir).mkdir(parents=True, exist_ok=True)
-    # Run training
-    train_result = train_grpo(args)
-    print("\n[DONE] Training complete!")
-    print(f"  Output: {args.output_dir}")
 if __name__ == "__main__":

     print("="*60)
+# ============================================================================
+# Curriculum Training
+# ============================================================================
+CURRICULUM_ORDER = ["karnataka_easy", "karnataka_medium", "karnataka_hard", "task_karnataka"]
+def run_curriculum(args):
+    """Run curriculum training: easy→medium→hard→full on Karnataka grid.
+    Each phase trains for `args.epochs` epochs, saves a checkpoint,
+    and the next phase resumes from that checkpoint.
+    """
+    print("\n" + "=" * 60)
+    print("  OpenGrid Curriculum Training")
+    print(f"  Phases: {' → '.join(CURRICULUM_ORDER)}")
+    print(f"  Epochs per phase: {args.epochs}")
+    print("=" * 60)
+    checkpoint_path = args.resume_from
+    all_results = {}
+    for phase_idx, task_id in enumerate(CURRICULUM_ORDER):
+        phase_num = phase_idx + 1
+        print(f"\n{'─' * 60}")
+        print(f"  Phase {phase_num}/{len(CURRICULUM_ORDER)}: {task_id}")
+        if checkpoint_path:
+            print(f"  Resuming from: {checkpoint_path}")
+        print(f"{'─' * 60}")
+        # Override args for this phase
+        phase_args = copy.copy(args)
+        phase_args.task = task_id
+        phase_args.output_dir = str(Path(args.output_dir) / f"phase_{phase_num}_{task_id}")
+        if checkpoint_path:
+            phase_args.model = checkpoint_path
+        Path(phase_args.output_dir).mkdir(parents=True, exist_ok=True)
+        # Train this phase
+        train_result = train_grpo(phase_args)
+        # Set checkpoint for next phase
+        checkpoint_path = str(Path(phase_args.output_dir) / "trained_model")
+        # Evaluate on all Karnataka tasks
+        print(f"\n  [EVAL] Phase {phase_num} evaluation...")
+        eval_tasks = CURRICULUM_ORDER
+        from src.baseline import heuristic_policy
+        def heuristic_generate(prompt):
+            freq_match = re.search(r'Frequency:\s*([-+]?\d+(?:\.\d+)?)', prompt)
+            freq = float(freq_match.group(1)) if freq_match else 50.0
+            error = 50.0 - freq
+            delta = max(-20, min(20, error * 10))
+            bus_matches = re.findall(r'Bus (\d+) \((generator|battery)\)', prompt)
+            if bus_matches:
+                per_bus = delta / len(bus_matches)
+                return json.dumps({"bus_adjustments": [{"bus_id": int(m[0]), "delta": round(per_bus, 1)} for m in bus_matches], "topology_actions": []})
+            return json.dumps({"bus_adjustments": [], "topology_actions": []})
+        phase_results = evaluate_model(heuristic_generate, task_ids=eval_tasks, n_episodes=2)
+        all_results[f"phase_{phase_num}"] = phase_results
+        for tid, res in phase_results.items():
+            print(f"    {tid}: {res['avg_reward']:.2f} ± {res['std_reward']:.2f}")
+    # Summary
+    print("\n" + "=" * 60)
+    print("  CURRICULUM TRAINING COMPLETE")
+    print("=" * 60)
+    print(f"  Final model: {checkpoint_path}")
+    print(f"  Phases completed: {len(CURRICULUM_ORDER)}")
+    # Save curriculum summary
+    summary = {
+        "phases": CURRICULUM_ORDER,
+        "epochs_per_phase": args.epochs,
+        "results": {k: {t: {"avg": round(r["avg_reward"], 2)} for t, r in v.items()} for k, v in all_results.items()},
+        "final_model": checkpoint_path,
+    }
+    summary_path = Path(args.output_dir) / "curriculum_summary.json"
+    with open(summary_path, "w") as f:
+        json.dump(summary, f, indent=2)
+    print(f"  Summary: {summary_path}")
+    return summary
 # ============================================================================
 # Main
 # ============================================================================
     parser.add_argument("--model", default="Qwen/Qwen2.5-1.5B-Instruct",
                         help="HuggingFace model name or path")
     parser.add_argument("--task", default="task_easy", choices=list(TASKS.keys()),
+                        help="Which task to train on (ignored if --curriculum)")
     parser.add_argument("--epochs", type=int, default=3, help="Number of training epochs")
     parser.add_argument("--batch-size", type=int, default=2, help="Batch size per device")
     parser.add_argument("--num-prompts", type=int, default=50,
                         help="Use Unsloth for 4-bit quantized training")
     parser.add_argument("--test-mode", action="store_true",
                         help="Run pipeline verification without GPU")
+    parser.add_argument("--curriculum", action="store_true",
+                        help="Run curriculum training: karnataka_easy → medium → hard → full")
+    parser.add_argument("--resume-from", default=None,
+                        help="Resume training from a checkpoint path")
     args = parser.parse_args()
     # Create output directory
     Path(args.output_dir).mkdir(parents=True, exist_ok=True)
+    if args.curriculum:
+        run_curriculum(args)
+    else:
+        train_result = train_grpo(args)
+        print("\n[DONE] Training complete!")
+        print(f"  Output: {args.output_dir}")
 if __name__ == "__main__":