add flux map analysis script and configuration for detecting and tracking active regions

Browse files

Files changed (10) hide show

README.md +10 -3
analysis/ablation_analysis.py +126 -0
analysis/ablation_lollipop.py +162 -0
analysis/flux_map_analysis.py +916 -0
analysis/flux_map_config.yaml +67 -0
analysis/spatial_performance.py +1 -1
forecasting/inference/flare_analysis.py +0 -0
forecasting/inference/flare_analysis_poster.py +0 -0
pipeline_config.yaml +18 -1
run_pipeline.py +17 -17

README.md CHANGED Viewed

@@ -44,6 +44,11 @@ The solar soft X-ray (SXR) irradiance is a long-standing proxy of solar activity
 ```text
 FOXES
 ├── data                         # Data cleaning and preprocessing
 │   ├── align_data.py            # Align AIA and SXR timestamps; save matched pairs
 │   ├── euv_data_cleaning.py     # EUV image quality filtering and cleaning
@@ -67,8 +72,7 @@ FOXES
 │   ├── inference
 │   │   ├── inference.py         # Batch inference; writes predictions.csv
 │   │   ├── evaluation.py        # Compute metrics and generate evaluation plots
-│   │   ├── flare_analysis.py    # Detect, track, and match flares; generate plots
-│   │   ├── local_config.yaml    # Config for inference.py and flare_analysis.py
 │   │   └── evaluation_config.yaml  # Config for evaluation.py
 │   ├── models
 │   │   └── vit_patch_model_local.py   # ViTLocal: Vision Transformer with patch flux heads
@@ -126,7 +130,9 @@ FOXES uses a single orchestrator script (`run_pipeline.py`) and a top-level conf
 | 7 | `train` | Train the ViTLocal solar flare forecasting model                               |
 | 8 | `inference` | Run batch inference and save a predictions CSV                                 |
 | 9 | `evaluate` | Compute metrics and generate evaluation plots                                  |
-| 10 | `flare_analysis` | Detect, track, and match flares; generate plots/movies                         |
 ### Usage
@@ -245,6 +251,7 @@ Steps can also be run individually by calling their scripts directly:
 python forecasting/training/train.py -config forecasting/training/train_config.yaml
 python forecasting/inference/inference.py -config forecasting/inference/local_config.yaml
 python forecasting/inference/evaluation.py -config forecasting/inference/evaluation_config.yaml
 ```
 ---

 ```text
 FOXES
+├── analysis                     # Post-inference analysis scripts
+│   ├── flux_map_analysis.py     # Detect, track, and visualize active regions from flux maps
+│   ├── flux_map_config.yaml     # Config for flux_map_analysis.py
+│   ├── spatial_performance.py   # Flux-weighted spatial error heatmap on the solar disk
+│   └── ablation_analysis.py     # Ablation study visualization
 ├── data                         # Data cleaning and preprocessing
 │   ├── align_data.py            # Align AIA and SXR timestamps; save matched pairs
 │   ├── euv_data_cleaning.py     # EUV image quality filtering and cleaning
 │   ├── inference
 │   │   ├── inference.py         # Batch inference; writes predictions.csv
 │   │   ├── evaluation.py        # Compute metrics and generate evaluation plots
+│   │   ├── local_config.yaml    # Config for inference.py
 │   │   └── evaluation_config.yaml  # Config for evaluation.py
 │   ├── models
 │   │   └── vit_patch_model_local.py   # ViTLocal: Vision Transformer with patch flux heads
 | 7 | `train` | Train the ViTLocal solar flare forecasting model                               |
 | 8 | `inference` | Run batch inference and save a predictions CSV                                 |
 | 9 | `evaluate` | Compute metrics and generate evaluation plots                                  |
+| 10 | `ablation` | Run channel-masking ablation study on a pretrained model                       |
+| 11 | `spatial_performance` | Generate flux-weighted spatial error heatmap on the solar disk            |
+| 12 | `flux_map_analysis` | Detect and track active regions from flux maps; render frames and a movie  |
 ### Usage
 python forecasting/training/train.py -config forecasting/training/train_config.yaml
 python forecasting/inference/inference.py -config forecasting/inference/local_config.yaml
 python forecasting/inference/evaluation.py -config forecasting/inference/evaluation_config.yaml
+python analysis/flux_map_analysis.py --config analysis/flux_map_config.yaml
 ```
 ---

analysis/ablation_analysis.py ADDED Viewed

	@@ -0,0 +1,126 @@

+import pandas as pd
+import numpy as np
+import matplotlib.pyplot as plt
+import matplotlib.ticker as mticker
+from matplotlib import rcParams
+import sys
+from pathlib import Path
+PROJECT_ROOT = Path(__file__).parent.parent
+sys.path.insert(0, str(PROJECT_ROOT))
+from forecasting.inference.evaluation import setup_barlow_font
+setup_barlow_font()
+# Ablation CSVs are read from <repo>/Untracked/data. Deriving the location from
+# PROJECT_ROOT keeps the script runnable from any checkout instead of only from
+# one developer's home directory.
+DATA_DIR = PROJECT_ROOT / "Untracked" / "data"
+# One CSV (ablate_<wav>_global_1.csv) and one panel per entry; LABELS is
+# index-aligned with WAVELENGTHS.
+WAVELENGTHS = ["94", "131", "171", "193", "211", "304", "335", "stereo", "all"]
+LABELS = ["Ablate 94 Å", "Ablate 131 Å", "Ablate 171 Å", "Ablate 193 Å",
+          "Ablate 211 Å", "Ablate 304 Å", "Ablate 335 Å", "Ablate STEREO", "Ablate All"]
+# Applied after setup_barlow_font(): family is the generic 'sans-serif' group,
+# with Barlow first in the fallback list.
+rcParams['font.family'] = 'sans-serif'
+rcParams['font.sans-serif'] = ['Barlow', 'Arial', 'DejaVu Sans']
+# Class label -> (lower, upper) flux bounds in W/m^2; only the lower bound is
+# used for tick placement.
+FLARE_CLASSES = {
+    'A1.0': (1e-8, 1e-7),
+    'B1.0': (1e-7, 1e-6),
+    'C1.0': (1e-6, 1e-5),
+    'M1.0': (1e-5, 1e-4),
+    'X1.0': (1e-4, 1e-3),
+}
+text_color  = 'black'
+grid_color  = '#CCCCCC'
+# Hard clamps on the plotted flux range, applied to every panel.
+VMIN_GLOBAL = 1e-9
+VMAX_GLOBAL = 1e-2
+def add_flare_class_axes(ax, vmin, vmax):
+    """Add top and right secondary axes ticked with flare-class labels.
+
+    A class from FLARE_CLASSES gets a tick only when its lower flux bound lies
+    inside [vmin, vmax]. Both secondary axes share the primary axis scale
+    (identity transform) and have their grid switched off.
+    """
+    def _same(value):
+        return value
+    # Pair each visible lower bound with its label, in FLARE_CLASSES order.
+    visible = [(bounds[0], cls) for cls, bounds in FLARE_CLASSES.items()
+               if vmin <= bounds[0] <= vmax]
+    positions = [lower for lower, _ in visible]
+    labels = [cls for _, cls in visible]
+    ax_top = ax.secondary_xaxis('top', functions=(_same, _same))
+    ax_right = ax.secondary_yaxis('right', functions=(_same, _same))
+    ax_top.set_xticks(positions)
+    ax_top.set_xticklabels(labels, fontsize=6, color=text_color, rotation=45, ha='left')
+    ax_right.set_yticks(positions)
+    ax_right.set_yticklabels(labels, fontsize=6, color=text_color)
+    for secondary in (ax_top, ax_right):
+        secondary.grid(False)
+        secondary.tick_params(length=3)
+# One hexbin panel (prediction vs. ground truth) per ablation run on a 3x3 grid.
+fig, axes = plt.subplots(3, 3, figsize=(16, 14), layout='constrained')
+axes = axes.flatten()
+hb_last = None  # last hexbin artist; drives the shared colorbar
+for i, (wav, label) in enumerate(zip(WAVELENGTHS, LABELS)):
+    ab  = pd.read_csv(f"{DATA_DIR}/ablate_{wav}_global_1.csv")
+    gt  = ab["groundtruth"].values
+    pred = ab["predictions"].values
+    # Everything below works in log space, so keep strictly positive pairs only.
+    mask = (gt > 0) & (pred > 0)
+    gt, pred = gt[mask], pred[mask]
+    if gt.size == 0:
+        # Without this the min()/max() calls below fail with an opaque
+        # "zero-size array" reduction error.
+        raise ValueError(f"No strictly positive groundtruth/prediction pairs for ablation '{wav}'")
+    log_mae = np.mean(np.abs(np.log10(gt) - np.log10(pred)))
+    # Per-panel limits follow the data but are clamped to the global range.
+    vmin = max(VMIN_GLOBAL, min(gt.min(), pred.min()))
+    vmax = min(VMAX_GLOBAL, max(gt.max(), pred.max()))
+    ax = axes[i]
+    ax.set_facecolor("#FFFFFF")
+    # With log-scaled axes, hexbin expects `extent` in log10 units.
+    hb = ax.hexbin(gt, pred, gridsize=80, xscale='log', yscale='log',
+                   cmap='bone', mincnt=1, bins='log',
+                   extent=(np.log10(vmin), np.log10(vmax),
+                           np.log10(vmin), np.log10(vmax)))
+    hb_last = hb
+    # 1:1 line
+    ax.plot([vmin, vmax], [vmin, vmax], ls='--', c='red', alpha=0.85, lw=1.2)
+    ax.set_xlim(vmin, vmax)
+    ax.set_ylim(vmin, vmax)
+    ax.set_xscale('log')
+    ax.set_yscale('log')
+    #ax.set_title(label, fontsize=11, fontweight='bold', color=text_color)
+    ax.set_xlabel(r'Ground Truth (W/m$^2$)', fontsize=8, color=text_color)
+    ax.set_ylabel(r'Prediction (W/m$^2$)', fontsize=8, color=text_color)
+    ax.tick_params(labelsize=7, colors=text_color)
+    ax.grid(True, alpha=0.5, color=grid_color, linewidth=0.5)
+    ax.set_axisbelow(True)
+    for lbl in ax.get_xticklabels() + ax.get_yticklabels():
+        lbl.set_fontfamily('Barlow')
+    ax.text(0.04, 0.96, f"Log MAE = {log_mae:.3f}",
+            transform=ax.transAxes, fontsize=8, va='top', color=text_color,
+            bbox=dict(boxstyle='round,pad=0.3', facecolor='white',
+                      edgecolor='#CCCCCC', alpha=0.85))
+    add_flare_class_axes(ax, vmin, vmax)
+# Shared colorbar (taken from the last panel drawn)
+cbar = fig.colorbar(hb_last, ax=axes.tolist(), orientation='vertical', shrink=0.6, pad=0.01)
+cbar.set_label("Count (log)", fontsize=11, color=text_color)
+cbar.ax.tick_params(labelsize=9, colors=text_color)
+cbar.ax.yaxis.set_minor_locator(mticker.LogLocator(base=10, subs='auto', numticks=10))
+cbar.ax.tick_params(which='minor', colors=text_color)
+#fig.suptitle("Ablation Study: Channel Masking vs. Baseline", fontsize=14, fontweight='bold')
+# Save inside the repository's analysis/ directory, wherever it is checked out,
+# rather than to one developer's absolute path.
+out_path = PROJECT_ROOT / "analysis" / "ablation_3x3.png"
+plt.savefig(out_path, dpi=150, bbox_inches="tight")
+plt.show()
+print(f"Saved: {out_path}")

analysis/ablation_lollipop.py ADDED Viewed

	@@ -0,0 +1,162 @@

+import os
+import pandas as pd
+import numpy as np
+import matplotlib.pyplot as plt
+import matplotlib.patches as mpatches
+import matplotlib.font_manager as fm
+from matplotlib import rcParams
+def setup_barlow_font():
+    """Select the Barlow font for matplotlib, falling back to sans-serif.
+
+    If matplotlib's font manager already lists a Barlow font, it is used
+    directly. Otherwise a short list of known install locations is probed and
+    the first existing font file is registered. Any failure leaves the generic
+    'sans-serif' family active; this function never raises.
+    """
+    try:
+        barlow_fonts = [f.name for f in fm.fontManager.ttflist
+                        if 'barlow' in f.name.lower() or 'barlow' in f.fname.lower()]
+        if barlow_fonts:
+            rcParams['font.family'] = 'Barlow'
+            return
+        # Per-user font directory is resolved from the current user's home
+        # instead of a hard-coded account name.
+        candidate_paths = [
+            '/usr/share/fonts/truetype/barlow/Barlow-Regular.ttf',
+            os.path.expanduser('~/Library/Fonts/Barlow-Regular.otf'),
+        ]
+        for path in candidate_paths:
+            if os.path.exists(path):
+                fm.fontManager.addfont(path)
+                rcParams['font.family'] = 'Barlow'
+                return
+    except Exception:
+        # Font setup is cosmetic and best-effort: fall through to the default.
+        pass
+    rcParams['font.family'] = 'sans-serif'
+setup_barlow_font()
+# Ablation CSVs are read from <repo>/Untracked/data; the repo root is located
+# relative to this file (analysis/ablation_lollipop.py) so the script is not
+# tied to one developer's home directory.
+DATA_DIR     = os.path.join(os.path.dirname(os.path.dirname(os.path.abspath(__file__))),
+                            "Untracked", "data")
+# NOTE(review): machine-specific path on an external volume; it cannot be
+# derived from the repository layout, so edit it for your environment.
+BASELINE_CSV = "/Volumes/T9/FOXES_Misc/batch_results/vit/vit_predictions_test.csv"
+# Each entry selects ablate_<wav>_global_1.csv under DATA_DIR.
+# NOTE(review): analysis/ablation_analysis.py spells the last run "stereo"
+# (lower case); on a case-sensitive filesystem only one spelling can match the
+# file on disk. Confirm the actual file name.
+WAVELENGTHS = ["94", "131", "171", "193", "211", "304", "335","STEREO"]
+LABELS = {
+    "94":     "Ablate 94 Å",
+    "131":    "Ablate 131 Å",
+    "171":    "Ablate 171 Å",
+    "193":    "Ablate 193 Å",
+    "211":    "Ablate 211 Å",
+    "304":    "Ablate 304 Å",
+    "335":    "Ablate 335 Å",
+    "STEREO": "Ablate 94, 131, 335 Å\n(STEREO)",
+}
+# Class name -> half-open ground-truth flux interval [lo, hi) used for the
+# per-class MAE.
+FLARE_CLASSES = {
+    '< C': (1e-15, 1e-6),
+    'C':  (1e-6, 1e-5),
+    'M':  (1e-5, 1e-4),
+    'X':  (1e-4, 1e-2),
+}
+# Marker colour per flare class (same keys as FLARE_CLASSES).
+CLASS_COLORS = {
+    '< C': '#4C9BE8',
+    'C':  '#56C490',
+    'M':  '#F5A623',
+    'X':  '#E84C4C',
+}
+# ── Compute metrics ────────────────────────────────────────────────────────────
+def compute_row(label, gt, pred, is_baseline=False):
+    """Build one result row: overall and per-flare-class log10 MAE.
+
+    Pairs where either value is not strictly positive are dropped before any
+    logarithm is taken. A class column is NaN unless more than five samples
+    have a ground truth inside that class's [lo, hi) interval.
+    """
+    positive = (gt > 0) & (pred > 0)
+    gt = gt[positive]
+    pred = pred[positive]
+    # Absolute error in log10 space, computed once and reused per class.
+    abs_log_err = np.abs(np.log10(gt) - np.log10(pred))
+    row = {"label": label, "overall": np.mean(abs_log_err), "is_baseline": is_baseline}
+    for cls, (lo, hi) in FLARE_CLASSES.items():
+        in_class = (gt >= lo) & (gt < hi)
+        if in_class.sum() > 5:
+            row[cls] = np.mean(abs_log_err[in_class])
+        else:
+            row[cls] = np.nan
+    return row
+records = []
+# Baseline
+bl = pd.read_csv(BASELINE_CSV)
+records.append(compute_row("FOXES (no ablation)",
+                           bl["groundtruth"].values, bl["predictions"].values,
+                           is_baseline=True))
+for wav in WAVELENGTHS:
+    ab = pd.read_csv(f"{DATA_DIR}/ablate_{wav}_global_1.csv")
+    records.append(compute_row(LABELS[wav], ab["groundtruth"].values, ab["predictions"].values))
+# Sort ablation rows by overall MAE (worst first), keep baseline pinned at bottom
+ablation_df = pd.DataFrame([r for r in records if not r["is_baseline"]])
+ablation_df = ablation_df.sort_values("overall", ascending=False).reset_index(drop=True)
+baseline_df = pd.DataFrame([r for r in records if r["is_baseline"]])
+df = pd.concat([ablation_df, baseline_df], ignore_index=True)
+# ── Plot ───────────────────────────────────────────────────────────────────────
+n_rows = len(df)
+fig, ax = plt.subplots(figsize=(11, 0.6 * n_rows + 1.5))
+#ax.set_facecolor("#FAFAFA")
+fig.patch.set_facecolor("#FFFFFF")
+y_positions = np.arange(n_rows)
+# Separator line between ablations and baseline
+ax.axhline(y=n_rows - 1.5, color="#BBBBBB", linewidth=1, linestyle=":", zorder=1)
+# df has a fresh 0..n-1 index (ignore_index=True), so the row label doubles as
+# the position into y_positions.
+for i, row in df.iterrows():
+    y = y_positions[i]
+    is_bl = row["is_baseline"]
+    # Highlight baseline row
+    if is_bl:
+        ax.axhspan(y - 0.45, y + 0.45, color="#EEF6FF", zorder=0)
+    # Span line across per-class range
+    class_vals = [row[c] for c in FLARE_CLASSES if not np.isnan(row[c])]
+    if class_vals:
+        ax.hlines(y, min(class_vals), max(class_vals),
+                  color="#CCCCCC", linewidth=2, zorder=1)
+    # Stem from 0 to overall
+    ax.hlines(y, 0, row["overall"],
+              color="#AAAAAA", linewidth=1.2, linestyle="--", zorder=0, alpha=0.6)
+    # Per-class dots
+    for cls in FLARE_CLASSES:
+        val = row[cls]
+        if not np.isnan(val):
+            ax.scatter(val, y, color=CLASS_COLORS[cls], s=80, zorder=4,
+                       edgecolors="white", linewidths=0.6, alpha=0.75)
+    # Overall dot
+    outline_color = "#1A6BBF" if is_bl else "black"
+    ax.scatter(row["overall"], y, color="white", s=190, zorder=3,
+               edgecolors=outline_color, linewidths=2.0 if is_bl else 1.5, alpha=0.75)
+    ax.scatter(row["overall"], y, color=outline_color, s=75, zorder=3,
+               marker="|", linewidths=1.5, alpha=0.75)
+tick_colors = ["black"] * n_rows
+tick_colors[-1] = "#1A6BBF"  # baseline label in blue
+ax.set_yticks(y_positions)
+ax.set_yticklabels(df["label"], fontsize=12)
+for ticklabel, color in zip(ax.get_yticklabels(), tick_colors):
+    ticklabel.set_color(color)
+    if color != "black":
+        ticklabel.set_fontweight("bold")
+ax.set_xlabel("MAE (log$_{10}$ scale)", fontsize=12)
+ax.grid(True, axis="x", alpha=0.4, color="#CCCCCC", linewidth=0.6)
+ax.set_axisbelow(True)
+ax.spines[["top", "right"]].set_visible(False)
+ax.tick_params(axis="y", length=0, labelsize=11)
+ax.tick_params(axis="x", labelsize=10)
+# Legend
+class_patches = [
+    mpatches.Patch(color=CLASS_COLORS[c], label=f"{c}-class") for c in FLARE_CLASSES
+]
+overall_patch   = mpatches.Patch(facecolor="white", edgecolor="black",  label="Overall")
+#baseline_patch  = mpatches.Patch(facecolor="white", edgecolor="#1A6BBF", label="Baseline (overall)")
+ax.legend(handles=class_patches + [overall_patch],
+          loc="upper right", fontsize=10, framealpha=0.9,
+          edgecolor="#CCCCCC")
+# ax.set_title("Ablation Study — Log MAE by Channel & Flare Class",
+#              fontsize=14, fontweight="bold", pad=14)
+plt.xlim(0, .85)
+plt.tight_layout()
+# The figure is written relative to the current working directory, so report
+# the resolved location instead of assuming it landed in analysis/.
+out_path = "ablation_lollipop.png"
+plt.savefig(out_path, dpi=450, bbox_inches="tight")
+plt.show()
+print(f"Saved: {os.path.abspath(out_path)}")

analysis/flux_map_analysis.py ADDED Viewed

	@@ -0,0 +1,916 @@

+#!/usr/bin/env python3
+"""
+Flare Analysis — Frame & Movie Generator
+Detects and tracks active regions from flux contribution maps,
+then renders per-timestamp frames and stitches them into a movie.
+Usage:
+    python flux_map_analysis.py --config flux_map_config.yaml
+"""
+from __future__ import annotations
+import argparse
+import os
+import time
+import warnings
+from dataclasses import dataclass
+from datetime import datetime
+from heapq import heappush, heappop
+from multiprocessing import Pool
+from pathlib import Path
+from typing import Dict, List, Optional, Tuple
+import imageio.v2 as imageio
+import imageio_ffmpeg
+import matplotlib
+matplotlib.use('Agg')
+import matplotlib.dates as mdates
+import matplotlib.font_manager as fm
+import matplotlib.pyplot as plt
+import numpy as np
+import pandas as pd
+import yaml
+from matplotlib import rcParams
+from scipy.ndimage import maximum_filter, gaussian_filter
+from tqdm import tqdm
+warnings.filterwarnings('ignore')
+# =============================================================================
+# Configuration
+# =============================================================================
+@dataclass
+class FlareAnalysisConfig:
+    """Settings for active-region detection, tracking, and movie rendering.
+
+    Every field has a default, so an empty YAML file yields a usable object.
+    Use :meth:`from_yaml` to build an instance from a (possibly sectioned)
+    YAML configuration file.
+    """
+    # Paths
+    flux_path: Optional[str] = None
+    aia_path: Optional[str] = None
+    predictions_csv: Optional[str] = None
+    output_dir: Optional[str] = None
+    # Time range
+    start_time: Optional[str] = None
+    end_time: Optional[str] = None
+    # Detection
+    min_flux_threshold: float = 1e-7
+    threshold_std_multiplier: float = 3.0
+    spatial_smoothing_sigma: float = 1.0
+    radial_expansion_threshold_percentile: float = 30.0
+    peak_neighborhood_sizes: Tuple[int, ...] = (10, 15, 20, 25)
+    peak_min_scale_agreement: int = 2
+    peak_scale_tolerance: int = 2
+    min_peak_distance: int = 10
+    # Grid
+    grid_size: Tuple[int, int] = (64, 64)
+    patch_size: int = 8
+    input_size: int = 512
+    # Tracking
+    max_tracking_distance: int = 8
+    flux_ratio_weight: float = 0.1
+    size_ratio_weight: float = 0.1
+    distance_weight: float = 1.0
+    age_bonus_weight: float = 1.0  # scales 1/(1+age) penalty on new tracks
+    cadence_seconds: float = 60.0
+    max_gap_frames: int = 1  # frames a track can persist without a detection before expiring
+    # Movie / output
+    create_movie: bool = False
+    plot_window_hours: float = 4.0
+    movie_fps: float = 2.0
+    movie_frame_interval_minutes: float = 1.0
+    movie_num_workers: int = 4
+    movie_dpi: float = 75.0
+    movie_frame_format: str = 'jpg'
+    movie_jpeg_quality: int = 90
+    @classmethod
+    def from_yaml(cls, path: str) -> "FlareAnalysisConfig":
+        """Load a configuration from the YAML file at *path*.
+
+        Mapping rules, applied in order:
+
+        * Top-level scalars are taken as-is; one level of nested sections is
+          flattened into the same namespace.
+        * Inside the ``movie`` section, a key that is not itself a field but
+          whose ``movie_``-prefixed form is (``fps`` -> ``movie_fps``) is
+          renamed to the prefixed field.
+        * ``start`` / ``end`` are renamed to ``start_time`` / ``end_time``.
+        * List values for tuple-typed fields are converted to tuples.
+        * Keys that are not dataclass fields, and keys whose value is null,
+          are dropped so the field default applies.
+        """
+        # Read as UTF-8 explicitly; the platform default encoding is not UTF-8
+        # everywhere and would mis-decode non-ASCII paths or comments.
+        with open(path, encoding="utf-8") as f:
+            raw = yaml.safe_load(f) or {}
+        valid = cls.__dataclass_fields__
+        flat: Dict = {}
+        for key, val in raw.items():
+            if not isinstance(val, dict):
+                flat[key] = val
+            elif key == 'movie':
+                # The 'movie' section uses short keys (fps, dpi, …).
+                for k, v in val.items():
+                    prefixed = f'movie_{k}'
+                    use_prefixed = k not in valid and prefixed in valid
+                    flat[prefixed if use_prefixed else k] = v
+            else:
+                flat.update(val)
+        # Renamed YAML keys
+        for short, full in (('start', 'start_time'), ('end', 'end_time')):
+            if short in flat:
+                flat[full] = flat.pop(short)
+        # Lists → tuples for tuple-typed fields
+        for k in ('grid_size', 'peak_neighborhood_sizes'):
+            if isinstance(flat.get(k), list):
+                flat[k] = tuple(flat[k])
+        return cls(**{k: v for k, v in flat.items() if k in valid and v is not None})
+# =============================================================================
+# Utilities
+# =============================================================================
+def flux_to_goes_class(flux: float) -> str:
+    """Convert physical flux (W/m²) to a GOES class string such as ``"M2.3"``.
+
+    Returns ``"N/A"`` for non-numeric, non-finite, zero, or negative input.
+    Python and NumPy scalar numbers are both accepted. Classes A-M are capped
+    at 9.9 so rounding never prints e.g. ``"C10.0"``; X class is open-ended
+    (``2.8e-3`` -> ``"X28.0"``). Anything below 1e-7 is reported as A class.
+    """
+    # NumPy scalars (np.float32 in particular) are not instances of float, so
+    # they are listed explicitly.
+    if not isinstance(flux, (int, float, np.integer, np.floating)):
+        return "N/A"
+    if not np.isfinite(flux) or flux <= 0:
+        return "N/A"
+    if flux >= 1e-4:
+        # The X class has no upper bound, so the magnitude is not capped.
+        return f"X{flux / 1e-4:.1f}"
+    for prefix, scale in (("M", 1e-5), ("C", 1e-6), ("B", 1e-7)):
+        if flux >= scale:
+            break
+    else:
+        prefix, scale = "A", 1e-8
+    magnitude = min(flux / scale, 9.9)
+    return f"{prefix}{magnitude:.1f}"
+def setup_barlow_font() -> None:
+    """Make Barlow the active matplotlib font family when it can be found.
+
+    Fonts already known to the font manager are preferred (an exact
+    'Barlow' / 'Barlow Regular' name wins over other Barlow variants);
+    otherwise a few standard install locations are probed and the first
+    existing file is registered. On any failure the family falls back to
+    'sans-serif'.
+    """
+    try:
+        installed = [font.name for font in fm.fontManager.ttflist
+                     if 'barlow' in font.name.lower()]
+        if installed:
+            exact = [name for name in installed
+                     if name.lower() in ('barlow', 'barlow regular')]
+            rcParams['font.family'] = exact[0] if exact else installed[0]
+            return
+        candidates = (
+            os.path.expanduser('~/Library/Fonts/Barlow-Regular.otf'),
+            os.path.expanduser('~/Library/Fonts/Barlow-Regular.ttf'),
+            '/Library/Fonts/Barlow-Regular.otf',
+            '/usr/share/fonts/truetype/barlow/Barlow-Regular.ttf',
+        )
+        found = next((p for p in candidates if os.path.exists(p)), None)
+        if found is not None:
+            fm.fontManager.addfont(found)
+            # Use the family name stored in the font file itself.
+            rcParams['font.family'] = fm.FontProperties(fname=found).get_name()
+            return
+    except Exception:
+        # Best effort only: fall through to the generic family below.
+        pass
+    rcParams['font.family'] = 'sans-serif'
+def load_aia_image_at_time(aia_path: Optional[Path], timestamp: str) -> Optional[np.ndarray]:
+    """Load ``<timestamp>.npy`` and return its first three channels as RGB.
+
+    The file is looked up in *aia_path* itself and then in its ``test``,
+    ``train`` and ``val`` subdirectories (when present). Each of the first
+    three channels is min-max scaled to [0, 1] independently; a channel with
+    no dynamic range is rendered as zeros rather than copied through
+    un-normalised. Per the original description, channels 0, 1, 2 correspond
+    to 94, 131, 171 Å.
+
+    Returns an ``(H, W, 3)`` float array, or ``None`` when *aia_path* is
+    missing or no readable array with at least three channels is found.
+    """
+    if aia_path is None or not aia_path.exists():
+        return None
+    search_dirs = [aia_path] + [aia_path / s for s in ('test', 'train', 'val') if (aia_path / s).exists()]
+    for d in search_dirs:
+        fp = d / f"{timestamp}.npy"
+        if not fp.exists():
+            continue
+        try:
+            data = np.load(fp)           # expected (channels, H, W)
+            if data.ndim != 3 or data.shape[0] < 3:
+                continue
+            rgb = np.zeros((data.shape[1], data.shape[2], 3))
+            for i in range(3):
+                ch = data[i]
+                lo = ch.min()
+                span = ch.max() - lo
+                if span > 0:
+                    rgb[..., i] = (ch - lo) / span
+                # else: flat (or NaN-ranged) channel stays at zero
+            return rgb
+        except Exception:
+            # Unreadable or malformed file: try the next candidate directory.
+            continue
+    return None
+# =============================================================================
+# Region Detection & Tracking
+# =============================================================================
+class FluxContributionAnalyzer:
+    """Detects and tracks active regions from per-patch flux contribution maps."""
+    def __init__(self, config: FlareAnalysisConfig, output_dir: Optional[Path] = None):
+        """Store settings and, if configured, load the predictions table.
+
+        When ``config.predictions_csv`` is set, the CSV is read, a parsed
+        ``datetime`` column is added from ``timestamp``, rows are sorted
+        chronologically and (only if both bounds are given) restricted to
+        the inclusive [start_time, end_time] window. Otherwise
+        ``predictions_df`` is an empty DataFrame.
+        """
+        self.config = config
+        self.output_dir = output_dir
+        self.flux_path = Path(config.flux_path) if config.flux_path else None
+        self.aia_path  = Path(config.aia_path)  if config.aia_path  else None
+        self.grid_size  = config.grid_size
+        self.patch_size = config.patch_size
+        self.input_size = config.input_size
+        # timestamp -> label map, filled in by region tracking
+        self.region_labels_cache: Dict[str, np.ndarray] = {}
+        if not config.predictions_csv:
+            self.predictions_df = pd.DataFrame()
+            return
+        table = pd.read_csv(config.predictions_csv)
+        table['datetime'] = pd.to_datetime(table['timestamp'])
+        table = table.sort_values('datetime')
+        if config.start_time and config.end_time:
+            window_start = pd.to_datetime(config.start_time)
+            window_end = pd.to_datetime(config.end_time)
+            in_window = (table['datetime'] >= window_start) & (table['datetime'] <= window_end)
+            table = table[in_window].reset_index(drop=True)
+        self.predictions_df = table
+        print(f"Loaded {len(table)} predictions "
+              f"({table['datetime'].min()} → {table['datetime'].max()})")
+    # ------------------------------------------------------------------
+    # Data loading
+    # ------------------------------------------------------------------
+    def load_flux_contributions(self, timestamp: str) -> Optional[np.ndarray]:
+        """Return the array stored in ``<flux_path>/<timestamp>.npy``.
+
+        Gives ``None`` when no flux directory is configured or the file
+        does not exist.
+        """
+        if self.flux_path is None:
+            return None
+        candidate = self.flux_path / f"{timestamp}.npy"
+        if not candidate.exists():
+            return None
+        return np.load(candidate)
+    # ------------------------------------------------------------------
+    # Peak detection
+    # ------------------------------------------------------------------
+    def _find_flux_peaks_single_scale(self, flux: np.ndarray, size: int) -> Tuple[List, List]:
+        """Find local maxima of *flux* within a ``size``-wide neighbourhood.
+
+        Only finite, strictly positive cells can be peaks. Returns
+        ``(coords, fluxes)`` where ``coords`` is a list of ``(row, col)``
+        tuples and ``fluxes`` the matching values as Python floats.
+        """
+        usable = np.isfinite(flux) & (flux > 0)
+        # Unusable cells become -inf so they can never win the maximum filter.
+        surface = np.where(usable, flux, -np.inf)
+        is_peak = usable & (maximum_filter(surface, size=size) == surface)
+        peak_rows, peak_cols = np.nonzero(is_peak)
+        coords = [(int(r), int(c)) for r, c in zip(peak_rows, peak_cols)]
+        fluxes = [float(flux[r, c]) for r, c in coords]
+        return coords, fluxes
+    def _find_flux_peaks_multiscale(self, flux: np.ndarray) -> Tuple[List, List]:
+        """Keep peaks that recur across several neighbourhood sizes.
+
+        Peaks are detected once per size in ``config.peak_neighborhood_sizes``.
+        A detection within ``peak_scale_tolerance`` cells (per axis) of an
+        already registered peak counts as the same peak; the strongest
+        location seen is remembered. Peaks confirmed at fewer than
+        ``peak_min_scale_agreement`` scales are discarded. Survivors are
+        returned strongest-first and, when ``min_peak_distance`` > 0, thinned
+        with :meth:`_merge_close_peaks`.
+        """
+        cfg = self.config
+        tol = cfg.peak_scale_tolerance
+        # Keyed by the first-seen coordinate of each peak.
+        registry: Dict[Tuple, dict] = {}
+        for size in cfg.peak_neighborhood_sizes:
+            coords, fluxes = self._find_flux_peaks_single_scale(flux, size)
+            for (y, x), fv in zip(coords, fluxes):
+                anchor = None
+                for (py, px) in registry:
+                    if abs(y - py) <= tol and abs(x - px) <= tol:
+                        anchor = (py, px)
+                        break
+                if anchor is None:
+                    registry[(y, x)] = {'count': 1, 'best_flux': fv, 'best_coord': (y, x)}
+                    continue
+                entry = registry[anchor]
+                entry['count'] += 1
+                if fv > entry['best_flux']:
+                    entry['best_flux'] = fv
+                    entry['best_coord'] = (y, x)
+        confirmed = [(entry['best_coord'], entry['best_flux'])
+                     for entry in registry.values()
+                     if entry['count'] >= cfg.peak_min_scale_agreement]
+        if not confirmed:
+            return [], []
+        confirmed = sorted(confirmed, key=lambda item: item[1], reverse=True)
+        coords = [coord for coord, _ in confirmed]
+        fluxes = [value for _, value in confirmed]
+        if cfg.min_peak_distance > 0 and len(coords) > 1:
+            coords, fluxes = self._merge_close_peaks(coords, fluxes, cfg.min_peak_distance)
+        return coords, fluxes
+    def _merge_close_peaks(self, coords, fluxes, min_dist):
+        """Greedily drop peaks closer than *min_dist* to a stronger peak.
+
+        Candidates are visited strongest-first; one is kept only if its
+        Euclidean distance to every already-kept peak is at least
+        *min_dist*. The survivors are returned in their original input order
+        as ``(coords, fluxes)``.
+        """
+        survivors = []
+        for cand in np.argsort(fluxes)[::-1]:
+            cy, cx = coords[cand]
+            far_enough = all(
+                np.hypot(cy - coords[k][0], cx - coords[k][1]) >= min_dist
+                for k in survivors
+            )
+            if far_enough:
+                survivors.append(cand)
+        survivors.sort()
+        return [coords[k] for k in survivors], [fluxes[k] for k in survivors]
+    # ------------------------------------------------------------------
+    # Region segmentation (radial flood-fill from peaks)
+    # ------------------------------------------------------------------
+    def _detect_regions_with_peak_clustering(
+        self, flux_contrib: np.ndarray, pred_data: pd.Series
+    ) -> Tuple[List[Dict], Optional[np.ndarray], str]:
+        """Segment one flux map into regions grown outward from flux peaks.
+
+        Steps: (1) derive an adaptive threshold from the log-flux statistics,
+        (2) zero everything at or below it and optionally Gaussian-smooth,
+        (3) find multi-scale peaks on that map, (4) grow a label from every
+        peak over 8-connected cells above a percentile-based growth
+        threshold, (5) summarise each labelled region.
+
+        Args:
+            flux_contrib: 2-D flux map; non-finite and non-positive cells are
+                ignored when computing statistics.
+            pred_data: prediction row for this timestamp. It is not read
+                anywhere in this method.
+
+        Returns:
+            ``(regions, labels, reason)``: a list of region dicts, the int32
+            label map (0 = unlabelled, k = region grown from peak k-1), and a
+            human-readable status string. On early exit the list is empty and
+            ``labels`` is ``None``.
+        """
+        cfg = self.config
+        valid = flux_contrib[np.isfinite(flux_contrib) & (flux_contrib > 0)]
+        if valid.size == 0:
+            return [], None, "no_valid_flux"
+        total_flux = float(flux_contrib[flux_contrib > 0].sum())
+        # Threshold = exp(median + k * std) of log-flux, floored at the
+        # configured minimum flux.
+        log_flux = np.log(valid)
+        threshold = max(
+            np.exp(np.median(log_flux) + cfg.threshold_std_multiplier * np.std(log_flux)),
+            cfg.min_flux_threshold,
+        )
+        above = int((flux_contrib > threshold).sum())
+        masked = np.where(flux_contrib > threshold, flux_contrib, 0.0)
+        if above == 0:
+            return [], None, f"all_below_threshold(thr={threshold:.3e} total={total_flux:.3e})"
+        # Smoothing happens after thresholding, so all later flux figures
+        # (peaks, sums, maxima) refer to the smoothed, thresholded map.
+        if cfg.spatial_smoothing_sigma > 0:
+            masked = gaussian_filter(masked, sigma=cfg.spatial_smoothing_sigma)
+        peak_coords, peak_fluxes = self._find_flux_peaks_multiscale(masked)
+        if not peak_coords:
+            return [], None, f"no_peaks(thr={threshold:.3e} above={above} total={total_flux:.3e})"
+        # Radial flood-fill from all peaks simultaneously (Dijkstra-style)
+        labels = np.zeros_like(masked, dtype=np.int32)
+        valid_vals = masked[(masked > 0) & np.isfinite(masked)]
+        # Cells must exceed this percentile of the positive map to be absorbed.
+        growth_threshold = np.percentile(valid_vals, cfg.radial_expansion_threshold_percentile) if valid_vals.size else 0
+        # Heap entries: (distance from seed peak, tie-break counter, y, x,
+        # label, seed_y, seed_x). The counter keeps ordering deterministic
+        # when distances tie.
+        pq, counter = [], 0
+        for idx, ((py, px), _) in enumerate(zip(peak_coords, peak_fluxes)):
+            labels[py, px] = idx + 1
+            heappush(pq, (0.0, counter, py, px, idx + 1, py, px))
+            counter += 1
+        neighbors = [(-1, 0), (1, 0), (0, -1), (0, 1), (-1, -1), (-1, 1), (1, -1), (1, 1)]
+        H, W = masked.shape
+        while pq:
+            dist, _, y, x, label, py, px = heappop(pq)
+            for dy, dx in neighbors:
+                ny, nx = y + dy, x + dx
+                if 0 <= ny < H and 0 <= nx < W and labels[ny, nx] == 0 and masked[ny, nx] > growth_threshold:
+                    # A cell is claimed when it is pushed, not when popped:
+                    # the first region to reach it keeps it.
+                    labels[ny, nx] = label
+                    # Priority is straight-line distance back to the seed peak.
+                    new_dist = np.hypot(ny - py, nx - px)
+                    heappush(pq, (new_dist, counter, ny, nx, label, py, px))
+                    counter += 1
+        regions = []
+        skipped_below_min = 0
+        for lid in range(1, len(peak_coords) + 1):
+            mask = labels == lid
+            ys, xs = np.where(mask)
+            if ys.size == 0:
+                continue
+            fv = masked[mask]
+            total = float(fv.sum())
+            # Regions whose summed flux is below the minimum are dropped (and
+            # counted in the status string).
+            if total < cfg.min_flux_threshold:
+                skipped_below_min += 1
+                continue
+            cy, cx = float(ys.mean()), float(xs.mean())
+            peak_y, peak_x = peak_coords[lid - 1]
+            # '*_img_*' values convert patch indices to image pixels at the
+            # patch centre: index * patch_size + patch_size // 2.
+            regions.append({
+                'id': len(regions) + 1,
+                'region_label': lid,
+                'size': int(ys.size),
+                'sum_flux': total,
+                'max_flux': float(fv.max()),
+                'centroid_patch_y': cy,
+                'centroid_patch_x': cx,
+                'centroid_img_y': cy * self.patch_size + self.patch_size // 2,
+                'centroid_img_x': cx * self.patch_size + self.patch_size // 2,
+                'peak_y': peak_y,
+                'peak_x': peak_x,
+                'peak_img_y': peak_y * self.patch_size + self.patch_size // 2,
+                'peak_img_x': peak_x * self.patch_size + self.patch_size // 2,
+                'peak_flux': peak_fluxes[lid - 1],
+                'mask': mask,
+            })
+        n_peaks = len(peak_coords)
+        reason = (f"ok: {len(regions)} regions from {n_peaks} peaks"
+                  f"  thr={threshold:.3e}  above={above}  total={total_flux:.3e}"
+                  + (f"  skipped={skipped_below_min}_below_min_flux" if skipped_below_min else ""))
+        return regions, labels, reason
+    def _detect_regions_worker(self, timestamp: str) -> Tuple[str, Optional[List], Optional[np.ndarray], str]:
+        """Run region detection for one timestamp without ever raising.
+
+        Returns ``(timestamp, regions, labels, reason)``. ``regions`` and
+        ``labels`` are ``None`` when the flux file or prediction row is
+        missing, or when detection raised; ``reason`` says which. The label
+        map is downcast to int16 before being returned.
+        """
+        try:
+            flux_map = self.load_flux_contributions(timestamp)
+            if flux_map is None:
+                return timestamp, None, None, "no_flux_file"
+            rows = self.predictions_df[self.predictions_df['timestamp'] == timestamp]
+            if rows.empty:
+                return timestamp, None, None, "no_prediction_row"
+            regions, labels, reason = self._detect_regions_with_peak_clustering(flux_map, rows.iloc[0])
+            compact_labels = None if labels is None else labels.astype(np.int16)
+            return timestamp, regions, compact_labels, reason
+        except Exception as e:
+            # Report the failure through the reason string so one bad frame
+            # does not abort the whole batch.
+            return timestamp, None, None, f"exception: {e}"
+    # ------------------------------------------------------------------
+    # Tracking
+    # ------------------------------------------------------------------
+    def track_regions_over_time(self, timestamps: List[str]) -> Dict:
+        cfg = self.config
+        print("Detecting regions (parallel)…")
+        n_workers = max(1, min((os.cpu_count() or 1) - 1, len(timestamps)))
+        all_regions: Dict[str, List] = {}
+        detection_reasons: Dict[str, str] = {}
+        with Pool(processes=n_workers) as pool:
+            for ts, regions, labels, reason in tqdm(
+                pool.imap(self._detect_regions_worker, timestamps),
+                total=len(timestamps), desc="Detecting regions"
+            ):
+                detection_reasons[ts] = reason
+                if regions is not None:
+                    all_regions[ts] = regions
+                if labels is not None:
+                    self.region_labels_cache[ts] = labels
+        print("Tracking regions across time…")
+        print(f"  max_tracking_distance={cfg.max_tracking_distance}  "
+              f"max_gap_frames={cfg.max_gap_frames}  "
+              f"age_bonus_weight={cfg.age_bonus_weight}  "
+              f"distance_weight={cfg.distance_weight}")
+        tracks: Dict[int, List] = {}
+        next_id = 1
+        last_seen: Dict[int, int] = {}  # track_id → frame index when last matched
+        _debug_log: List[str] = []  # per-frame tracking log
+        for frame_idx, ts in enumerate(tqdm(timestamps, desc="Tracking")):
+            # Expire tracks that haven't been seen within max_gap_frames
+            active = {tid for tid, fi in last_seen.items()
+                      if frame_idx - fi <= cfg.max_gap_frames}
+            if ts not in all_regions:
+                det_reason = detection_reasons.get(ts, "unknown")
+                _debug_log.append(f"{ts}  SKIP    {det_reason}")
+                continue
+            current_regions = all_regions[ts]
+            # Build all valid (score, region_idx, track_id) candidates
+            candidates = []
+            for ri, region in enumerate(current_regions):
+                cur_flux = region.get('sum_flux', 0.0)
+                cur_size = region.get('size', 1)
+                for tid in active:
+                    history = tracks[tid]
+                    # Smooth position over last few frames to reduce centroid jitter.
+                    # Use PATCH coordinates so max_tracking_distance is in patch units (matching config).
+                    n_smooth = min(5, len(history))
+                    avg_x = np.mean([h[1]['centroid_patch_x'] for h in history[-n_smooth:]])
+                    avg_y = np.mean([h[1]['centroid_patch_y'] for h in history[-n_smooth:]])
+                    dist = np.hypot(
+                        region['centroid_patch_x'] - avg_x,
+                        region['centroid_patch_y'] - avg_y,
+                    )
+                    _, last = history[-1]
+                    if dist >= cfg.max_tracking_distance:
+                        continue
+                    lf = last.get('sum_flux', 1e-15)
+                    ls = last.get('size', 1)
+                    flux_ratio = max(cur_flux, lf) / max(min(cur_flux, lf), 1e-15)
+                    size_ratio = max(cur_size, ls) / max(min(cur_size, ls), 1)
+                    track_age = len(tracks[tid])
+                    # Discount grows with age: 0 (new) → age_bonus_weight (very old)
+                    # Makes established tracks harder to beat at equal distance
+                    age_discount = cfg.age_bonus_weight * track_age / (1.0 + track_age)
+                    score = (cfg.distance_weight * dist
+                             + cfg.flux_ratio_weight * flux_ratio
+                             + cfg.size_ratio_weight * size_ratio
+                             - age_discount)
+                    candidates.append((score, ri, tid))
+            # Greedy one-to-one assignment: best scores first, each region/track used once
+            candidates.sort()
+            assigned_regions: set = set()
+            assigned_tracks:  set = set()
+            assignments: Dict[int, int] = {}   # region_idx → track_id
+            for score, ri, tid in candidates:
+                if ri in assigned_regions or tid in assigned_tracks:
+                    continue
+                assignments[ri] = tid
+                assigned_regions.add(ri)
+                assigned_tracks.add(tid)
+            # Log detection outcome for this frame
+            det_reason = detection_reasons.get(ts, "unknown")
+            _debug_log.append(f"{ts}  DETECT  {det_reason}")
+            # Log active-but-unmatched tracks (gaps)
+            for tid in active:
+                if tid not in assigned_tracks:
+                    gap = frame_idx - last_seen.get(tid, frame_idx)
+                    cx = tracks[tid][-1][1]['centroid_patch_x']
+                    cy = tracks[tid][-1][1]['centroid_patch_y']
+                    _debug_log.append(
+                        f"{ts}  GAP     track={tid:3d}  age={len(tracks[tid]):4d}  "
+                        f"gap_frames={gap:2d}  last_patch=({cx:.1f},{cy:.1f})"
+                    )
+            # Apply assignments; spawn new track for unmatched regions
+            for ri, region in enumerate(current_regions):
+                r = region.copy()
+                r['timestamp'] = ts
+                if ri in assignments:
+                    tid = assignments[ri]
+                    r['id'] = tid
+                    tracks[tid].append((ts, r))
+                    cx, cy = r['centroid_patch_x'], r['centroid_patch_y']
+                    _debug_log.append(
+                        f"{ts}  MATCH   track={tid:3d}  age={len(tracks[tid]):4d}  "
+                        f"patch=({cx:.1f},{cy:.1f})  flux={r.get('sum_flux', 0):.3e}"
+                    )
+                else:
+                    r['id'] = next_id
+                    tracks[next_id] = [(ts, r)]
+                    cx, cy = r['centroid_patch_x'], r['centroid_patch_y']
+                    _debug_log.append(
+                        f"{ts}  NEW     track={next_id:3d}  age=   1  "
+                        f"patch=({cx:.1f},{cy:.1f})  flux={r.get('sum_flux', 0):.3e}"
+                    )
+                    next_id += 1
+                    tid = r['id']
+                last_seen[tid] = frame_idx
+        tracks = {k: v for k, v in tracks.items() if v}
+        print(f"Found {len(tracks)} region tracks across {len(timestamps)} timestamps")
+        if self.output_dir and _debug_log:
+            log_path = Path(self.output_dir) / "tracking_debug.log"
+            with open(log_path, 'w') as f:
+                f.write(f"# Tracking log — {len(tracks)} tracks, {len(timestamps)} timestamps\n")
+                f.write(f"# max_tracking_distance={cfg.max_tracking_distance}  "
+                        f"max_gap_frames={cfg.max_gap_frames}  "
+                        f"age_bonus_weight={cfg.age_bonus_weight}\n")
+                f.write("#\n# timestamp               event   track  age   detail\n")
+                f.write('\n'.join(_debug_log))
+            print(f"Tracking debug log → {log_path}")
+        return tracks
+    def detect_flare_events(self, timestamps: Optional[List[str]] = None) -> pd.DataFrame:
+        """Run detection + tracking and return a per-timestamp events DataFrame."""
+        if timestamps is None:
+            timestamps = self.predictions_df['timestamp'].tolist()
+        tracks = self.track_regions_over_time(timestamps)
+        rows = []
+        for track_id, history in tracks.items():
+            for ts, r in history:
+                pred = self.predictions_df[self.predictions_df['timestamp'] == ts]
+                if pred.empty:
+                    continue
+                pred = pred.iloc[0]
+                rows.append({
+                    'timestamp': ts,
+                    'datetime': pred['datetime'],
+                    'prediction': pred['predictions'],
+                    'groundtruth': pred.get('groundtruth', None),
+                    'region_size': r.get('size', 0),
+                    'sum_flux': r.get('sum_flux', 0.0),
+                    'max_flux': r.get('max_flux', 0.0),
+                    'mean_flux': r.get('sum_flux', 0.0) / max(r.get('size', 1), 1),
+                    'centroid_patch_y': r.get('centroid_patch_y', 0.0),
+                    'centroid_patch_x': r.get('centroid_patch_x', 0.0),
+                    'centroid_img_y': r.get('centroid_img_y', 0.0),
+                    'centroid_img_x': r.get('centroid_img_x', 0.0),
+                    'peak_img_y': r.get('peak_img_y', None),
+                    'peak_img_x': r.get('peak_img_x', None),
+                    'region_label': r.get('region_label', None),
+                    'track_id': track_id,
+                })
+        print(f"Recorded {len(rows)} events from {len(tracks)} tracks")
+        return pd.DataFrame(rows) if rows else pd.DataFrame()
+# =============================================================================
+# Frame Generation
+# =============================================================================
+# Colours cycled across FOXES tracks.
+# Twenty hex colours; the movie code indexes this list modulo its length, so
+# tracks beyond the twentieth reuse colours from the start, and the first
+# entry doubles as the fallback for a track without an assigned colour.
+_TRACK_COLORS = [
+    '#E6194B', '#3CB44B', '#FFE119', '#4363D8', '#F58231',
+    '#911EB4', '#42D4F4', '#F032E6', '#BFEF45', '#FABED4',
+    '#469990', '#DCBEFF', '#9A6324', '#FFFAC8', '#800000',
+    '#AAFFC3', '#808000', '#FFD8B1', '#000075', '#A9A9A9',
+]
+def _generate_single_frame(args: Tuple) -> Optional[str]:
+    """Render one movie frame and save it to disk. Designed for multiprocessing.
+
+    The frame has two panels: the AIA image with region contours and track
+    markers on the left, and a flux time series (ground truth, prediction and
+    per-track summed flux) on the right, limited to a window of
+    ``plot_window_hours`` centred on the frame's timestamp.
+
+    Args:
+        args: ``(frame_idx, timestamp, fd)`` where ``fd`` is a dict with the
+            keys ``'flare_events_df'``, ``'predictions_df'``,
+            ``'region_labels_cache'``, ``'config'``, ``'track_color_map'``,
+            ``'plot_window_hours'``, ``'aia_path'`` and ``'frames_dir'``.
+
+    Returns:
+        Path of the written frame as a string, or ``None`` if rendering raised
+        (the error is printed and all open figures are closed).
+    """
+    setup_barlow_font()
+    frame_idx, timestamp, fd = args
+    try:
+        flare_events_df    = fd['flare_events_df']
+        predictions_df     = fd['predictions_df']
+        region_labels_cache = fd['region_labels_cache']
+        config             = fd['config']
+        track_color_map    = fd['track_color_map']
+        plot_window_hours  = fd['plot_window_hours']
+        aia_path           = fd['aia_path']
+        frames_dir         = Path(fd['frames_dir'])
+        # Time-series window: plot_window_hours centred on the current frame.
+        current_time  = pd.to_datetime(timestamp)
+        window_start  = current_time - pd.Timedelta(hours=plot_window_hours / 2)
+        window_end    = current_time + pd.Timedelta(hours=plot_window_hours / 2)
+        # ── Figure: AIA (left) + SXR timeseries (right) ─────────────────────
+        fig = plt.figure(figsize=(14, 7))
+        gs  = fig.add_gridspec(1, 2, width_ratios=[1, 1], wspace=0.3,
+                               left=0.07, right=0.97, top=0.93, bottom=0.10)
+        ax_aia = fig.add_subplot(gs[0])
+        ax_sxr = fig.add_subplot(gs[1])
+        # ── AIA image ────────────────────────────────────────────────────────
+        aia_image = load_aia_image_at_time(Path(aia_path), timestamp) if aia_path else None
+        if aia_image is not None:
+            ax_aia.imshow(aia_image, origin='lower', aspect='equal', alpha=0.9)
+        else:
+            # No AIA image available: a black 512×512 placeholder keeps the layout.
+            ax_aia.imshow(np.zeros((512, 512, 3)), origin='lower', aspect='equal')
+        ax_aia.set_title(f'{current_time.strftime("%Y-%m-%d %H:%M:%S")}', fontsize=11)
+        ax_aia.set_xlabel('X (pixels)', fontsize=9)
+        ax_aia.set_ylabel('Y (pixels)', fontsize=9)
+        # ── Region contours + FOXES markers ──────────────────────────────────
+        region_labels = region_labels_cache.get(timestamp)
+        current_events = (
+            flare_events_df[flare_events_df['timestamp'] == timestamp].copy()
+            if not flare_events_df.empty and 'timestamp' in flare_events_df.columns
+            else pd.DataFrame()
+        )
+        # Draw each track at most once per frame.
+        plotted_tracks: set = set()
+        for _, ev in current_events.iterrows():
+            tid = ev['track_id']
+            if tid in plotted_tracks:
+                continue
+            plotted_tracks.add(tid)
+            cx, cy = ev.get('centroid_img_x'), ev.get('centroid_img_y')
+            # Skip events with a missing centroid or one outside the 0–512 pixel extent.
+            if pd.isna(cx) or pd.isna(cy) or not (0 <= cx <= 512) or not (0 <= cy <= 512):
+                continue
+            # Marker goes on the peak position, falling back to the centroid.
+            px = ev.get('peak_img_x') if pd.notna(ev.get('peak_img_x')) else cx
+            py = ev.get('peak_img_y') if pd.notna(ev.get('peak_img_y')) else cy
+            color = track_color_map.get(tid, _TRACK_COLORS[0])
+            cur_flux  = ev.get('sum_flux', 0.0)
+            # "Active" here means the region's summed flux reaches the configured minimum.
+            is_active = cur_flux >= config.min_flux_threshold
+            # Contour
+            rl = ev.get('region_label')
+            if region_labels is not None and pd.notna(rl) and int(rl) > 0:
+                region_mask = region_labels == int(rl)
+                if np.any(region_mask):
+                    try:
+                        # Upsample 64×64 mask to 512×512 for crisp contours on AIA image
+                        scale = 512 // region_labels.shape[0]
+                        mask_up = region_mask.repeat(scale, axis=0).repeat(scale, axis=1).astype(float)
+                        ax_aia.contour(mask_up, levels=[0.5],
+                                       colors=color, linewidths=4.0 if is_active else 2.5,
+                                       alpha=0.9, extent=[0, 512, 0, 512])
+                    except Exception:
+                        # NOTE(review): contour errors are swallowed silently — the
+                        # overlay is best-effort and the frame is still rendered.
+                        pass
+            # Marker
+            if is_active:
+                # Active regions: star marker plus a GOES-class label.
+                ax_aia.plot(px, py, '*', markersize=15, color=color,
+                            markeredgecolor='black', markeredgewidth=2, alpha=0.7, zorder=15)
+                ax_aia.annotate(f'FOXES: {flux_to_goes_class(cur_flux)}', (px, py),
+                                xytext=(15, 15), textcoords='offset points', fontsize=11,
+                                color='black', weight='bold',
+                                bbox=dict(boxstyle='round,pad=0.3', facecolor=color,
+                                          alpha=0.95, edgecolor='black', linewidth=2))
+            else:
+                # Regions below the threshold: plain circle, no label.
+                ax_aia.plot(px, py, 'o', markersize=10, color=color,
+                            markeredgecolor='white', markeredgewidth=1.5, alpha=0.8, zorder=12)
+        # ── SXR timeseries ───────────────────────────────────────────────────
+        if predictions_df is not None and not predictions_df.empty:
+            in_win = predictions_df[
+                (predictions_df['datetime'] >= window_start) &
+                (predictions_df['datetime'] <= window_end)
+            ]
+            if not in_win.empty:
+                if 'groundtruth' in in_win.columns:
+                    ax_sxr.plot(in_win['datetime'], in_win['groundtruth'],
+                                'b-', linewidth=1.5, alpha=0.8, label='GOES (Truth)')
+                if 'predictions' in in_win.columns:
+                    ax_sxr.plot(in_win['datetime'], in_win['predictions'],
+                                'r--', linewidth=1.5, alpha=0.8, label='FOXES')
+        # Track fluxes
+        all_tracks_in_win = (
+            flare_events_df[
+                (flare_events_df['datetime'] >= window_start) &
+                (flare_events_df['datetime'] <= window_end)
+            ] if not flare_events_df.empty else pd.DataFrame()
+        )
+        # Only the first below-threshold track contributes a legend entry.
+        first_other = True
+        for tid, tdata in (all_tracks_in_win.groupby('track_id') if not all_tracks_in_win.empty else []):
+            tdata = tdata.sort_values('datetime')
+            color = track_color_map.get(tid, _TRACK_COLORS[0])
+            # A track is highlighted if it reaches the threshold anywhere in the window.
+            is_active = tdata['sum_flux'].max() >= config.min_flux_threshold
+            if is_active:
+                ax_sxr.plot(tdata['datetime'], tdata['sum_flux'],
+                            color=color, linewidth=2.5, alpha=0.9, label=f'Track {tid}', zorder=4)
+            else:
+                label = 'Other tracks' if first_other else None
+                ax_sxr.plot(tdata['datetime'], tdata['sum_flux'],
+                            color=color, linewidth=0.9, alpha=0.35, label=label, zorder=3)
+                first_other = False
+        # Vertical line marks the time of the current frame.
+        ax_sxr.axvline(current_time, color='#E5446D', linewidth=2, alpha=0.8, zorder=10)
+        ax_sxr.set_xlim(window_start, window_end)
+        ax_sxr.set_yscale('log')
+        ax_sxr.set_ylabel('Flux (W/m²)', fontsize=9)
+        ax_sxr.set_xlabel('Time (UTC)', fontsize=9)
+        ax_sxr.xaxis.set_major_formatter(mdates.DateFormatter('%H:%M'))
+        ax_sxr.xaxis.set_major_locator(mdates.HourLocator(interval=1))
+        plt.setp(ax_sxr.xaxis.get_majorticklabels(), rotation=0)
+        ax_sxr.legend(loc='lower right', fontsize=8, framealpha=1)
+        ax_sxr.grid(True, alpha=0.3)
+        plt.tight_layout()
+        # Output format/DPI come from the config, defaulting to JPEG at 75 dpi;
+        # anything other than jpg/jpeg is written as PNG.
+        fmt = getattr(config, 'movie_frame_format', 'jpg').lower()
+        dpi = getattr(config, 'movie_dpi', 75.0)
+        ext = 'jpg' if fmt in ('jpg', 'jpeg') else 'png'
+        frame_path = frames_dir / f"frame_{frame_idx:06d}.{ext}"
+        plt.savefig(frame_path, dpi=dpi, format=ext)
+        plt.close()
+        return str(frame_path)
+    except Exception as e:
+        # Close every figure so a failed frame does not leak memory in the worker.
+        plt.close('all')
+        print(f"Error creating frame {frame_idx} ({timestamp}): {e}")
+        return None
+# =============================================================================
+# Movie Assembly
+# =============================================================================
+def create_flare_movie(
+    flare_events_df: pd.DataFrame,
+    output_dir: Path,
+    config: FlareAnalysisConfig,
+    predictions_csv: Optional[str] = None,
+    analyzer: Optional[FluxContributionAnalyzer] = None,
+    fps: float = 2.0,
+    frame_interval_minutes: float = 1.0,
+    num_workers: int = 4,
+) -> Optional[str]:
+    """Generate per-timestamp frames and stitch into an MP4."""
+    setup_barlow_font()
+    if flare_events_df.empty:
+        print("No flare data — skipping movie.")
+        return None
+    output_dir = Path(output_dir)
+    movie_dir  = output_dir / "movies"
+    movie_dir.mkdir(parents=True, exist_ok=True)
+    # Load predictions for timeseries
+    predictions_df = None
+    if predictions_csv and Path(predictions_csv).exists():
+        predictions_df = pd.read_csv(predictions_csv)
+        dt_col = 'datetime' if 'datetime' in predictions_df.columns else 'timestamp'
+        predictions_df['datetime'] = pd.to_datetime(predictions_df[dt_col])
+    flare_events_df = flare_events_df.copy()
+    flare_events_df['datetime'] = pd.to_datetime(flare_events_df['datetime'])
+    all_timestamps = sorted(flare_events_df['timestamp'].unique())
+    # Subsample by frame_interval_minutes
+    timestamps_to_use, last_dt = [], None
+    for ts in all_timestamps:
+        dt = pd.to_datetime(ts)
+        if last_dt is None or (dt - last_dt).total_seconds() >= frame_interval_minutes * 60:
+            timestamps_to_use.append(ts)
+            last_dt = dt
+    print(f"Creating movie: {len(timestamps_to_use)} frames @ {fps} fps")
+    # Assign consistent colours to tracks
+    unique_tracks = flare_events_df['track_id'].unique()
+    track_color_map = {tid: _TRACK_COLORS[i % len(_TRACK_COLORS)] for i, tid in enumerate(unique_tracks)}
+    frames_dir = movie_dir / "frames_temp"
+    frames_dir.mkdir(exist_ok=True)
+    frame_data = {
+        'flare_events_df':     flare_events_df,
+        'predictions_df':      predictions_df,
+        'frames_dir':          str(frames_dir),
+        'region_labels_cache': analyzer.region_labels_cache if analyzer else {},
+        'config':              config,
+        'track_color_map':     track_color_map,
+        'plot_window_hours':   config.plot_window_hours,
+        'aia_path':            config.aia_path,
+    }
+    frame_args = [(i, ts, frame_data) for i, ts in enumerate(timestamps_to_use)]
+    if num_workers > 1:
+        with Pool(processes=num_workers) as pool:
+            results = list(tqdm(pool.imap(_generate_single_frame, frame_args),
+                                total=len(frame_args), desc="Generating frames"))
+    else:
+        results = [_generate_single_frame(a) for a in tqdm(frame_args, desc="Generating frames")]
+    frame_paths = sorted(
+        (Path(p) for p in results if p is not None),
+        key=lambda p: p.name
+    )
+    if not frame_paths:
+        print("No frames generated.")
+        return None
+    # Stitch into MP4 via imageio (reads frames as RGB → passes to ffmpeg correctly)
+    datetimes  = [pd.to_datetime(ts) for ts in timestamps_to_use]
+    movie_name = (f"flare_movie_{datetimes[0].strftime('%Y%m%d')}"
+                  f"_{datetimes[-1].strftime('%Y%m%d')}.mp4")
+    movie_path = movie_dir / movie_name
+    # Read first frame to get dimensions
+    first_frame = imageio.imread(str(frame_paths[0]))
+    h, w = first_frame.shape[:2]
+    # yuv420p requires even dimensions
+    w = w if w % 2 == 0 else w - 1
+    h = h if h % 2 == 0 else h - 1
+    t0 = time.time()
+    writer = imageio_ffmpeg.write_frames(
+        str(movie_path),
+        size=(w, h),
+        fps=fps,
+        codec='libx264',
+        pix_fmt_in='rgb24',
+        pix_fmt_out='yuv420p',
+        output_params=['-preset', 'veryfast', '-crf', '25', '-movflags', '+faststart'],
+    )
+    writer.send(None)  # initialise
+    for fp in tqdm(frame_paths, desc="Writing movie"):
+        if fp.exists():
+            frame = imageio.imread(str(fp))
+            writer.send(frame[:h, :w].tobytes())
+    writer.close()
+    print(f"Movie saved → {movie_path}  ({time.time() - t0:.1f}s)")
+    print(f"Frames kept → {frames_dir}")
+    return str(movie_path)
+# =============================================================================
+# Entry point
+# =============================================================================
+def main() -> None:
+    parser = argparse.ArgumentParser(description="Flare Analysis — Frame & Movie Generator")
+    parser.add_argument("--config", required=True, help="Path to YAML config file")
+    args = parser.parse_args()
+    config = FlareAnalysisConfig.from_yaml(args.config)
+    run_ts    = datetime.now().strftime("%Y%m%d_%H%M%S")
+    out_dir   = Path(config.output_dir or '.') / f"run_{run_ts}"
+    out_dir.mkdir(parents=True, exist_ok=True)
+    print(f"Output: {out_dir}")
+    analyzer        = FluxContributionAnalyzer(config, output_dir=out_dir)
+    flare_events_df = analyzer.detect_flare_events()
+    if not flare_events_df.empty:
+        flare_events_df.to_csv(out_dir / "flare_events.csv", index=False)
+        print(f"Saved {len(flare_events_df)} events → {out_dir / 'flare_events.csv'}")
+    if config.create_movie:
+        create_flare_movie(
+            flare_events_df  = flare_events_df,
+            output_dir       = out_dir,
+            config           = config,
+            predictions_csv  = config.predictions_csv,
+            analyzer         = analyzer,
+            fps              = config.movie_fps,
+            frame_interval_minutes = config.movie_frame_interval_minutes,
+            num_workers      = config.movie_num_workers,
+        )
+    print(f"\nDone. Results in {out_dir}")
+if __name__ == "__main__":
+    main()

analysis/flux_map_config.yaml ADDED Viewed

	@@ -0,0 +1,67 @@

+# =============================================================================
+# Flare Analysis Configuration
+# =============================================================================
+# Usage: python analysis/flux_map_analysis.py --config analysis/flux_map_config.yaml
+# =============================================================================
+# -----------------------------------------------------------------------------
+# Paths
+# -----------------------------------------------------------------------------
+paths:
+  flux_path:        "/Volumes/T9/FOXES_Data/flux"
+  aia_path:         "/Volumes/T9/FOXES_Data/AIA_processed"
+  predictions_csv:  "/Volumes/T9/FOXES_Misc/batch_results/vit/vit_predictions_test.csv"
+  output_dir:       "/Volumes/T9/FOXES_Data/flare_analysis"
+# -----------------------------------------------------------------------------
+# Time Range  (null = use full predictions CSV range)
+# -----------------------------------------------------------------------------
+time_range:
+  start: "2024-03-23T00:00:00"   # e.g. "2024-03-23T00:00:00"
+  end:   "2024-03-23T03:00:00"   # hour zero-padded so the value is valid ISO 8601
+# -----------------------------------------------------------------------------
+# Detection
+# -----------------------------------------------------------------------------
+detection:
+  min_flux_threshold:                    1.0e-7   # W/m² — patches below this are ignored
+  threshold_std_multiplier:              4.0      # flux mask: mean + N*std
+  spatial_smoothing_sigma:               1.0      # Gaussian pre-smoothing (patches, 0 = off)
+  radial_expansion_threshold_percentile: 30.0     # flood-fill growth cutoff percentile
+  peak_neighborhood_sizes:               [10, 15, 20, 25]  # multi-scale local-max windows
+  peak_min_scale_agreement:              2       # peaks must appear at N scales
+  peak_scale_tolerance:                  10        # patch-distance to count as "same peak"
+  min_peak_distance:                     5       # min patches between distinct peaks
+# -----------------------------------------------------------------------------
+# Grid / Patch Parameters
+# -----------------------------------------------------------------------------
+grid:
+  grid_size:   [64, 64]
+  patch_size:  8
+  input_size:  512
+# -----------------------------------------------------------------------------
+# Region Tracking
+# -----------------------------------------------------------------------------
+tracking:
+  max_tracking_distance: 10     # max patch-distance between frames to link regions
+  flux_ratio_weight:     0    # weight of flux-ratio term in linking score
+  size_ratio_weight:     0    # weight of size-ratio term in linking score
+  distance_weight:       1.0    # weight of spatial distance in linking score
+  age_bonus_weight:      2.0    # max score discount for established tracks (applied as weight * age/(1+age))
+  cadence_seconds:       60.0   # expected data cadence
+  max_gap_frames:        15     # frames a track can go undetected before expiring
+# -----------------------------------------------------------------------------
+# Movie / Output
+# -----------------------------------------------------------------------------
+movie:
+  create_movie:             true
+  plot_window_hours:        2.0    # SXR plot time window around current frame
+  fps:                      30.0
+  frame_interval_minutes:   1.0    # one frame per minute of data
+  num_workers:              8
+  dpi:                      75.0
+  frame_format:             "jpg"  # "jpg" (fast) or "png" (quality)
+  jpeg_quality:             90

analysis/spatial_performance.py CHANGED Viewed

@@ -46,7 +46,7 @@ CROP_FACTOR     = 1.1   # AIA images cropped at 1.1 solar radii
 SOLAR_RADIUS_PATCHES = (GRID_SIZE / 2) / CROP_FACTOR   # ≈ 29.1 patches
 # Patches beyond ±PATCH_CROP_RADIUS from center (in original 64×64 patch units) are masked.
-PATCH_CROP_RADIUS = 19
 # Percentile cap for colorbar scaling (applied to non-NaN values).
 # e.g. 99 clips the top 1% of values so detail in the bulk is visible.

 SOLAR_RADIUS_PATCHES = (GRID_SIZE / 2) / CROP_FACTOR   # ≈ 29.1 patches
 # Patches beyond ±PATCH_CROP_RADIUS from center (in original 64×64 patch units) are masked.
+PATCH_CROP_RADIUS = 24
 # Percentile cap for colorbar scaling (applied to non-NaN values).
 # e.g. 99 clips the top 1% of values so detail in the bulk is visible.

forecasting/inference/flare_analysis.py DELETED Viewed

The diff for this file is too large to render. See raw diff

forecasting/inference/flare_analysis_poster.py DELETED Viewed

The diff for this file is too large to render. See raw diff

pipeline_config.yaml CHANGED Viewed

@@ -5,7 +5,7 @@
 #
 # Usage:
 #   python run_pipeline.py --config pipeline_config.yaml --steps all
-#   python run_pipeline.py --config pipeline_config.yaml --steps train,inference,flare_analysis
 #   python run_pipeline.py --list
 #
 # Variables
@@ -152,6 +152,23 @@ spatial_performance:
   predictions_csv: "${base_dir}/inference/predictions.csv"
   out_dir:         "${base_dir}/inference/spatial_performance"
 # -----------------------------------------------------------------------------
 # Evaluation  (step: evaluate)
 # -----------------------------------------------------------------------------

 #
 # Usage:
 #   python run_pipeline.py --config pipeline_config.yaml --steps all
+#   python run_pipeline.py --config pipeline_config.yaml --steps train,inference,flux_map_analysis
 #   python run_pipeline.py --list
 #
 # Variables
   predictions_csv: "${base_dir}/inference/predictions.csv"
   out_dir:         "${base_dir}/inference/spatial_performance"
+# -----------------------------------------------------------------------------
+# Flux map analysis  (step: flux_map_analysis)
+# Detects and tracks active regions from per-patch flux contribution maps,
+# renders side-by-side AIA + SXR frames, and stitches them into a movie.
+# -----------------------------------------------------------------------------
+flux_map_analysis:
+  config: "analysis/flux_map_config.yaml"
+  # overrides:                        # uncomment to override config values
+  #   paths:
+  #     flux_path:       "${base_dir}/flux"
+  #     aia_path:        "${base_dir}/AIA_processed"
+  #     predictions_csv: "${base_dir}/inference/predictions.csv"
+  #     output_dir:      "${base_dir}/inference/flux_map_analysis"
+  #   time_range:
+  #     start: null      # null = full predictions CSV range
+  #     end:   null
 # -----------------------------------------------------------------------------
 # Evaluation  (step: evaluate)
 # -----------------------------------------------------------------------------

run_pipeline.py CHANGED Viewed

@@ -13,12 +13,12 @@ Runs any combination of pipeline steps in order:
   6. normalize      - Compute SXR normalization stats on train split (data/sxr_normalization.py)
   7. train          - Train the ViTLocal forecasting model (forecasting/training/train.py)
   8. inference      - Run batch inference on val/test data (forecasting/inference/inference.py)
-  9. flare_analysis - Detect, track, and match flares (forecasting/inference/flare_analysis.py)
 Usage:
   python run_pipeline.py --list
   python run_pipeline.py --config pipeline_config.yaml --steps all
-  python run_pipeline.py --config pipeline_config.yaml --steps train,inference,flare_analysis
 """
 import argparse
@@ -116,9 +116,9 @@ STEP_ORDER = [
     "train",
     "inference",
     "evaluate",
-    "flare_analysis",
     "ablation",
     "spatial_performance",
 ]
 STEP_INFO = {
@@ -166,10 +166,6 @@ STEP_INFO = {
         "description": "Compute metrics and generate evaluation plots from predictions CSV",
         "script": ROOT / "forecasting" / "inference" / "evaluation.py",
     },
-    "flare_analysis": {
-        "description": "Detect, track, and match flares; generate plots/movies",
-        "script": ROOT / "forecasting" / "inference" / "flare_analysis.py",
-    },
     "ablation": {
         "description": "Run Gaussian noise channel-masking ablation study on pretrained model",
         "script": ROOT / "forecasting" / "inference" / "ablation_inference.py",
@@ -178,6 +174,10 @@ STEP_INFO = {
         "description": "Generate flux-weighted spatial error heatmap on the solar disk",
         "script": ROOT / "analysis" / "spatial_performance.py",
     },
 }
@@ -329,15 +329,6 @@ def build_commands(step: str, cfg: dict, force: bool) -> list[list[str]] | None:
             config_path = str(write_merged_config(config_path, ev["overrides"], "evaluate_config"))
         return [base + ["-config", config_path]]
-    if step == "flare_analysis":
-        if not require(["config"], "inference"):
-            return None
-        inf = cfg["inference"]
-        config_path = inf["config"]
-        if inf.get("overrides"):
-            config_path = str(write_merged_config(config_path, inf["overrides"], "inference_config"))
-        return [base + ["--config", config_path]]
     if step == "ablation":
         if not require(["config"], "ablation"):
             return None
@@ -358,6 +349,15 @@ def build_commands(step: str, cfg: dict, force: bool) -> list[list[str]] | None:
             cmd += ["--out_dir", sp["out_dir"]]
         return [cmd]
     return [base]
@@ -398,7 +398,7 @@ def list_steps():
         print(f"  {i}. {step:<16} {STEP_INFO[step]['description']}")
     print()
     print("Use --steps all to run every step, or comma-separate specific steps.")
-    print("Example: --steps train,inference,flare_analysis\n")
 def main():

   6. normalize      - Compute SXR normalization stats on train split (data/sxr_normalization.py)
   7. train          - Train the ViTLocal forecasting model (forecasting/training/train.py)
   8. inference      - Run batch inference on val/test data (forecasting/inference/inference.py)
+  9. flux_map_analysis - Detect and track active regions from flux maps; render per-frame movie (analysis/flux_map_analysis.py)
 Usage:
   python run_pipeline.py --list
   python run_pipeline.py --config pipeline_config.yaml --steps all
+  python run_pipeline.py --config pipeline_config.yaml --steps train,inference
 """
 import argparse
     "train",
     "inference",
     "evaluate",
     "ablation",
     "spatial_performance",
+    "flux_map_analysis",
 ]
 STEP_INFO = {
         "description": "Compute metrics and generate evaluation plots from predictions CSV",
         "script": ROOT / "forecasting" / "inference" / "evaluation.py",
     },
     "ablation": {
         "description": "Run Gaussian noise channel-masking ablation study on pretrained model",
         "script": ROOT / "forecasting" / "inference" / "ablation_inference.py",
         "description": "Generate flux-weighted spatial error heatmap on the solar disk",
         "script": ROOT / "analysis" / "spatial_performance.py",
     },
+    "flux_map_analysis": {
+        "description": "Detect and track active regions from flux maps; render per-frame movie",
+        "script": ROOT / "analysis" / "flux_map_analysis.py",
+    },
 }
             config_path = str(write_merged_config(config_path, ev["overrides"], "evaluate_config"))
         return [base + ["-config", config_path]]
     if step == "ablation":
         if not require(["config"], "ablation"):
             return None
             cmd += ["--out_dir", sp["out_dir"]]
         return [cmd]
+    if step == "flux_map_analysis":
+        if not require(["config"], "flux_map_analysis"):
+            return None
+        fma = cfg["flux_map_analysis"]
+        config_path = fma["config"]
+        if fma.get("overrides"):
+            config_path = str(write_merged_config(config_path, fma["overrides"], "flux_map_analysis_config"))
+        return [base + ["--config", config_path]]
     return [base]
         print(f"  {i}. {step:<16} {STEP_INFO[step]['description']}")
     print()
     print("Use --steps all to run every step, or comma-separate specific steps.")
+    print("Example: --steps train,inference\n")
 def main():