"""WebRTC integration using aiortc for low-latency bi-directional media. This module exposes: - POST /webrtc/offer : Accepts an SDP offer from browser, returns SDP answer. - GET /webrtc/ice : (Optional) polling ICE candidates (simplified; trickle or full offer/answer) Media Flow (Phase 1): Browser camera/mic -> WebRTC -> aiortc PeerConnection -> Video track -> frame hook -> pipeline.process_video_frame -> return video track to client Audio track -> chunk hook -> pipeline.process_audio_chunk -> return audio track to client Control/Data channel: "control" used for lightweight JSON messages: {"type":"metrics_request"} -> server replies {"type":"metrics","payload":...} {"type":"set_reference","image_jpeg_base64":...} Fallback: If aiortc not supported in environment or import fails, endpoint returns 503. Security: (basic) Optional shared secret via X-API-Key header (env MIRAGE_API_KEY). NOTE: This is a minimal, production-ready skeleton focusing on structure, error handling, resource cleanup and integration points. Actual model inference now resides exclusively in swap_pipeline.FaceSwapPipeline. 
""" from __future__ import annotations import asyncio import base64 import json import logging import os import time from dataclasses import dataclass import hashlib import hmac import inspect import secrets as pysecrets import base64 as pybase64 import random from typing import Optional, Dict, Any from fastapi import APIRouter, HTTPException, Header try: from aiortc import RTCPeerConnection, RTCSessionDescription, MediaStreamTrack, RTCConfiguration, RTCIceServer, VideoStreamTrack from aiortc.contrib.media import MediaBlackhole import av # noqa: F401 (required by aiortc for codecs) AIORTC_AVAILABLE = True except Exception as e: # pragma: no cover AIORTC_IMPORT_ERROR = str(e) AIORTC_AVAILABLE = False import numpy as np import cv2 try: from webrtc_connection_monitoring import add_connection_monitoring # optional diagnostics except Exception: add_connection_monitoring = None logger = logging.getLogger(__name__) # Lazy pipeline getter with safe pass-through fallback to ensure router mounts _pipeline_singleton = None class _PassThroughPipeline: def __init__(self): # Mark as loaded so initialization is skipped self.loaded = True def initialize(self): return True def set_source_image(self, img): return False def process_video_frame(self, img, frame_idx=None): # Pass-through video return img def process_audio_chunk(self, pcm): # Pass-through audio (bytes or np array) return pcm def get_performance_stats(self): return {} def get_pipeline(): # type: ignore global _pipeline_singleton if _pipeline_singleton is not None: return _pipeline_singleton try: from swap_pipeline import get_pipeline as _real_get_pipeline _pipeline_singleton = _real_get_pipeline() except Exception as e: logger.error(f"swap_pipeline unavailable, using pass-through: {e}") _pipeline_singleton = _PassThroughPipeline() return _pipeline_singleton async def _ensure_pipeline_initialized() -> bool: """Ensure the face swap pipeline is initialized. 
async def _ensure_pipeline_initialized() -> bool:
    """Ensure the face swap pipeline is initialized.

    This function was missing previously resulting in a NameError and a 500
    response from /webrtc/offer before a peer connection could be created.
    Initialization can be moderately heavy (model loads), so we offload it to
    a thread executor to keep the event loop responsive.

    Returns True if initialized (or already initialized), False on failure.
    """
    try:
        pipe = get_pipeline()
        # NOTE(review): this checks 'initialized' but _PassThroughPipeline only
        # sets 'loaded'; for the pass-through this re-runs initialize() (a
        # harmless no-op returning True). Confirm which flag the real
        # swap_pipeline object exposes.
        if getattr(pipe, 'initialized', False):
            return True
        loop = asyncio.get_running_loop()

        def _init_blocking():  # executed in thread
            try:
                pipe.initialize()
                return True
            except Exception as e:  # noqa: BLE001
                logger.error(f"Pipeline initialization error: {e}")
                return False

        return await loop.run_in_executor(None, _init_blocking)
    except Exception as e:  # pragma: no cover - defensive
        logger.error(f"_ensure_pipeline_initialized failure: {e}")
        return False


# Router mounted by app with prefix "/webrtc"; declare here without its own prefix
router = APIRouter(tags=["webrtc"])

# Environment-driven configuration. All flags accept "1"/"true"/"yes"/"on".
API_KEY = os.getenv("MIRAGE_API_KEY")
REQUIRE_API_KEY = os.getenv("MIRAGE_REQUIRE_API_KEY", "0").strip().lower() in {"1","true","yes","on"}
TOKEN_TTL_SECONDS = int(os.getenv("MIRAGE_TOKEN_TTL", "300"))  # 5 minutes default
STUN_URLS = os.getenv(
    "MIRAGE_STUN_URLS",
    "stun:stun.l.google.com:19302,stun:stun1.l.google.com:19302,stun:stun2.l.google.com:19302,stun:stun3.l.google.com:19302,stun:stun4.l.google.com:19302,stun:stun.stunprotocol.org:3478"
)
TURN_URL = os.getenv("MIRAGE_TURN_URL")
TURN_USER = os.getenv("MIRAGE_TURN_USER")
TURN_PASS = os.getenv("MIRAGE_TURN_PASS")
METERED_API_KEY = os.getenv("MIRAGE_METERED_API_KEY")
TURN_TLS_ONLY = os.getenv("MIRAGE_TURN_TLS_ONLY", "1").strip().lower() in {"1","true","yes","on"}
PREFER_H264 = os.getenv("MIRAGE_PREFER_H264", "0").strip().lower() in {"1","true","yes","on"}
FORCE_RELAY = os.getenv("MIRAGE_FORCE_RELAY", "0").strip().lower() in {"1","true","yes","on"}
DISABLE_METERED = os.getenv("MIRAGE_DISABLE_METERED", "0").strip().lower() in {"1","true","yes","on"}
pybase64.urlsafe_b64encode(data).decode('ascii').rstrip('=') def _b64u_decode(data: str) -> bytes: pad = '=' * (-len(data) % 4) return pybase64.urlsafe_b64decode(data + pad) async def _test_turn_connectivity(ice_servers): """Test TURN server connectivity to diagnose NAT traversal issues.""" import socket from urllib.parse import urlparse turn_tests = [] for server in ice_servers: urls = server.urls if isinstance(server.urls, list) else [server.urls] for url in urls: if url.startswith('turn'): try: parsed = urlparse(url.replace('turn:', 'http://').replace('turns:', 'https://')) host = parsed.hostname port = parsed.port or (443 if url.startswith('turns:') else 3478) # Basic TCP connectivity test sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM) sock.settimeout(3) result = sock.connect_ex((host, port)) sock.close() if result == 0: logger.info(f"TURN server reachable: {host}:{port}") turn_tests.append(True) else: logger.warning(f"TURN server unreachable: {host}:{port} (error {result})") turn_tests.append(False) except Exception as e: logger.warning(f"TURN connectivity test failed for {url}: {e}") turn_tests.append(False) if turn_tests: reachable = sum(turn_tests) total = len(turn_tests) if reachable == 0: logger.error(f"All {total} TURN servers are unreachable - NAT traversal will likely fail") elif reachable < total: logger.warning(f"Only {reachable}/{total} TURN servers are reachable") else: logger.info(f"All {total} TURN servers are reachable") def _mint_token() -> str: """Stateless signed token: base64url(ts:nonce:mac).""" ts = str(int(time.time())) nonce = _b64u(pysecrets.token_bytes(12)) msg = f"{ts}:{nonce}".encode('utf-8') mac = hmac.new(API_KEY.encode('utf-8'), msg, hashlib.sha256).digest() return _b64u(msg) + '.' + _b64u(mac) @router.get("/ping") async def webrtc_ping(): """Lightweight check indicating the WebRTC router is mounted. 
@router.get("/ping")
async def webrtc_ping():
    """Lightweight check indicating the WebRTC router is mounted.

    Returns aiortc availability and import error (if any)."""
    return {
        "router": True,
        "aiortc_available": AIORTC_AVAILABLE,
        "aiortc_error": None if AIORTC_AVAILABLE else AIORTC_IMPORT_ERROR,
        "turn_configured": bool(TURN_URL and TURN_USER and TURN_PASS),
        "metered_configured": bool(METERED_API_KEY)
    }


# Minimal root to confirm router is mounted
@router.get("")
async def webrtc_root():
    return {"webrtc": True, "aiortc_available": AIORTC_AVAILABLE}


@router.get("/ice_config")
async def webrtc_ice_config():
    """Expose ICE server configuration so the client can include TURN if configured.

    Returns a structure compatible with RTCPeerConnection's configuration.
    """
    try:
        cfg = _ice_configuration()
        servers: list[dict[str, object]] = []
        stun_count = 0
        turn_count = 0
        for s in cfg.iceServers:
            entry: dict[str, object] = {"urls": s.urls}
            # Classify counts (s.urls may be list or str)
            urls_list = s.urls if isinstance(s.urls, list) else [s.urls]
            for u in urls_list:
                if isinstance(u, str):
                    if u.startswith('turn'):
                        turn_count += 1
                    elif u.startswith('stun'):
                        stun_count += 1
            if getattr(s, 'username', None):
                entry["username"] = s.username
            if getattr(s, 'credential', None):
                entry["credential"] = s.credential
            servers.append(entry)
        payload: dict[str, object] = {"iceServers": servers, "stunCount": stun_count, "turnCount": turn_count}
        if FORCE_RELAY:
            payload["forceRelay"] = True
            if turn_count == 0:
                # Hint to client that relay-only will fail with no TURN
                payload["relayOnlyWarning"] = "FORCE_RELAY enabled but no TURN servers available"
        return payload
    except Exception as e:
        # Fallback to public STUN
        return {"iceServers": [{"urls": ["stun:stun.l.google.com:19302"]}], "error": str(e), "stunCount": 1, "turnCount": 0}


@router.get("/debug_state")
async def webrtc_debug_state():
    """Return simplified current peer connection debug info."""
    try:
        st = _peer_state
        if st is None:
            return {
                "active": False,
                "last_connection_state": None,
                "last_ice_state": None,
            }
        pc = st.pc
        # getSenders may not exist on all pc implementations; default to empty
        senders = getattr(pc, 'getSenders', lambda: [])()

        def _sender_info(s):
            # Best-effort snapshot of one RTP sender's track; never raises.
            try:
                tr = s.track
                info = {
                    "kind": getattr(tr, 'kind', None) if tr else None,
                    "readyState": getattr(tr, 'readyState', None) if tr else None,
                    "exists": tr is not None
                }
                # Include frame emission counter if available
                try:
                    if tr and getattr(tr, 'kind', None) == 'video' and hasattr(tr, '_debug_emitted'):
                        info["frames_emitted"] = getattr(tr, '_debug_emitted')
                    # Outbound diagnostics (VideoStreamTrack subclass fields)
                    diag_pairs = [
                        ('_placeholder_active', 'placeholder_active'),
                        ('_placeholder_sent', 'placeholder_frames'),
                        ('_relay_failures', 'relay_failures'),
                        ('_relay_last_error', 'relay_last_error'),
                        ('_relay_last_error_ts', 'relay_last_error_ts'),
                        ('_first_relay_ts', 'first_relay_ts'),
                        ('_placeholder_initial_ts', 'placeholder_initial_ts'),
                        ('_placeholder_deactivated_ts', 'placeholder_deactivated_ts'),
                        ('_raw_frames_in', 'raw_frames_in'),
                    ]
                    for attr, key in diag_pairs:
                        if hasattr(tr, attr):
                            info[key] = getattr(tr, attr)
                except Exception:
                    pass
                return info
            except Exception:
                return {"kind": None, "exists": False}

        return {
            "active": True,
            "connectionState": getattr(pc, 'connectionState', None),
            "iceConnectionState": getattr(pc, 'iceConnectionState', None),
            "senders": [_sender_info(s) for s in senders],
            "control_channel_ready": st.control_channel_ready,
            "last_connection_state": st.last_connection_state,
            "last_ice_state": st.last_ice_state,
        }
    except Exception as e:
        return {"active": False, "error": str(e)}


def _verify_token(token: str) -> bool:
    """Validate a token minted by _mint_token: structure, TTL, and HMAC."""
    try:
        parts = token.split('.')
        if len(parts) != 2:
            return False
        msg_b64, mac_b64 = parts
        msg = _b64u_decode(msg_b64)
        mac = _b64u_decode(mac_b64)
        ts_str, nonce = msg.decode('utf-8').split(':', 1)
        ts = int(ts_str)
        # Reject tokens older than the configured TTL
        if time.time() - ts > TOKEN_TTL_SECONDS:
            return False
        expected = hmac.new(API_KEY.encode('utf-8'), msg, hashlib.sha256).digest()
        # Constant-time comparison to avoid timing side channels
        return hmac.compare_digest(expected, mac)
    except Exception:
        return False
def _check_api_key(header_val: Optional[str], token_val: Optional[str] = None):
    """Authorize a request using a raw API key or a signed token.

    Raises HTTPException(401) only when enforcement is enabled and neither
    credential is valid.
    """
    # If no API key configured, allow
    if not API_KEY:
        return
    # If enforcement disabled, allow
    if not REQUIRE_API_KEY:
        return
    # Accept raw key or signed token
    if header_val and header_val == API_KEY:
        return
    if token_val and _verify_token(token_val):
        return
    raise HTTPException(status_code=401, detail="Unauthorized")


def _servers_have_scheme(servers, scheme: str) -> bool:
    """Return True if any RTCIceServer has a URL starting with *scheme*.

    FIX: the previous checks used `'turn:' in s.urls`, which is a substring
    test for str urls but a *list membership* test when urls is a list (as
    returned by the metered credentials API), silently yielding False. It
    also missed 'turns:' URLs. Using startswith('turn') covers both.
    """
    for s in servers:
        urls = s.urls if isinstance(s.urls, list) else [s.urls]
        if any(isinstance(u, str) and u.startswith(scheme) for u in urls):
            return True
    return False


def _ice_configuration() -> RTCConfiguration:
    """Build RTCConfiguration, preferring metered TURN, then static, then STUN.

    Includes a 5-second timeout for the metered fetch.
    """
    servers = []
    static_turn_available = bool(TURN_URL and TURN_USER and TURN_PASS)
    use_metered = bool(METERED_API_KEY) and not DISABLE_METERED and not static_turn_available

    # 1. Try Metered Service (e.g., Twilio) with a timeout
    if use_metered:
        try:
            import httpx
            logger.info("Fetching metered ICE servers...")
            # Timeout set to 5s to avoid long hangs on unresponsive service
            with httpx.Client(timeout=5.0) as client:
                response = client.post(
                    "https://api.metered.ca/api/v1/turn/credentials?apiKey=" + METERED_API_KEY
                )
                response.raise_for_status()
                servers.extend([RTCIceServer(**s) for s in response.json()])
                logger.info(f"Successfully fetched {len(servers)} metered ICE servers.")
        except Exception as e:
            warn_msg = f"Metered ICE fetch failed: {e}"
            logger.warning(warn_msg)
            # Surface additional context if the host cannot be resolved (common on HF Spaces without outbound DNS)
            try:
                import socket
                import urllib.parse
                parsed = urllib.parse.urlparse("https://api.metered.ca")
                host = parsed.hostname
                if host:
                    socket.gethostbyname(host)
            except socket.gaierror as dns_err:
                logger.warning(f"Metered ICE DNS lookup failed: {dns_err}. Verify outbound DNS/HTTPS access from the container or disable MIRAGE_METERED_API_KEY.")
            except Exception:
                pass
    elif METERED_API_KEY and DISABLE_METERED:
        logger.info("Metered ICE fetch disabled via MIRAGE_DISABLE_METERED=1")
    elif METERED_API_KEY and static_turn_available:
        logger.info("Skipping metered ICE fetch because static TURN credentials are configured")

    # 2. Fallback to static TURN if metered fetch failed or wasn't configured
    if not _servers_have_scheme(servers, 'turn') and static_turn_available:
        logger.info("No metered TURN servers loaded, adding static TURN configuration.")
        servers.append(
            RTCIceServer(
                urls=TURN_URL,
                username=TURN_USER,
                credential=TURN_PASS
            )
        )

    # 3. Add public STUN servers if none are configured
    if not servers or not _servers_have_scheme(servers, 'stun'):
        logger.info("Adding default STUN servers.")
        stun_server_urls = [s.strip() for s in STUN_URLS.split(',') if s.strip()]
        if stun_server_urls:
            servers.append(RTCIceServer(urls=stun_server_urls))

    # 4. Asynchronously test TURN connectivity if any TURN servers are configured
    if _servers_have_scheme(servers, 'turn'):
        asyncio.create_task(_test_turn_connectivity(servers))

    return RTCConfiguration(iceServers=servers)
""" try: lines = sdp.splitlines() m_indices = [i for i,l in enumerate(lines) if l.startswith('m=') and media_type in l] if not m_indices: return sdp # Find payload types for desired codec codec_payloads = [] for i,l in enumerate(lines): if l.startswith('a=rtpmap:') and codec.lower() in l.lower(): try: pt = l.split(':',1)[1].split()[0] if '/' in pt: pt = pt.split()[0] codec_payloads.append(pt) except Exception: continue if not codec_payloads: return sdp for mi in m_indices: parts = lines[mi].split() if len(parts) > 3: header = parts[:3] payloads = parts[3:] # Stable ordering: preferred codec payloads first, then remaining new_payloads = [p for p in payloads if p in codec_payloads] + [p for p in payloads if p not in codec_payloads] lines[mi] = ' '.join(header + new_payloads) return '\r\n'.join(lines) + '\r\n' except Exception: return sdp @router.on_event("startup") async def on_startup(): """Startup tasks: test TURN connectivity, etc.""" try: # Initial TURN connectivity test (async) ice_config = _ice_configuration() if ice_config.iceServers: asyncio.create_task(_test_turn_connectivity(ice_config.iceServers)) except Exception as e: logger.warning(f"Startup tasks error: {e}") @dataclass class PeerState: pc: RTCPeerConnection created: float control_channel_ready: bool = False last_connection_state: Optional[str] = None last_ice_state: Optional[str] = None cleanup_task: Optional[asyncio.Task] = None outbound_video: Optional['OutboundVideoTrack'] = None incoming_video_track: Optional['IncomingVideoTrack'] = None ice_samples: list[dict[str, Any]] = None # rolling ICE stats snapshots ice_sampler_task: Optional[asyncio.Task] = None ice_watchdog_task: Optional[asyncio.Task] = None received_video: bool = False received_audio: bool = False incoming_frames: int = 0 incoming_first_frame_ts: Optional[float] = None last_disconnect_reason: Optional[str] = None outbound_sender_mid: Optional[str] = None outbound_bind_method: Optional[str] = None outbound_sender_bind_ts: 
# In-memory single peer (extend to dict for multi-user)
_peer_state: Optional[PeerState] = None
_peer_lock = asyncio.Lock()
_last_peer_snapshot: Optional[dict[str, Any]] = None
_negotiation_events: list[dict[str, Any]] = []  # rolling recent negotiation stage events


class IncomingVideoTrack(MediaStreamTrack):
    """Wraps the browser's camera track and runs frames through the pipeline.

    Supports two processing modes: inline (process synchronously when no
    background task is pending) and background (reuse the last processed
    frame while a task runs), trading latency against freshness.
    """
    kind = "video"

    def __init__(self, track: MediaStreamTrack, peer_state: Optional[PeerState] = None):
        super().__init__()  # base init
        self.track = track
        self.pipeline = get_pipeline()
        self.frame_id = 0
        self._last_processed: Optional[np.ndarray] = None
        self._processing_task: Optional[asyncio.Task] = None
        self._lock = asyncio.Lock()
        self._peer_state_ref = peer_state
        # Latency / timing metrics
        self._capture_ts: Optional[float] = None
        self._last_latency_ms: Optional[float] = None
        self._avg_latency_ms: Optional[float] = None
        self._lat_hist: list[float] = []
        self._queue_wait_last_ms: Optional[float] = None
        self._queue_wait_hist: list[float] = []
        self._frames_passthrough = 0
        self._frames_processed = 0
        self._frames_dropped = 0
        self._placeholder_active = True
        self._sync_if_idle = os.getenv('MIRAGE_SYNC_IF_IDLE', '1').lower() in ('1', 'true', 'yes', 'on')
        self._pts_origin: Optional[float] = None  # monotonic origin
        self._last_sent_pts: Optional[int] = None
        self._time_base = (1, 90000)  # 90kHz typical video clock
        self._raw_frames_in = 0

    async def recv(self):  # type: ignore[override]
        frame = await self.track.recv()
        self._raw_frames_in += 1
        if self._peer_state_ref is not None:
            try:
                self._peer_state_ref.incoming_frames += 1
                if self._peer_state_ref.incoming_first_frame_ts is None:
                    self._peer_state_ref.incoming_first_frame_ts = time.time()
            except Exception:
                pass
        if self._raw_frames_in == 1:
            try:
                logger.info("IncomingVideoTrack first frame received size=%sx%s" % (getattr(frame, 'width', '?'), getattr(frame, 'height', '?')))
            except Exception:
                pass
        self.frame_id += 1
        capture_t = time.time()
        if self._pts_origin is None:
            self._pts_origin = capture_t
        # Convert to numpy BGR for pipeline
        img = frame.to_ndarray(format="bgr24")
        h, w, _ = img.shape
        proc_input = img
        # Optional downscale (same as prior)
        try:
            max_dim_cfg = int(os.getenv('MIRAGE_PROC_MAX_DIM', '512') or '512')
            if max_dim_cfg < 64:
                max_dim_cfg = 64
            if max(h, w) > max_dim_cfg:
                if w >= h:
                    scale_w = max_dim_cfg
                    scale_h = int(h * (max_dim_cfg / w))
                else:
                    scale_h = max_dim_cfg
                    scale_w = int(w * (max_dim_cfg / h))
                proc_input = cv2.resize(img, (max(1, scale_w), max(1, scale_h)))
        except Exception as e:
            logger.debug(f"Video downscale skip: {e}")
        expected_size = (w, h)
        processed: Optional[np.ndarray] = None
        # Hybrid processing: inline if no background task running OR sync flag set; else schedule
        if self._sync_if_idle and (self._processing_task is None):
            t_q_start = time.time()
            try:
                out_small = self.pipeline.process_video_frame(proc_input, self.frame_id)
                if out_small is not None and (out_small.shape[1], out_small.shape[0]) != expected_size:
                    processed = cv2.resize(out_small, expected_size)
                else:
                    processed = out_small if out_small is not None else img
                self._queue_wait_last_ms = (time.time() - t_q_start) * 1000.0  # inclusive (no wait, pure proc)
                self._queue_wait_hist.append(self._queue_wait_last_ms)
                if len(self._queue_wait_hist) > 300:
                    self._queue_wait_hist.pop(0)
                self._frames_processed += 1
            except Exception as ex:
                logger.debug(f"inline processing error: {ex}")
                processed = img
        else:
            # Background path
            if self._processing_task is None:
                async def _process_async(inp: np.ndarray, expected_size: tuple[int, int], fid: int, enqueue_t: float):
                    try:
                        out_small = self.pipeline.process_video_frame(inp, fid)
                        out = out_small
                        if out_small is not None and (out_small.shape[1], out_small.shape[0]) != expected_size:
                            out = cv2.resize(out_small, expected_size)
                        elif out is None:
                            out = inp  # fallback
                        async with self._lock:
                            self._last_processed = out
                        q_wait = (time.time() - enqueue_t) * 1000.0
                        self._queue_wait_last_ms = q_wait
                        self._queue_wait_hist.append(q_wait)
                        if len(self._queue_wait_hist) > 300:
                            self._queue_wait_hist.pop(0)
                        self._frames_processed += 1
                    except Exception as ex:
                        logger.debug(f"video processing error(bg): {ex}")
                    finally:
                        self._processing_task = None

                self._processing_task = asyncio.create_task(_process_async(proc_input, expected_size, self.frame_id, time.time()))
            # Use last processed snapshot; count passthrough if not yet available
            async with self._lock:
                if self._last_processed is not None:
                    processed = self._last_processed
                else:
                    processed = img
                    self._frames_passthrough += 1
            # We'll consider this frame 'dropped' re: processing freshness if a task already running
            if self._processing_task is not None:
                self._frames_dropped += 1
        # Metrics update
        proc_latency_ms = (time.time() - capture_t) * 1000.0
        self._last_latency_ms = proc_latency_ms
        self._lat_hist.append(proc_latency_ms)
        if len(self._lat_hist) > 300:
            self._lat_hist.pop(0)
        self._avg_latency_ms = float(np.mean(self._lat_hist)) if self._lat_hist else None
        # Placeholder becomes inactive as soon as we emit a frame post-first capture
        if self._placeholder_active:
            self._placeholder_active = False
        # Timestamp handling: derive pts from capture time relative to origin on a 90kHz clock
        try:
            clock_rate = 90000
            rel_sec = capture_t - (self._pts_origin or capture_t)
            pts = int(rel_sec * clock_rate)
            # Guard against monotonic regressions
            if self._last_sent_pts is not None and pts <= self._last_sent_pts:
                pts = self._last_sent_pts + int(clock_rate / 30)  # assume ~30fps minimal increment
            self._last_sent_pts = pts
        except Exception:
            pts = frame.pts if frame.pts is not None else 0
        import av as _av
        from fractions import Fraction
        vframe = _av.VideoFrame.from_ndarray(processed, format="bgr24")
        vframe.pts = pts
        # FIX: `_av.time_base.TimeBase` does not exist in PyAV, so the old
        # hasattr() guard always fell back to frame.time_base, which need not
        # match the 90kHz pts computed above. PyAV time_base is a Fraction.
        vframe.time_base = Fraction(1, 90000)
        if (self.frame_id % 120) == 0:
            # FIX: previous f-string embedded a conditional expression inside a
            # format spec ("{x:.1f if x else None}"), which raised ValueError
            # every 120th frame. Format the average separately instead.
            avg_repr = f"{self._avg_latency_ms:.1f}" if self._avg_latency_ms is not None else "None"
            logger.debug(
                f"vid frame={self.frame_id} inline={self._sync_if_idle and self._processing_task is None} "
                f"proc_ms={proc_latency_ms:.1f} avg_ms={avg_repr} "
                f"queue_wait_last={self._queue_wait_last_ms} passthrough={self._frames_passthrough} dropped={self._frames_dropped}"
            )
        return vframe


class OutboundVideoTrack(VideoStreamTrack):
    """Outbound track that sends black frames until a real source is attached.

    Once set_source is called with a MediaStreamTrack, it relays frames from
    that track.
    """
    kind = "video"

    def __init__(self, width: int = 320, height: int = 240, fps: int = 15):
        super().__init__()
        self._source: Optional[MediaStreamTrack] = None
        self._width = width
        self._height = height
        self._frame_interval = 1.0 / max(1, fps)
        self._last_ts = time.time()
        self._frame_count = 0
        self._debug_emitted = 0
        self._placeholder_sent = 0
        # Placeholder mode active until first successful frame relay OR timeout
        self._placeholder_active = True
        self._placeholder_timeout = time.time() + 5.0
        # Diagnostics
        self._relay_failures = 0
        self._relay_last_error: Optional[str] = None
        self._relay_last_error_ts: Optional[float] = None
        self._first_relay_ts: Optional[float] = None
        self._placeholder_deactivated_ts: Optional[float] = None
        self._placeholder_initial_ts: float = time.time()
        # Extended diagnostics
        self._luma_last: Optional[float] = None
        self._luma_samples: list[float] = []
        self._real_frames: int = 0
        self._placeholder_frames: int = 0
        self._bind_attempts: int = 0
        self._bound_at: Optional[float] = None

    def set_source(self, track: MediaStreamTrack):
        """Bind the processed incoming track; first bind wins."""
        self._bind_attempts += 1
        # Guard: ignore if already bound and active to avoid accidental overwrite
        if self._source is None:
            self._source = track
            self._bound_at = time.time()
            logger.info("OutboundVideoTrack source bound (attempt=%d)" % self._bind_attempts)
        else:
            logger.warning("OutboundVideoTrack set_source called but source already set (attempt=%d)" % self._bind_attempts)

    def clear_source(self):
        """Clear the source to prevent hanging on failed connections"""
        self._source = None
        self._placeholder_active = True  # Revert to placeholder mode
        self._placeholder_timeout = time.time() + 5.0  # Reset timeout
    async def recv(self):  # type: ignore[override]
        """Relay a frame from the bound source, or synthesize a diagnostic pattern.

        Relay failures never propagate: any source error falls through to the
        generated placeholder/test-pattern path so the encoder keeps running.
        """
        src = self._source
        if src is not None:
            try:
                f = await src.recv()
                # Detect if frame is still a raw passthrough sized frame (heuristic: placeholder period or frame_count==0)
                self._frame_count += 1
                self._debug_emitted += 1
                if self._placeholder_active:
                    self._placeholder_active = False
                    self._placeholder_deactivated_ts = time.time()
                # Luminance sample every 15 frames
                if (self._frame_count % 15) == 0:
                    try:
                        arr = f.to_ndarray(format="bgr24")
                        # convert to gray cheaply
                        luma = float(np.mean(arr))
                        self._luma_last = luma
                        self._luma_samples.append(luma)
                        if len(self._luma_samples) > 200:
                            self._luma_samples.pop(0)
                    except Exception as _ex:
                        if (self._frame_count % 150) == 0:
                            logger.debug(f"luma sample failed: {_ex}")
                self._real_frames += 1
                if (self._frame_count % 30) == 0:
                    try:
                        logger.info(f"OutboundVideoTrack relayed frame {self._frame_count} size={getattr(f, 'width', '?')}x{getattr(f, 'height', '?')}")
                    except Exception:
                        pass
                if self._first_relay_ts is None:
                    self._first_relay_ts = time.time()
                return f
            except Exception as e:
                # Rate-limited warning: first 5 failures, then every 50th
                self._relay_failures += 1
                if self._relay_failures <= 5 or (self._relay_failures % 50) == 0:
                    logger.warning(f"OutboundVideoTrack relay failure count={self._relay_failures} err={e}")
                self._relay_last_error = str(e)
                self._relay_last_error_ts = time.time()
                # fall back to placeholder pattern
        # generate black/diagnostic placeholder frame at target fps (early stage before processed frames ready)
        now = time.time()
        delay = self._frame_interval - (now - self._last_ts)
        if delay > 0:
            await asyncio.sleep(delay)
        self._last_ts = time.time()
        # Diagnostic test pattern only while placeholder active and before timeout
        frame = np.zeros((self._height, self._width, 3), dtype=np.uint8)
        if self._placeholder_active and time.time() > self._placeholder_timeout:
            self._placeholder_active = False
        placeholder_active = self._placeholder_active
        if placeholder_active and (self._frame_count % 15) == 0:
            try:
                logger.warning(f"[video-placeholder] still active fc={self._frame_count} src={'set' if self._source else 'none'} timeout_in={int(self._placeholder_timeout-time.time())}")
            except Exception:
                pass
        try:
            # Color bars
            num_bars = 6
            bar_w = max(1, self._width // num_bars)
            colors = [
                (0, 0, 255),    # Red
                (0, 255, 0),    # Green
                (255, 0, 0),    # Blue
                (0, 255, 255),  # Yellow
                (255, 0, 255),  # Magenta
                (255, 255, 0),  # Cyan
            ]
            for i in range(num_bars):
                x0 = i * bar_w
                x1 = self._width if i == num_bars - 1 else (i + 1) * bar_w
                frame[:, x0:x1] = colors[i]
            # Moving square / indicator
            t = int(time.time() * 2)
            sq = max(10, min(self._height, self._width) // 10)
            x = (t * 25) % max(1, (self._width - sq))
            y = (t * 18) % max(1, (self._height - sq))
            color = (255, 255, 255) if placeholder_active else (0, 0, 0)
            cv2.rectangle(frame, (x, y), (x + sq, y + sq), color, thickness=-1)
            # Text with frame count
            text = f"OUT {self._frame_count}{' P' if placeholder_active else ''}"
            cv2.putText(frame, text, (10, self._height - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 2, cv2.LINE_AA)
            cv2.putText(frame, text, (10, self._height - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 255, 255), 1, cv2.LINE_AA)
        except Exception:
            # If OpenCV drawing fails for any reason, keep plain black
            pass
        import av as _av
        vframe = _av.VideoFrame.from_ndarray(frame, format="bgr24")
        # Provide monotonically increasing timestamps for encoder
        pts, time_base = await self.next_timestamp()
        vframe.pts = pts
        vframe.time_base = time_base
        self._frame_count += 1
        self._debug_emitted += 1
        self._placeholder_frames += 1
        if placeholder_active:
            self._placeholder_sent += 1
            if self._placeholder_sent in (1, 10):
                try:
                    logger.info(f"OutboundVideoTrack placeholder frame emitted (count={self._placeholder_sent})")
                except Exception:
                    pass
        if (self._frame_count % 30) == 0 and not placeholder_active:
            try:
                logger.info(f"OutboundVideoTrack generated pattern frame {self._frame_count} {self._width}x{self._height}")
            except Exception:
                pass
        return vframe
class IncomingAudioTrack(MediaStreamTrack):
    """Wraps the browser's audio track, routing PCM through the pipeline.

    Resamples to mono s16 @16kHz for processing, then back to the original
    rate/layout. On any error the original frame is returned unmodified.
    """
    kind = "audio"

    def __init__(self, track: MediaStreamTrack):
        super().__init__()
        self.track = track
        self.pipeline = get_pipeline()
        # Resamplers are created lazily: input characteristics (rate/layout)
        # are only known once the first frame arrives.
        self._resample_to_16k = None
        self._resample_from_16k = None

    async def recv(self):  # type: ignore[override]
        frame = await self.track.recv()
        # frame is an AudioFrame (PCM)
        try:
            import av
            from av.audio.resampler import AudioResampler
            # Initialize resamplers once using input characteristics
            if self._resample_to_16k is None:
                self._resample_to_16k = AudioResampler(format='s16', layout='mono', rate=16000)
            if self._resample_from_16k is None:
                # Back to original sample rate and layout; keep s16 for low overhead
                target_layout = frame.layout.name if frame.layout else 'mono'
                target_rate = frame.sample_rate or 48000
                self._resample_from_16k = AudioResampler(format='s16', layout=target_layout, rate=target_rate)
            # 1) To mono s16 @16k for pipeline
            f_16k_list = self._resample_to_16k.resample(frame)
            # Newer PyAV returns a list of frames; older returns a single frame
            if isinstance(f_16k_list, list):
                f_16k = f_16k_list[0]
            else:
                f_16k = f_16k_list
            pcm16k = f_16k.to_ndarray()  # (channels, samples), dtype=int16
            if pcm16k.ndim == 2:
                # convert to mono if needed
                if pcm16k.shape[0] > 1:
                    pcm16k = np.mean(pcm16k, axis=0, keepdims=True).astype(np.int16)
                # drop channel dim -> (samples,)
                pcm16k = pcm16k.reshape(-1)
            # 2) Pipeline processing (mono 16k int16 ndarray)
            processed_arr = self.pipeline.process_audio_chunk(pcm16k)
            # Pipeline may return raw bytes or an array-like
            if isinstance(processed_arr, bytes):
                processed_bytes = processed_arr
            else:
                processed_bytes = np.asarray(processed_arr, dtype=np.int16).tobytes()
            # 3) Wrap processed back into an av frame @16k mono s16
            samples = len(processed_bytes) // 2  # 2 bytes per s16 sample
            f_proc_16k = av.AudioFrame(format='s16', layout='mono', samples=samples)
            f_proc_16k.sample_rate = 16000
            f_proc_16k.planes[0].update(processed_bytes)
            # 4) Resample back to original sample rate/layout
            f_out_list = self._resample_from_16k.resample(f_proc_16k)
            if isinstance(f_out_list, list) and len(f_out_list) > 0:
                f_out = f_out_list[0]
            else:
                f_out = f_proc_16k  # fallback
            # Preserve timing as best-effort
            f_out.pts = frame.pts
            f_out.time_base = frame.time_base
frame.time_base return f_out except Exception as e: logger.error(f"Audio processing error: {e}") return frame @router.post("/offer") async def webrtc_offer(offer: Dict[str, Any], x_api_key: Optional[str] = Header(default=None), x_auth_token: Optional[str] = Header(default=None)): """Accept SDP offer (from browser) and return SDP answer. Instrumented with lightweight negotiation stage logging so we can pinpoint where a 500 originates (outbound track setup, createAnswer, etc.). The browser is *always* responsible for creating the *offer*; the server only ever creates the *answer*. This endpoint performs no browser/client-side JS; it strictly handles SDP, media track plumbing and pipeline binding. """ global _peer_state, _last_peer_snapshot # declare once at top to avoid 'used prior to global declaration' negotiation_id = f"neg-{int(time.time()*1000)}-{random.randint(1000,9999)}" # best-effort unique ID DEBUG_NEG = os.getenv("MIRAGE_DEBUG_NEGOTIATION", "0").strip().lower() in {"1","true","yes","on"} def stage(msg: str, level: str = "info"): line = f"[{negotiation_id}] {msg}" evt = {"ts": time.time(), "negotiation_id": negotiation_id, "msg": msg, "level": level} try: _negotiation_events.append(evt) # Keep only last 80 events if len(_negotiation_events) > 80: del _negotiation_events[: len(_negotiation_events) - 80] except Exception: pass if level == "error": logger.error(line) elif level == "warning": logger.warning(line) else: logger.info(line) stage("offer_received") # If enforcement enabled, require a valid signed token; otherwise allow if REQUIRE_API_KEY: if not (x_auth_token and _verify_token(x_auth_token)): raise HTTPException(status_code=401, detail="Unauthorized") if not AIORTC_AVAILABLE: raise HTTPException(status_code=503, detail=f"aiortc not available: {AIORTC_IMPORT_ERROR}") async with _peer_lock: # Ensure pipeline is ready before wiring tracks init_ok = await _ensure_pipeline_initialized() if not init_ok: stage("pipeline_init_failed", level="error") raise 
HTTPException(status_code=500, detail="pipeline_init_failed") # Cleanup existing peer if present - critical for retry scenarios if _peer_state is not None: try: await _peer_state.pc.close() stage("previous_pc_closed") except Exception: pass # Clear outbound video source from previous connection if _peer_state.outbound_video: _peer_state.outbound_video.clear_source() stage("previous_outbound_video_cleared") # Reset pipeline state for clean reconnection try: from swap_pipeline import reset_pipeline reset_pipeline() stage("pipeline_reset_for_new_offer") except Exception as e: stage(f"pipeline_reset_failed: {e}", level="warning") _last_peer_snapshot = { "event": "pre_offer_cleanup", "connection_state": getattr(_peer_state, 'last_connection_state', None), "ice_state": getattr(_peer_state, 'last_ice_state', None), "received_video": getattr(_peer_state, 'received_video', False), "incoming_frames": getattr(_peer_state, 'incoming_frames', 0), } _peer_state = None ice_config = _ice_configuration() # Log ICE configuration for diagnostics server_summary = [] for server in ice_config.iceServers: urls = server.urls if isinstance(server.urls, list) else [server.urls] has_auth = bool(getattr(server, 'username', None)) for url in urls: server_type = 'TURN' if url.startswith('turn') else 'STUN' server_summary.append(f"{server_type}:{url}{'(auth)' if has_auth else ''}") logger.info(f"ICE servers configured: {', '.join(server_summary)}") # Test TURN server connectivity (async, don't block connection) if ice_config.iceServers: asyncio.create_task(_test_turn_connectivity(ice_config.iceServers)) pc = RTCPeerConnection(configuration=ice_config) blackhole = MediaBlackhole() # optional sink try: outbound_video = OutboundVideoTrack() stage("outbound_video_constructed") except Exception as e: stage(f"outbound_video_construct_failed: {e}", level="error") try: await pc.close() except Exception: pass raise HTTPException(status_code=500, detail=f"outbound_video_setup: {e}") _peer_state = 
PeerState(pc=pc, created=time.time(), outbound_video=outbound_video) _peer_state.ice_samples = [] _last_peer_snapshot = None @pc.on("datachannel") def on_datachannel(channel): logger.info("Data channel received: %s", channel.label) if channel.label == "control": # Mark control channel readiness on open/close @channel.on("open") def _on_open(): try: global _peer_state if _peer_state is not None: _peer_state.control_channel_ready = True except Exception: pass @channel.on("close") def _on_close(): try: global _peer_state if _peer_state is not None: _peer_state.control_channel_ready = False except Exception: pass def send_metrics(): pipeline = get_pipeline() stats = pipeline.get_performance_stats() if pipeline.loaded else {} payload = json.dumps({"type": "metrics", "payload": stats}) try: channel.send(payload) except Exception: logger.debug("Failed sending metrics") @channel.on("message") def on_message(message): try: if isinstance(message, bytes): return data = json.loads(message) mtype = data.get("type") if mtype == "ping": channel.send(json.dumps({"type": "pong", "t": time.time()})) elif mtype == "metrics_request": send_metrics() elif mtype == "set_reference": b64 = data.get("image_jpeg_base64") or data.get("image_base64") if b64: async def _set_ref_async(b64data: str): try: # Allow moderately large images; cap to ~6MB base64 length if len(b64data) > 6_000_000: channel.send(json.dumps({"type": "error", "message": "reference too large"})) return raw = base64.b64decode(b64data) arr = np.frombuffer(raw, np.uint8) # cv2.imdecode handles JPEG, PNG, WebP, etc. 
automatically img = cv2.imdecode(arr, cv2.IMREAD_COLOR) if img is None: channel.send(json.dumps({"type": "error", "message": "decode failed (unsupported image or corrupt)"})) return # Downscale to max 512 for stability h, w = img.shape[:2] scale = max(h, w) if scale > 512: if w >= h: new_w = 512 new_h = max(1, int(h * (512 / w))) else: new_h = 512 new_w = max(1, int(w * (512 / h))) img = cv2.resize(img, (new_w, new_h)) pipeline = get_pipeline() loop = asyncio.get_running_loop() def _set_ref_blocking(): return pipeline.set_reference_frame(img) ok = await loop.run_in_executor(None, _set_ref_blocking) if ok: channel.send(json.dumps({"type": "reference_ack"})) else: channel.send(json.dumps({"type": "error", "message": "no suitable face found"})) except Exception as e: logger.error(f"set_reference error: {e}") try: channel.send(json.dumps({"type": "error", "message": str(e)})) except Exception: pass asyncio.create_task(_set_ref_async(b64)) except Exception as e: logger.error(f"Data channel message error: {e}") @pc.on("connectionstatechange") async def on_state_change(): global _peer_state, _last_peer_snapshot # single global declaration for entire handler logger.info("Peer connection state: %s", pc.connectionState) try: if _peer_state is not None: _peer_state.last_connection_state = pc.connectionState except Exception: pass # Immediately close failed connections to prevent resource leaks if pc.connectionState in ("failed", "disconnected", "closed"): try: # Clean pipeline resources on connection failure/close from swap_pipeline import reset_pipeline reset_pipeline() logger.info(f"Pipeline reset due to connection state: {pc.connectionState}") except Exception as e: logger.warning(f"Pipeline reset failed on state change: {e}") # Clear global peer state to allow clean retry async with _peer_lock: if _peer_state is not None and _peer_state.pc == pc: logger.info("Clearing global peer state due to connection failure") try: _peer_state.last_disconnect_reason = 
f"pc_state:{pc.connectionState}" except Exception: pass try: _last_peer_snapshot = { "event": "connectionstatechange", "state": pc.connectionState, "ice_state": getattr(pc, 'iceConnectionState', None), "received_video": getattr(_peer_state, 'received_video', False), "received_audio": getattr(_peer_state, 'received_audio', False), "incoming_frames": getattr(_peer_state, 'incoming_frames', 0), "incoming_first_frame_ts": getattr(_peer_state, 'incoming_first_frame_ts', None), "outbound_bind_method": getattr(_peer_state, 'outbound_bind_method', None), "outbound_sender_mid": getattr(_peer_state, 'outbound_sender_mid', None), "timestamp": time.time(), } except Exception: _last_peer_snapshot = {"event": "connectionstatechange", "state": pc.connectionState} # Clear outbound video source to prevent hanging on retry if _peer_state.outbound_video: _peer_state.outbound_video.clear_source() logger.info("Cleared outbound video source") _peer_state = None if pc.connectionState == "failed": try: await pc.close() logger.info("Closed failed peer connection") except Exception: pass @pc.on("iceconnectionstatechange") async def on_ice_state_change(): global _peer_state logger.info("ICE connection state: %s", pc.iceConnectionState) try: if _peer_state is not None: _peer_state.last_ice_state = pc.iceConnectionState except Exception: pass # Log detailed ICE failure diagnostics if pc.iceConnectionState in ("disconnected", "failed"): try: # Log ICE transport stats if available stats = await pc.getStats() ice_candidates = [] ice_pairs = [] for stat_id, stat in stats.items(): if hasattr(stat, 'type'): if stat.type == "local-candidate": ice_candidates.append(f"local:{getattr(stat, 'candidateType', '?')}:{getattr(stat, 'protocol', '?')}:{getattr(stat, 'address', '?')}:{getattr(stat, 'port', '?')}") elif stat.type == "remote-candidate": ice_candidates.append(f"remote:{getattr(stat, 'candidateType', '?')}:{getattr(stat, 'protocol', '?')}:{getattr(stat, 'address', '?')}:{getattr(stat, 'port', 
'?')}") elif stat.type == "candidate-pair": state = getattr(stat, 'state', '?') ice_pairs.append(f"pair:{state}:{getattr(stat, 'priority', '?')}") logger.warning(f"ICE {pc.iceConnectionState} - candidates: {len(ice_candidates)} pairs: {len(ice_pairs)}") if ice_candidates: logger.info(f"ICE candidates: {', '.join(ice_candidates[:10])}") # Limit to first 10 if ice_pairs: logger.info(f"ICE pairs: {', '.join(ice_pairs[:5])}") # Limit to first 5 except Exception as e: logger.debug(f"ICE stats collection failed: {e}") @pc.on("icegatheringstatechange") async def on_ice_gathering_change(): logger.info("ICE gathering state: %s", pc.iceGatheringState) @pc.on("icecandidate") async def on_ice_candidate(candidate): if candidate: logger.debug(f"ICE candidate: {candidate.candidate}") else: logger.info("ICE gathering complete (end-of-candidates)") @pc.on("track") def on_track(track): logger.info("Track received: %s", track.kind) if track.kind == "video": state_ref = _peer_state local = IncomingVideoTrack(track, state_ref) if state_ref is not None: try: state_ref.incoming_video_track = local except Exception: pass try: outbound_video.set_source(local) logger.info("Outbound video source bound to incoming video") except Exception as e: logger.error(f"video source assign error: {e}") if state_ref is not None: state_ref.last_disconnect_reason = f"video_source_assign_error:{e}" return async def _bind_outbound_sender(): bound_method = None sender_mid = None try: # If the outbound track is already bound, record and exit existing_sender = None for s in pc.getSenders(): if getattr(s, "track", None) is outbound_video: existing_sender = s break if existing_sender: bound_method = "existing_sender" sender_mid = getattr(existing_sender, "mid", None) stage("outbound_video_sender_already_bound") return transceiver = None for trans in pc.getTransceivers(): try: recv = getattr(trans, "receiver", None) if recv is not None and getattr(recv, "track", None) is track: transceiver = trans break except 
Exception: continue if transceiver and getattr(transceiver, "sender", None): sender = transceiver.sender result = sender.replaceTrack(outbound_video) if inspect.isawaitable(result): await result bound_method = "transceiver.replaceTrack" sender_mid = getattr(sender, "mid", None) stage("outbound_video_sender_bound_existing") else: sender = pc.addTrack(outbound_video) bound_method = "pc.addTrack" sender_mid = getattr(sender, "mid", None) stage("outbound_video_sender_added_fallback") except Exception as bind_exc: stage(f"outbound_video_sender_bind_failed: {bind_exc}", level="error") logger.error(f"Failed to bind outbound video sender: {bind_exc}") if state_ref is not None: state_ref.last_disconnect_reason = f"video_sender_bind_failed:{bind_exc}" return finally: if state_ref is not None: try: state_ref.outbound_bind_method = bound_method state_ref.outbound_sender_bind_ts = time.time() if sender_mid is not None: state_ref.outbound_sender_mid = sender_mid except Exception: pass if state_ref is not None: try: state_ref.outbound_video = outbound_video except Exception: pass asyncio.create_task(_bind_outbound_sender()) if state_ref is not None: try: state_ref.received_video = True except Exception: pass elif track.kind == "audio": local_a = IncomingAudioTrack(track) try: pc.addTrack(local_a) logger.info("Loopback processed audio track added") try: if _peer_state is not None: _peer_state.received_audio = True except Exception: pass except Exception as e: logger.error(f"audio addTrack error: {e}") # Ensure we both SEND avatar video and RECEIVE client camera by using a transceiver with sendrecv direction. # Prior implementation used addTrack (sendonly) which prevented inbound video track reception on some browsers, # leading to perpetual placeholder frames / black output. This explicit transceiver resolves that. 
        try:
            # Attempt to reuse an existing sender first to avoid duplicate binding errors
            existing_sender = None
            for s in pc.getSenders():
                trk = getattr(s, 'track', None)
                if trk and getattr(trk, 'kind', None) == 'video':
                    existing_sender = s
                    break
            if existing_sender:
                # Replace existing track only if different
                if existing_sender.track != outbound_video:
                    result = existing_sender.replaceTrack(outbound_video)
                    if inspect.isawaitable(result):
                        await result
                    stage("outbound_video_sender_replaced_existing")
                else:
                    stage("outbound_video_sender_prebound")
                if _peer_state is not None:
                    _peer_state.outbound_bind_method = "existing_sender"
                    _peer_state.outbound_sender_mid = getattr(existing_sender, 'mid', None)
                    _peer_state.outbound_sender_bind_ts = time.time()
            else:
                # No existing video sender; try transceiver path first
                try:
                    video_trans = pc.addTransceiver('video', direction='sendrecv')
                    stage("outbound_video_transceiver_created")
                    sender = getattr(video_trans, 'sender', None)
                    if sender is None:
                        raise RuntimeError('transceiver.sender missing')
                    result = sender.replaceTrack(outbound_video)
                    if inspect.isawaitable(result):
                        await result
                    stage("outbound_video_sender_bound")
                    try:
                        # Best-effort encoder tuning: cap bitrate at 300 kbps and
                        # request downscaled resolution; failures are ignored.
                        params = sender.getParameters()
                        if params and hasattr(params, 'encodings'):
                            if not params.encodings:
                                params.encodings = [{}]
                            for enc in params.encodings:
                                enc['maxBitrate'] = min(enc.get('maxBitrate', 300_000), 300_000)
                                enc.setdefault('scaleResolutionDownBy', 2.0)
                                enc.setdefault('degradationPreference', 'maintain-resolution')
                            sender.setParameters(params)
                    except Exception:
                        pass
                    if _peer_state is not None:
                        _peer_state.outbound_bind_method = "transceiver.replaceTrack"
                        _peer_state.outbound_sender_mid = getattr(sender, 'mid', None)
                        _peer_state.outbound_sender_bind_ts = time.time()
                except Exception as te:
                    stage(f"transceiver_path_failed: {te}", level='warning')
                    # Fallback to addTrack
                    try:
                        sender = pc.addTrack(outbound_video)
                        stage("outbound_video_added_fallback")
                        if _peer_state is not None:
                            _peer_state.outbound_bind_method = "pc.addTrack"
                            _peer_state.outbound_sender_mid = getattr(sender, 'mid', None)
                            _peer_state.outbound_sender_bind_ts = time.time()
                    except Exception as e2:
                        if 'Track already has a sender' in str(e2):
                            # Benign: treat as success (track was already bound earlier in this negotiation)
                            stage("outbound_video_add_already_bound_ignored")
                        else:
                            stage(f"outbound_video_add_failed: {e2}", level='error')
                            raise HTTPException(status_code=500, detail=f"outbound_video_setup: {e2}")
        except HTTPException:
            raise
        except Exception as e:
            stage(f"outbound_video_setup_unexpected: {e}", level='error')
            raise HTTPException(status_code=500, detail=f"outbound_video_setup: {e}")
        # Proactively create an audio transceiver (recvonly) so inbound audio is not blocked by lack of direction
        try:
            pc.addTransceiver('audio', direction='recvonly')
            stage("audio_transceiver_added")
        except Exception as e:
            stage(f"audio_transceiver_failed: {e}", level='warning')
        # Now apply the remote description (offer)
        try:
            desc = RTCSessionDescription(sdp=offer["sdp"], type=offer["type"])
            await pc.setRemoteDescription(desc)
            stage("remote_description_set")
        except Exception as e:
            # Invalid offer from client: tear down and surface a 400.
            stage(f"remote_description_failed: {e}", level="error")
            try:
                await pc.close()
            except Exception:
                pass
            if _peer_state is not None and getattr(_peer_state, 'pc', None) == pc:
                try:
                    _peer_state.last_disconnect_reason = f"remote_description_failed:{e}"
                except Exception:
                    pass
            _last_peer_snapshot = {
                "event": "remote_description_failed",
                "error": str(e),
            }
            _peer_state = None
            raise HTTPException(status_code=400, detail=f"Invalid SDP offer: {e}")
        # Create answer with error surfacing
        try:
            answer = await pc.createAnswer()
            stage("answer_created")
        except Exception as e:
            stage(f"createAnswer_failed: {e}", level="error")
            try:
                await pc.close()
            except Exception:
                pass
            if _peer_state is not None and getattr(_peer_state, 'pc', None) == pc:
                try:
                    _peer_state.last_disconnect_reason = f"createAnswer_failed:{e}"
                except Exception:
                    pass
            _last_peer_snapshot = {
                "event": "createAnswer_failed",
                "error": str(e),
            }
            _peer_state = None
            raise HTTPException(status_code=500, detail=f"createAnswer: {e}")
        # Avoid SDP munging to reduce negotiation fragility
        try:
            # Optionally prefer H264 for broader compatibility
            if PREFER_H264 and isinstance(answer.sdp, str):
                try:
                    answer = RTCSessionDescription(sdp=_prefer_codec(answer.sdp, 'video', 'H264'), type=answer.type)
                except Exception:
                    pass
            await pc.setLocalDescription(answer)
            stage("local_description_set")
        except Exception as e:
            stage(f"setLocalDescription_failed: {e}", level="error")
            try:
                await pc.close()
            except Exception:
                pass
            if _peer_state is not None and getattr(_peer_state, 'pc', None) == pc:
                try:
                    _peer_state.last_disconnect_reason = f"setLocalDescription_failed:{e}"
                except Exception:
                    pass
            _last_peer_snapshot = {
                "event": "setLocalDescription_failed",
                "error": str(e),
            }
            _peer_state = None
            raise HTTPException(status_code=500, detail=f"setLocalDescription: {e}")

        async def _sample_ice_loop(state_ref: PeerState):  # pragma: no cover diagnostic
            # Poll getStats() every 3s and keep a ring buffer of ICE summaries
            # on state_ref.ice_samples; stops once connected or closed/failed.
            try:
                while True:
                    await asyncio.sleep(3)
                    pc_local = state_ref.pc
                    if pc_local.connectionState in ("closed", "failed"):
                        break
                    try:
                        stats = await pc_local.getStats()
                        summary = {
                            'ts': time.time(),
                            'connectionState': pc_local.connectionState,
                            'iceState': pc_local.iceConnectionState,
                            'pairs': 0,
                            'succeeded_pairs': 0,
                            'nominated_pairs': 0,
                            'local_candidates': 0,
                            'remote_candidates': 0,
                        }
                        for sid, rep in stats.items():
                            tp = getattr(rep, 'type', None)
                            if tp == 'candidate-pair':
                                summary['pairs'] += 1
                                st = getattr(rep, 'state', None)
                                if st == 'succeeded':
                                    summary['succeeded_pairs'] += 1
                                if getattr(rep, 'nominated', False):
                                    summary['nominated_pairs'] += 1
                            elif tp == 'local-candidate':
                                summary['local_candidates'] += 1
                            elif tp == 'remote-candidate':
                                summary['remote_candidates'] += 1
                        samples = state_ref.ice_samples
                        if samples is not None:
                            samples.append(summary)
                            # Keep last 20 samples
                            if len(samples) > 20:
                                samples.pop(0)
                    except Exception as e:
                        logger.debug(f"ICE sample failed: {e}")
                    # Stop sampling if connected (we keep last snapshots)
                    if pc_local.connectionState == 'connected':
                        break
            except Exception:
                pass

        async def _ice_watchdog(state_ref: PeerState):  # pragma: no cover diagnostic
            try:
                # Wait 18s; if still 'checking' without any succeeded pair, close to force client retry logic
                await asyncio.sleep(18)
                pc_local = state_ref.pc
                if pc_local.iceConnectionState == 'checking' and pc_local.connectionState == 'connecting':
                    # Inspect latest sample to confirm lack of progress
                    last = state_ref.ice_samples[-1] if state_ref.ice_samples else {}
                    if last.get('succeeded_pairs', 0) == 0:
                        logger.warning('ICE watchdog: still checking after 18s with 0 succeeded pairs - closing PC to unblock client')
                        try:
                            await pc_local.close()
                        except Exception:
                            pass
            except Exception:
                pass

        _peer_state.ice_sampler_task = asyncio.create_task(_sample_ice_loop(_peer_state))
        _peer_state.ice_watchdog_task = asyncio.create_task(_ice_watchdog(_peer_state))
        stage("answer_ready_returning")
        payload = {"sdp": pc.localDescription.sdp, "type": pc.localDescription.type}
        if DEBUG_NEG:
            payload["negotiation_id"] = negotiation_id
        return payload


@router.get("/negotiations")
async def negotiations():
    """Return recent negotiation stage events and last peer snapshot.

    Useful when /webrtc/ice_stats shows inactive (active:false) to see how far
    the last negotiation progressed before failure.
    """
    try:
        return {
            "events": _negotiation_events[-50:],  # last 50 for brevity
            "last_peer_snapshot": _last_peer_snapshot,
            "active": _peer_state is not None,
        }
    except Exception as e:
        return {"error": str(e)}


@router.get("/ice_gather_test")
async def ice_gather_test():
    """Perform a standalone ICE gathering cycle (no media) to enumerate local candidates.

    This helps distinguish TURN credential / gathering failures from
    SDP / negotiation issues.
    """
    if not AIORTC_AVAILABLE:
        raise HTTPException(status_code=503, detail="aiortc unavailable")
    try:
        cfg = _ice_configuration()
        pc = RTCPeerConnection(configuration=cfg)
        # Force creation of audio+video transceivers; some stacks gather more
        # aggressively when media components exist vs. data-only.
        try:
            pc.addTransceiver('audio', direction='recvonly')
        except Exception:
            pass
        try:
            pc.addTransceiver('video', direction='recvonly')
        except Exception:
            pass
        # Create data channel to exercise SCTP as well
        try:
            pc.createDataChannel("probe")
        except Exception:
            pass
        offer = await pc.createOffer()
        await pc.setLocalDescription(offer)
        t0 = time.time()
        # Wait at least one loop tick even if state flips to complete instantly
        await asyncio.sleep(0.3)
        # Poll gathering state with an 8-second cap.
        while pc.iceGatheringState != 'complete' and (time.time() - t0) < 8.0:
            await asyncio.sleep(0.25)
        stats = await pc.getStats()
        summary = {
            'local_candidates': 0,
            'local_types': {},
            'elapsed_ms': int((time.time() - t0) * 1000),
            'gathering_state': pc.iceGatheringState,
            'ice_servers_supplied': [
                s.urls if isinstance(s.urls, list) else s.urls for s in cfg.iceServers
            ],
        }
        candidate_details = []
        for sid, rep in stats.items():
            tp = getattr(rep, 'type', None)
            if tp == 'local-candidate':
                summary['local_candidates'] += 1
                ctype = getattr(rep, 'candidateType', 'unknown')
                summary['local_types'][ctype] = summary['local_types'].get(ctype, 0) + 1
                if len(candidate_details) < 40:  # cap payload size
                    candidate_details.append({
                        'type': ctype,
                        'protocol': getattr(rep, 'protocol', None),
                        'address': getattr(rep, 'address', None),
                        'port': getattr(rep, 'port', None),
                        'foundation': getattr(rep, 'foundation', None),
                    })
        try:
            await pc.close()
        except Exception:
            pass
        summary['candidates'] = candidate_details
        if summary['local_candidates'] == 0:
            summary['note'] = 'No local candidates gathered. Possible TURN auth or interface enumeration failure.'
        return summary
    except Exception as e:
        return {"error": str(e)}


@router.get("/net_info")
async def net_info():
    """Enumerate local network interfaces & IPv4/IPv6 addresses to explain absence of host candidates."""
    import socket
    info = []
    try:
        # socket.getaddrinfo on hostname
        try:
            hn = socket.gethostname()
            host_addrs = list({ai[4][0] for ai in socket.getaddrinfo(hn, None) if ai and ai[4]})
        except Exception as e:
            host_addrs = [f"error:{e}"]
        # Iterate common interfaces via /sys/class/net (Linux in HF Spaces)
        sys_net = '/sys/class/net'
        if os.path.isdir(sys_net):
            for iface in os.listdir(sys_net):
                if iface.startswith('lo'):
                    continue  # skip loopback
                addrs = []
                try:
                    # Attempt IPv4 probe using dummy UDP socket bind trick
                    # (connect() to a public IP selects the outbound interface
                    # without sending packets).
                    s = socket.socket(socket.AF_INET, socket.SOCK_DGRAM)
                    try:
                        s.connect(('8.8.8.8', 80))
                        addrs.append(s.getsockname()[0])
                    except Exception:
                        pass
                    finally:
                        s.close()
                except Exception:
                    pass
                info.append({"iface": iface, "addresses": list(set(addrs))})
        return {"hostname_addrs": host_addrs, "ifaces": info}
    except Exception as e:
        return {"error": str(e)}


@router.get("/token")
async def mint_token():
    """Return a short-lived signed token that can be used as X-Auth-Token.

    Public endpoint; signature uses server-held API key, if configured.
    """
    if not API_KEY:
        raise HTTPException(status_code=400, detail="API key not configured")
    return {"token": _mint_token(), "ttl": TOKEN_TTL_SECONDS}


@router.post("/cleanup")
async def cleanup_peer(x_api_key: Optional[str] = Header(default=None), x_auth_token: Optional[str] = Header(default=None)):
    """Close the active peer connection (if any) and reset pipeline state."""
    # Accept either raw API key or signed auth token when enforcement enabled
    _check_api_key(x_api_key, token_val=x_auth_token)
    async with _peer_lock:
        global _peer_state
        if _peer_state is None:
            return {"status": "no_peer"}
        try:
            await _peer_state.pc.close()
        except Exception:
            pass
        # Clean up pipeline resources to prevent hang on reconnection
        try:
            from swap_pipeline import reset_pipeline
            reset_pipeline()
        except Exception as e:
            logger.warning(f"Pipeline reset failed: {e}")
        _peer_state = None
        return {"status": "closed"}


@router.get("/frame_counter")
async def frame_counter():
    """Expose outbound video diagnostics to aid in debugging blank/black feed issues.

    Returns
    -------
    active: bool - whether a peer exists
    frames_emitted: int | None - total frames sent out the outbound track
    placeholder_active: bool | None - whether placeholder pattern mode is still active
    placeholder_sent: int | None - number of placeholder frames emitted
    real_frames: int | None - relayed (non-placeholder) frames from source
    placeholder_frames: int | None - internally generated placeholder frames
    luma_last / luma_avg: float | None - last / rolling average luminance (0-255 BGR mean heuristic)
    relay_failures / relay_last_error - relay attempt error counts/last error
    source_bound: bool - whether outbound track has a source bound
    first_relay_ts: float | None - timestamp of first successful source frame relay
    bound_at: float | None - when set_source first succeeded
    """
    try:
        st = _peer_state
        if st is None:
            return {"active": False, "last": _last_peer_snapshot}
        pc = st.pc
        # Find outbound track
        # (duck-typed: identified by its private diagnostic attributes)
        ov = None
        try:
            for s in pc.getSenders():
                tr = getattr(s, 'track', None)
                if tr and getattr(tr, 'kind', None) == 'video' and hasattr(tr, '_placeholder_active') and hasattr(tr, '_real_frames'):
                    ov = tr
                    break
        except Exception:
            pass
        if ov is None:
            return {"active": True, "frames_emitted": None, "note": "outbound track not found"}
        # Compute rolling luma average
        luma_avg = None
        try:
            samples = getattr(ov, '_luma_samples', None)
            if samples:
                import numpy as _np
                luma_avg = float(_np.mean(samples))
        except Exception:
            luma_avg = None
        peer_meta = {
            "connection_state": getattr(st.pc, 'connectionState', None),
            "ice_state": getattr(st.pc, 'iceConnectionState', None),
            "received_video": getattr(st, 'received_video', False),
            "received_audio": getattr(st, 'received_audio', False),
            "incoming_frames": getattr(st, 'incoming_frames', 0),
            "incoming_first_frame_ts": getattr(st, 'incoming_first_frame_ts', None),
            "control_channel_ready": getattr(st, 'control_channel_ready', False),
            "last_connection_state": getattr(st, 'last_connection_state', None),
            "last_ice_state": getattr(st, 'last_ice_state', None),
            "incoming_track_bound": st.incoming_video_track is not None,
            "outbound_bind_method": getattr(st, 'outbound_bind_method', None),
            "outbound_sender_mid": getattr(st, 'outbound_sender_mid', None),
            "outbound_sender_bind_ts": getattr(st, 'outbound_sender_bind_ts', None),
        }
        return {
            "active": True,
            "frames_emitted": getattr(ov, '_frame_count', None),
            "placeholder_active": getattr(ov, '_placeholder_active', None),
            "placeholder_sent": getattr(ov, '_placeholder_sent', None),
            "real_frames": getattr(ov, '_real_frames', None),
            "placeholder_frames": getattr(ov, '_placeholder_frames', None),
            "luma_last": getattr(ov, '_luma_last', None),
            "luma_avg": luma_avg,
            "relay_failures": getattr(ov, '_relay_failures', None),
            "relay_last_error": getattr(ov, '_relay_last_error', None),
            "source_bound": getattr(ov, '_source', None) is not None,
            "bound_at": getattr(ov, '_bound_at', None),
            "first_relay_ts": getattr(ov, '_first_relay_ts', None),
            "peer": peer_meta,
        }
    except Exception as e:
        return {"active": False, "error": str(e)}
@router.get("/pipeline_stats")
async def pipeline_stats():
    """Return merged swap pipeline stats and live video track latency metrics."""
    try:
        pipeline = get_pipeline()
        base_stats = pipeline.get_performance_stats() if getattr(pipeline, 'loaded', False) else {}
        # Attempt to locate the active IncomingVideoTrack via peer senders
        track_stats = {}
        try:
            st = _peer_state
            if st is not None:
                pc = st.pc
                for sender in pc.getSenders():
                    tr = getattr(sender, 'track', None)
                    if tr and isinstance(tr, MediaStreamTrack) and getattr(tr, 'kind', None) == 'video':
                        # Heuristic: if it has our added attributes
                        for attr in [
                            '_last_latency_ms','_avg_latency_ms','_queue_wait_last_ms','_frames_passthrough',
                            '_frames_processed','_frames_dropped','_placeholder_active','_raw_frames_in'
                        ]:
                            if hasattr(tr, attr):
                                track_stats[attr.lstrip('_')] = getattr(tr, attr)
                        # Outbound diagnostics (if this is the outbound track)
                        for oattr, key in [
                            ('_relay_failures','relay_failures'),
                            ('_relay_last_error','relay_last_error'),
                            ('_relay_last_error_ts','relay_last_error_ts'),
                            ('_placeholder_sent','placeholder_frames'),
                            ('_placeholder_initial_ts','placeholder_initial_ts'),
                            ('_placeholder_deactivated_ts','placeholder_deactivated_ts'),
                        ]:
                            if hasattr(tr, oattr):
                                track_stats[key] = getattr(tr, oattr)
                        # Only the first matching video sender is inspected.
                        break
        except Exception as e:
            track_stats['error'] = f"track_stats: {e}"
        return {"pipeline": base_stats, "video_track": track_stats}
    except Exception as e:
        return {"error": str(e)}


@router.get("/ice_stats")
async def ice_stats():  # pragma: no cover diagnostic endpoint
    """Return the latest ICE sampling summaries collected for the active peer."""
    try:
        st = _peer_state
        if st is None:
            return {"active": False}
        samples = st.ice_samples or []
        latest = samples[-1] if samples else None
        return {
            'active': True,
            'connectionState': getattr(st.pc, 'connectionState', None),
            'iceState': getattr(st.pc, 'iceConnectionState', None),
            'samples': samples,
            'latest': latest,
        }
    except Exception as e:
        return {'active': False, 'error': str(e)}


# Optional: connection monitoring endpoint for diagnostics
if add_connection_monitoring is not None:
    try:
        # Provide a getter to reflect live _peer_state rather than a stale snapshot
        def _get_peer_state():
            return _peer_state
        add_connection_monitoring(router, _get_peer_state)
    except Exception:
        pass

# Force rebuild Thu Sep 25 13:03:20 EDT 2025

# ---------------- TURN Diagnostic Endpoints -----------------
# Narrowly scoped endpoints to inspect and probe TURN connectivity without
# exposing arbitrary command execution. These are safe to leave enabled in
# production; they redact credentials and impose short timeouts.


@router.get("/turn_config")
async def turn_config():
    """Return current TURN/STUN configuration summary (no network tests)."""
    try:
        cfg = _ice_configuration()
        turn_urls = []
        stun_urls = []
        for s in cfg.iceServers:
            urls = s.urls if isinstance(s.urls, list) else [s.urls]
            for u in urls:
                if isinstance(u, str):
                    # Note: 'turns:' also startswith 'turn', so secure TURN is grouped here.
                    if u.startswith('turn'):
                        turn_urls.append(u)
                    elif u.startswith('stun'):
                        stun_urls.append(u)
        return {
            "turn_urls": turn_urls,
            "stun_urls": stun_urls,
            "static_turn_configured": bool(TURN_URL and TURN_USER and TURN_PASS),
            "metered_api_key_present": bool(METERED_API_KEY),
            "metered_disabled": DISABLE_METERED,
            "force_relay": FORCE_RELAY,
            "prefer_h264": PREFER_H264,
        }
    except Exception as e:
        return {"error": str(e)}


@router.get("/turn_probe")
async def turn_probe():
    """Actively probe TURN endpoints for DNS, TCP (and TLS for turns) reachability.

    Returns per-URL diagnostics. Each probe uses short (<=3s) timeouts so the
    entire call returns quickly even if endpoints are unreachable.
    """
    import socket, ssl, urllib.parse
    cfg = _ice_configuration()
    # Collect unique TURN URLs (avoid duplicate probing)
    urls: list[str] = []
    for s in cfg.iceServers:
        _urls = s.urls if isinstance(s.urls, list) else [s.urls]
        for u in _urls:
            if isinstance(u, str) and u.startswith('turn') and u not in urls:
                urls.append(u)

    async def _probe(url: str):
        # Probe one TURN URL: DNS resolve -> TCP connect -> (turns only) TLS handshake.
        result: dict[str, object] = {"url": url}
        try:
            # Normalize to parse (replace turn(s): with scheme placeholder acceptable to urlparse)
            # We retain original scheme to decide TLS.
            scheme = 'turns' if url.startswith('turns:') else 'turn'
            # Convert to http/https just for parsing host/port path cleanly
            fake = url.replace('turn:', 'http://').replace('turns:', 'https://')
            parsed = urllib.parse.urlparse(fake)
            host = parsed.hostname
            port = parsed.port or (443 if scheme == 'turns' else 3478)
            result['host'] = host
            result['port'] = port
            dns_info: dict[str, object] = {}
            tcp_info: dict[str, object] = {}
            tls_info: dict[str, object] = {}
            if not host:
                result['error'] = 'parse_failed'
                return result
            loop = asyncio.get_running_loop()
            # DNS resolve
            try:
                t0 = time.perf_counter()
                addrs = await asyncio.wait_for(loop.getaddrinfo(host, port, type=socket.SOCK_STREAM), timeout=2.5)
                dns_info['latency_ms'] = (time.perf_counter() - t0) * 1000.0
                dns_info['resolved'] = True
                # Extract unique IPs
                ips = []
                for fam, socktype, proto, canon, sockaddr in addrs:
                    ip = sockaddr[0]
                    if ip not in ips:
                        ips.append(ip)
                dns_info['addresses'] = ips[:5]
            except Exception as e:
                dns_info['resolved'] = False
                dns_info['error'] = str(e)
            result['dns'] = dns_info
            # Skip further probes if DNS failed
            if not dns_info.get('resolved'):
                return result
            # TCP connect (first resolved address)
            # NOTE(review): socket is AF_INET but getaddrinfo may list an IPv6
            # address first, in which case connect_ex would fail — confirm or
            # filter addresses by family.
            # NOTE(review): blocking connect/handshake run on the event loop
            # thread; acceptable for a diagnostics endpoint with 3s timeouts.
            try:
                target_ip = dns_info['addresses'][0] if dns_info.get('addresses') else host
                t1 = time.perf_counter()
                sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
                sock.settimeout(3.0)
                err = sock.connect_ex((target_ip, port))
                if err == 0:
                    tcp_info['ok'] = True
                else:
                    tcp_info['ok'] = False
                    tcp_info['error_code'] = err
                tcp_info['latency_ms'] = (time.perf_counter() - t1) * 1000.0
                sock_ok = (err == 0)
                # TLS handshake if scheme turns and TCP succeeded
                if sock_ok and scheme == 'turns':
                    try:
                        ctx = ssl.create_default_context()
                        # TURN servers sometimes use certificates not matching host; allow override if needed
                        if os.getenv('MIRAGE_TURN_TLS_NO_VERIFY','0').lower() in ('1','true','yes','on'):
                            ctx.check_hostname = False
                            ctx.verify_mode = ssl.CERT_NONE
                        t2 = time.perf_counter()
                        tls_sock = ctx.wrap_socket(sock, server_hostname=host)
                        # perform handshake implicitly by wrap
                        tls_info['ok'] = True
                        tls_info['latency_ms'] = (time.perf_counter() - t2) * 1000.0
                        tls_sock.close()
                    except Exception as e:
                        tls_info['ok'] = False
                        tls_info['error'] = str(e)
                sock.close()
            except Exception as e:
                tcp_info['ok'] = False
                tcp_info['error'] = str(e)
            result['tcp_connect'] = tcp_info
            if tls_info:
                result['tls_handshake'] = tls_info
        except Exception as e:  # pragma: no cover - defensive
            result['error'] = str(e)
        return result

    probes = await asyncio.gather(*[_probe(u) for u in urls]) if urls else []
    return {
        "static_turn_configured": bool(TURN_URL and TURN_USER and TURN_PASS),
        "metered_api_key_present": bool(METERED_API_KEY),
        "metered_disabled": DISABLE_METERED,
        "force_relay": FORCE_RELAY,
        "turn_urls": urls,
        "probes": probes,
    }