Spaces:

dreamlessx
/

LandmarkDiff

Running

App Files Files Community

dreamlessx committed 13 days ago

Commit

92264a1

verified ·

1 Parent(s): 30cc2b8

Update landmarkdiff/morphometry.py to v0.3.2

Browse files

Files changed (1) hide show

landmarkdiff/morphometry.py +342 -0

landmarkdiff/morphometry.py ADDED Viewed

	@@ -0,0 +1,342 @@

+"""Nasal morphometry and facial symmetry evaluation.
+Geometric evaluation metrics derived from Varghaei et al. (2025),
+adapted for evaluating surgical prediction outputs.
+Computes five nasal ratios plus bilateral facial symmetry from
+MediaPipe 478-point landmarks, enabling interpretable clinical
+quality assessment beyond perceptual metrics (LPIPS, FID).
+Usage::
+    from landmarkdiff.morphometry import NasalMorphometry, FacialSymmetry
+    morph = NasalMorphometry()
+    ratios = morph.compute(landmarks_478)
+    sym = FacialSymmetry()
+    score = sym.compute(landmarks_478)
+"""
+from __future__ import annotations
+import logging
+from dataclasses import dataclass
+import numpy as np
+logger = logging.getLogger(__name__)
# Landmark indices into the MediaPipe face mesh (478-point variant).
# Reference: https://github.com/google/mediapipe/blob/master/mediapipe/modules/face_geometry/data/canonical_face_model_uv_visualization.png
# NOTE(review): LEFT/RIGHT presumably follow the canonical mesh layout as
# seen in the image -- confirm against the reference picture before relying
# on anatomical (subject-side) laterality.

# Nose
NOSE_TIP = 1
GLABELLA = 168
LEFT_NOSTRIL = 98
RIGHT_NOSTRIL = 327

# Eye corners
LEFT_INNER_EYE = 133
RIGHT_INNER_EYE = 362
LEFT_OUTER_EYE = 33
RIGHT_OUTER_EYE = 263

# Face outline
LEFT_CHEEK = 234
RIGHT_CHEEK = 454
FOREHEAD = 10
CHIN = 152
@dataclass
class NasalRatios:
    """Container for the five nasal ratios of Varghaei et al. (2025).

    Attributes:
        alar_intercanthal: Alar width divided by intercanthal distance.
            Ideal is about 1.0 (nose as wide as the gap between the eyes).
        alar_face_width: Alar width divided by face width.
            Ideal is about 0.20 (nose spans one fifth of the face).
        nose_length_face_height: Nose length divided by face height,
            i.e. the vertical extent of the nose relative to the face.
        tip_midline_deviation: Horizontal distance of the nose tip from
            the facial midline, as a fraction of face width. Lower is better.
        nostril_vertical_asymmetry: Height difference between the two
            nostrils, as a fraction of face height. Lower is better.
    """

    alar_intercanthal: float = 0.0
    alar_face_width: float = 0.0
    nose_length_face_height: float = 0.0
    tip_midline_deviation: float = 0.0
    nostril_vertical_asymmetry: float = 0.0

    def improvement_score(self, reference: NasalRatios) -> dict[str, bool]:
        """Report, per metric, whether ``self`` beats ``reference`` (pre-op).

        The two ratios with an anthropometric ideal count as improved when
        ``self`` lies strictly closer to that ideal than ``reference`` does.
        The deviation and asymmetry metrics count as improved when they are
        strictly smaller. ``nose_length_face_height`` has no ideal defined
        here and is therefore not part of the result.
        """

        def nearer_to(target: float, field_name: str) -> bool:
            own_gap = abs(getattr(self, field_name) - target)
            ref_gap = abs(getattr(reference, field_name) - target)
            return own_gap < ref_gap

        return {
            "alar_intercanthal": nearer_to(1.0, "alar_intercanthal"),
            "alar_face_width": nearer_to(0.20, "alar_face_width"),
            # No ideal for these two: smaller simply means better.
            "tip_midline_deviation": (
                self.tip_midline_deviation < reference.tip_midline_deviation
            ),
            "nostril_vertical_asymmetry": (
                self.nostril_vertical_asymmetry
                < reference.nostril_vertical_asymmetry
            ),
        }

    def to_dict(self) -> dict[str, float]:
        """Return the five ratios as a plain dict keyed by attribute name."""
        ordered_names = (
            "alar_intercanthal",
            "alar_face_width",
            "nose_length_face_height",
            "tip_midline_deviation",
            "nostril_vertical_asymmetry",
        )
        return {name: getattr(self, name) for name in ordered_names}
class NasalMorphometry:
    """Compute nasal morphometric ratios from MediaPipe landmarks.

    Five geometric features following Varghaei et al. (2025):

    1. Alar width / intercanthal distance (ideal ~1.0)
    2. Alar width / face width (ideal ~0.20)
    3. Nose length / face height
    4. Tip midline deviation (normalized)
    5. Nostril vertical asymmetry (normalized)
    """

    def compute(self, landmarks: np.ndarray) -> NasalRatios:
        """Compute all five nasal ratios.

        Args:
            landmarks: (N, 2) or (N, 3) array (or array-like) of MediaPipe
                landmarks. Must have at least 478 points. Uses only x, y.

        Returns:
            NasalRatios dataclass with computed values.

        Raises:
            IndexError: If ``landmarks`` is not 2-D or has too few rows to
                contain every landmark index used below.
        """
        # Convert to float64 up front. Integer pixel coordinates -- unsigned
        # ones in particular -- would otherwise wrap around in the
        # subtractions below and yield garbage distances.
        pts = np.asarray(landmarks, dtype=np.float64)[:, :2]  # x, y only

        # Key points
        nose_tip = pts[NOSE_TIP]
        left_nostril = pts[LEFT_NOSTRIL]
        right_nostril = pts[RIGHT_NOSTRIL]
        left_inner_eye = pts[LEFT_INNER_EYE]
        right_inner_eye = pts[RIGHT_INNER_EYE]
        left_cheek = pts[LEFT_CHEEK]
        right_cheek = pts[RIGHT_CHEEK]
        forehead = pts[FOREHEAD]
        chin = pts[CHIN]
        glabella = pts[GLABELLA]

        # Distances (cast to float for mypy compatibility). Every distance
        # used as a denominator is clamped to 1e-6 so that degenerate
        # (collapsed) landmarks cannot cause a division by zero.
        alar_width: float = float(np.linalg.norm(left_nostril - right_nostril))
        intercanthal: float = max(
            float(np.linalg.norm(left_inner_eye - right_inner_eye)), 1e-6
        )
        face_width: float = max(
            float(np.linalg.norm(left_cheek - right_cheek)), 1e-6
        )
        face_height: float = max(float(np.linalg.norm(forehead - chin)), 1e-6)
        nose_length: float = float(np.linalg.norm(glabella - nose_tip))

        # Facial midline: the vertical line halfway between the outer eye
        # corners (x coordinate only).
        midline_x = (pts[LEFT_OUTER_EYE][0] + pts[RIGHT_OUTER_EYE][0]) / 2

        return NasalRatios(
            alar_intercanthal=float(alar_width / intercanthal),
            alar_face_width=float(alar_width / face_width),
            nose_length_face_height=float(nose_length / face_height),
            tip_midline_deviation=float(
                abs(nose_tip[0] - midline_x) / face_width
            ),
            nostril_vertical_asymmetry=float(
                abs(left_nostril[1] - right_nostril[1]) / face_height
            ),
        )

    def compute_from_image(self, image: np.ndarray) -> NasalRatios | None:
        """Extract landmarks from image and compute ratios.

        Args:
            image: BGR uint8 image (H, W, 3).

        Returns:
            NasalRatios, or None if no face is detected or if ``mediapipe``
            or ``cv2`` cannot be imported.
        """
        # Both optional dependencies are handled the same way: a missing
        # package is logged and reported as "no result" instead of raising.
        try:
            import mediapipe as mp
        except ImportError:
            logger.warning("mediapipe required for landmark extraction")
            return None
        try:
            import cv2
        except ImportError:
            logger.warning("opencv-python (cv2) required for landmark extraction")
            return None

        # Convert before the face-mesh model is created so that an invalid
        # image fails fast.
        rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        with mp.solutions.face_mesh.FaceMesh(
            static_image_mode=True,
            max_num_faces=1,
            refine_landmarks=True,
            min_detection_confidence=0.5,
        ) as face_mesh:
            results = face_mesh.process(rgb)
            if not results.multi_face_landmarks:
                return None
            h, w = image.shape[:2]
            face = results.multi_face_landmarks[0]
            # The x/y values are scaled by image width/height to obtain
            # pixel coordinates.
            landmarks = np.array([(lm.x * w, lm.y * h) for lm in face.landmark])
            return self.compute(landmarks)
class FacialSymmetry:
    """Bilateral facial symmetry scoring.

    Measures deviation from perfect bilateral symmetry by reflecting
    left-side landmarks across the facial midline and computing
    distances to nearest right-side counterparts.
    Lower scores indicate greater symmetry.
    """

    def compute(
        self,
        landmarks: np.ndarray,
        left_eye_idx: int = LEFT_OUTER_EYE,
        right_eye_idx: int = RIGHT_OUTER_EYE,
    ) -> float:
        """Compute bilateral symmetry error.

        Args:
            landmarks: (N, 2) or (N, 3) array (or array-like). Uses only x, y.
            left_eye_idx: Landmark index for left outer eye corner.
            right_eye_idx: Landmark index for right outer eye corner.

        Returns:
            Mean nearest-neighbour distance between the mirrored left-side
            points and the right-side points (lower = more symmetric),
            normalized by the horizontal distance between the two eye
            corners. Note that 0.0 is also returned for degenerate input
            (eye corners share the same x, or one side of the midline has
            no points), so 0.0 does not always mean perfect symmetry.
        """
        # Convert to float64 up front. Integer pixel coordinates -- unsigned
        # ones in particular -- would otherwise wrap around in the sum and
        # difference below.
        pts = np.asarray(landmarks, dtype=np.float64)[:, :2]

        # Midline: vertical line halfway between the two eye corners.
        left_x = pts[left_eye_idx][0]
        right_x = pts[right_eye_idx][0]
        midline_x = (left_x + right_x) / 2
        iod = abs(left_x - right_x)
        if iod < 1e-6:
            return 0.0

        # Partition into left and right; points exactly on the midline
        # belong to neither side.
        left_pts = pts[pts[:, 0] < midline_x]
        right_pts = pts[pts[:, 0] > midline_x]
        if len(left_pts) == 0 or len(right_pts) == 0:
            return 0.0

        # Reflect left across midline (boolean indexing already produced a
        # fresh array; the copy keeps the intent explicit).
        reflected = left_pts.copy()
        reflected[:, 0] = 2 * midline_x - reflected[:, 0]

        # Nearest right-side neighbour for each reflected point. Only the
        # import is guarded, so errors raised by the query itself are never
        # mistaken for a missing SciPy.
        try:
            from scipy.spatial import KDTree
        except ImportError:
            # Fallback without SciPy: vectorised brute force over the full
            # (left x right) distance matrix.
            deltas = reflected[:, None, :] - right_pts[None, :, :]
            distances = np.linalg.norm(deltas, axis=2).min(axis=1)
        else:
            distances, _ = KDTree(right_pts).query(reflected)
        return float(np.mean(distances) / iod)

    def compute_from_image(self, image: np.ndarray) -> float | None:
        """Extract landmarks from image and compute symmetry.

        Args:
            image: BGR uint8 image (H, W, 3).

        Returns:
            Symmetry error, or None if no face is detected or if
            ``mediapipe`` or ``cv2`` cannot be imported.
        """
        # Both optional dependencies are handled the same way: a missing
        # package is logged and reported as "no result" instead of raising.
        try:
            import mediapipe as mp
        except ImportError:
            logger.warning("mediapipe required for landmark extraction")
            return None
        try:
            import cv2
        except ImportError:
            logger.warning("opencv-python (cv2) required for landmark extraction")
            return None

        # Convert before the face-mesh model is created so that an invalid
        # image fails fast.
        rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        with mp.solutions.face_mesh.FaceMesh(
            static_image_mode=True,
            max_num_faces=1,
            refine_landmarks=True,
            min_detection_confidence=0.5,
        ) as face_mesh:
            results = face_mesh.process(rgb)
            if not results.multi_face_landmarks:
                return None
            h, w = image.shape[:2]
            face = results.multi_face_landmarks[0]
            # The x/y values are scaled by image width/height to obtain
            # pixel coordinates.
            landmarks = np.array([(lm.x * w, lm.y * h) for lm in face.landmark])
            return self.compute(landmarks)
def compare_morphometry(
    pred_image: np.ndarray,
    input_image: np.ndarray,
    procedure: str = "rhinoplasty",
) -> dict:
    """Compare morphometric quality between prediction and input.

    Computes nasal ratios and symmetry for both images and reports
    which metrics improved. Useful for evaluating whether the predicted
    surgical output shows clinically meaningful improvement.

    Args:
        pred_image: Predicted output (BGR uint8).
        input_image: Original input (BGR uint8).
        procedure: Procedure label. It is copied into the result unchanged;
            it does not currently alter which metrics are computed.

    Returns:
        Dict with the keys 'procedure', 'input_ratios', 'pred_ratios',
        'input_symmetry', 'pred_symmetry', 'symmetry_improved' and
        'improvements'. Any value that could not be computed for an image
        (``compute_from_image`` returned None) is None, and so is every
        comparison that depends on it.
    """
    morph = NasalMorphometry()
    sym = FacialSymmetry()

    input_ratios = morph.compute_from_image(input_image)
    pred_ratios = morph.compute_from_image(pred_image)
    input_sym = sym.compute_from_image(input_image)
    pred_sym = sym.compute_from_image(pred_image)

    # Explicit None checks: "missing" must never be confused with a falsy
    # but valid value such as a symmetry error of exactly 0.0.
    have_ratios = input_ratios is not None and pred_ratios is not None
    have_symmetry = input_sym is not None and pred_sym is not None

    return {
        "procedure": procedure,
        "input_ratios": (
            input_ratios.to_dict() if input_ratios is not None else None
        ),
        "pred_ratios": (
            pred_ratios.to_dict() if pred_ratios is not None else None
        ),
        "input_symmetry": input_sym,
        "pred_symmetry": pred_sym,
        # Lower symmetry error is better, so "improved" means strictly lower.
        "symmetry_improved": pred_sym < input_sym if have_symmetry else None,
        "improvements": (
            pred_ratios.improvement_score(input_ratios) if have_ratios else None
        ),
    }