Sync from GitHub via hub-sync
Files changed:
- api/v1/analyze.py (+2, -7)
- models/model_loader.py (+5, -0)
- services/image_service.py (+71, -0)
api/v1/analyze.py
CHANGED
@@ -42,7 +42,7 @@ from services.screenshot_service import (
 )
 from services.ela_service import generate_ela_base64
 from services.exif_service import extract_exif, rescore_exif_trust
-from services.image_service import classify_image, load_image_from_bytes
+from services.image_service import classify_image, load_image_from_bytes, apply_vlm_to_classification
 from services.llm_explainer import generate_llm_summary
 from schemas.common import ProcessingSummary, Verdict
 from services.artifact_detector import scan_artifacts

@@ -396,12 +396,7 @@ async def analyze_image(
     try:
         vlm_bd = generate_vlm_breakdown(pil, record_id=analysis_id)
         if vlm_bd:
-            clf = classify_image(
-                pil,
-                artifact_indicators=indicators,
-                exif=exif_summary,
-                vlm_breakdown=vlm_bd,
-            )
+            clf = apply_vlm_to_classification(clf, vlm_bd)
             stages.append("vlm_evidence_fusion")
     except Exception as e:  # noqa: BLE001
         logger.warning(f"VLM evidence fusion failed, continuing: {e}")
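Note on the analyze.py change: the removed block re-ran classification with the VLM breakdown passed in, so a successful VLM pass cost a second round of model inference. The new helper instead folds the VLM signal into the classification result that already exists. A rough sketch of how the route reads after this commit, assuming the earlier classify_image call takes the same keyword arguments the removed call did (minus vlm_breakdown); variable names are taken from the hunk context and the rest of the route is omitted:

    # Sketch only, not the full route body.
    clf = classify_image(pil, artifact_indicators=indicators, exif=exif_summary)  # single inference pass

    try:
        vlm_bd = generate_vlm_breakdown(pil, record_id=analysis_id)
        if vlm_bd:
            clf = apply_vlm_to_classification(clf, vlm_bd)  # fusion math only, no re-inference
            stages.append("vlm_evidence_fusion")
    except Exception as e:  # noqa: BLE001
        logger.warning(f"VLM evidence fusion failed, continuing: {e}")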
models/model_loader.py
CHANGED
@@ -39,6 +39,7 @@ class ModelLoader:
             cls._instance._efficientnet_detector = None
             cls._instance._ffpp_model = None
             cls._instance._ffpp_processor = None
+            cls._instance._ffpp_unavailable = False
             cls._instance._densenet_model = None
             cls._instance._densenet_meta = None
             cls._instance._densenet_unavailable = False

@@ -289,6 +290,8 @@ class ModelLoader:
             return None
         if self._ffpp_model is not None:
             return self._ffpp_model, self._ffpp_processor
+        if self._ffpp_unavailable:
+            return None

         configured_path = Path(settings.FFPP_MODEL_PATH)
         repo_root = Path(__file__).resolve().parent.parent.parent

@@ -306,6 +309,7 @@ class ModelLoader:
         else:
             tried = ", ".join(str(p) for p in candidates)
             logger.warning(f"FFPP ViT checkpoint not found. Tried: {tried} — skipping")
+            self._ffpp_unavailable = True
             return None

         try:

@@ -322,6 +326,7 @@ class ModelLoader:
             return self._ffpp_model, self._ffpp_processor
         except Exception as e:
             logger.warning(f"FFPP ViT load failed (continuing without it): {e}")
+            self._ffpp_unavailable = True
             return None

     # ---------- DenseNet121 face-GAN specialist ----------
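Note on the model_loader.py change: _ffpp_unavailable is a negative cache, mirroring the existing _densenet_unavailable flag. Before this commit a missing or broken FFPP ViT checkpoint was re-probed (and the warning re-logged) on every request; now the first failure is remembered and later calls return None immediately, while the positive cache (_ffpp_model) still short-circuits successful loads. A minimal standalone sketch of the same pattern; the class and parameter names below are illustrative, not the project's ModelLoader:

    # Standalone illustration of the negative-caching pattern.
    from pathlib import Path
    from typing import Callable, Optional


    class LazyModel:
        def __init__(self, checkpoint: Path, load_fn: Callable[[Path], object]):
            self._checkpoint = checkpoint
            self._load_fn = load_fn
            self._model: Optional[object] = None   # positive cache
            self._unavailable = False              # negative cache: set after the first failure

        def get(self) -> Optional[object]:
            if self._model is not None:            # loaded earlier: reuse it
                return self._model
            if self._unavailable:                  # failed earlier: skip probing and logging
                return None
            if not self._checkpoint.exists():
                self._unavailable = True           # remember the miss so it is reported once
                return None
            try:
                self._model = self._load_fn(self._checkpoint)
            except Exception:
                self._unavailable = True           # remember load errors too
                return None
            return self._model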
services/image_service.py
CHANGED
@@ -525,6 +525,77 @@ def classify_image(
     )


+def apply_vlm_to_classification(
+    clf: ImageClassification,
+    vlm_breakdown: "VLMBreakdown",
+) -> ImageClassification:
+    """Fold VLM evidence into an already-computed ImageClassification.
+
+    Recomputes only the fusion math — no model inference is repeated.
+    Returns clf unchanged if evidence_fusion is absent or VLM yields no signal.
+    """
+    if clf.evidence_fusion is None:
+        return clf
+
+    vlm_prob = _vlm_fake_probability(vlm_breakdown)
+    if vlm_prob is None:
+        return clf
+
+    components = dict(clf.evidence_fusion["components"])
+    weights = dict(clf.evidence_fusion["weights"])
+    is_video_frame = clf.evidence_fusion.get("is_video_frame", False)
+
+    components["vlm"] = vlm_prob
+    weights["vlm"] = settings.VLM_WEIGHT_FACE
+
+    total_w = sum(weights.values())
+    pre_gating_prob = (
+        sum(components[k] * weights[k] for k in weights) / total_w if total_w else 0.0
+    )
+    pre_gating_prob = max(0.0, min(1.0, pre_gating_prob))
+
+    general_fake_prob = components.get("general")
+    ensemble_prob, gating_reason = _apply_hard_gating(
+        fake_prob=pre_gating_prob,
+        general_fake_prob=general_fake_prob,
+        artifacts=[],
+    )
+    ensemble_prob, synthetic_reason = _apply_synthetic_still_overrides(
+        fake_prob=ensemble_prob,
+        general_fake_prob=general_fake_prob,
+        is_video_frame=is_video_frame,
+    )
+
+    # Preserve artifact-based gating floor from the original classification
+    if clf.gating_applied and "gan_artifact" in clf.gating_applied:
+        ensemble_prob = max(ensemble_prob, settings.GATING_FAKE_FLOOR)
+
+    final_gating_reason = synthetic_reason or gating_reason or clf.gating_applied
+    label = "Fake" if ensemble_prob >= 0.5 else "Real"
+
+    logger.info(
+        f"VLM fusion applied: vlm_prob={vlm_prob:.3f} "
+        f"pre_gating={pre_gating_prob:.3f} -> {ensemble_prob:.3f} ({label})"
+    )
+
+    return ImageClassification(
+        label=label,
+        confidence=ensemble_prob,
+        all_scores={**clf.all_scores, "vlm_fake_prob": vlm_prob},
+        models_used=clf.models_used,
+        ensemble_method=clf.ensemble_method,
+        calibrator_applied=clf.calibrator_applied,
+        no_face_analysis=clf.no_face_analysis,
+        evidence_fusion={
+            **clf.evidence_fusion,
+            "components": components,
+            "weights": weights,
+            "pre_gating": pre_gating_prob,
+        },
+        gating_applied=final_gating_reason,
+    )
+
+
 def preprocess_and_classify(raw_bytes: bytes) -> Tuple[Image.Image, ImageClassification]:
     """Convenience: decode bytes → PIL → classify. Returns the PIL image too so
     downstream steps (heatmap, artifact scan) can reuse it.