Spaces:

Mr-HASSAN
/

testing

Paused

App Files Files Community

Mr-HASSAN committed on Nov 25, 2025

Commit

fa53bfa

verified ·

1 Parent(s): 3cb49a8

Update app.py

Browse files

Files changed (1) hide show

app.py +46 -32

app.py CHANGED Viewed

@@ -5,15 +5,10 @@ import google.generativeai as genai
 from ultralytics import YOLO
 import tempfile
 import torch
 # =============================
-# اختيار الجهاز (GPU / CPU)
-# =============================
-DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
-print(f"🚀 Using device: {DEVICE}")
-# =============================
-# إعداد مفتاح Gemini (مكتوب صريح في الكود)
 # =============================
 GEMINI_API_KEY = "AIzaSyAvm28ZnTMaZ1Jtg9sYM-EO4qlAN2W4BIQ"
@@ -31,7 +26,6 @@ SYSTEM_PROMPT = (
 )
 def fix_with_gemini(raw_text: str) -> str:
     if not raw_text:
         return ""
@@ -45,18 +39,18 @@ def fix_with_gemini(raw_text: str) -> str:
 # =============================
-# إعدادات YOLO + السرعة
 # =============================
 WEIGHTS_PATH = "best.pt"
 IMG_SIZE = 320
-CONF_THRESHOLD = 0.25  # خفضناها عشان يسوي ديتكشن أسهل
 # إعدادات تجميع الحروف
-MIN_STABLE_FRAMES = 1     # اعتبر الحرف من أول مرة للاستكشاف
-FRAME_SKIP = 1            # حلّل كل فريم (مع GPU تقدر تخليه 1)
-MAX_FRAMES = 1000         # حد أقصى للفريمات
-WORD_GAP_FRAMES = 10      # فجوة (بدون حروف) لنهاية الكلمة
 arabic_map = {
     "aleff": "ا",
@@ -93,21 +87,41 @@ arabic_map = {
     "la": "لا",
 }
-print("🔹 Loading YOLO model...")
-model = YOLO(WEIGHTS_PATH)
-# ننقل الموديل إلى كرت الشاشة لو موجود
-try:
-    model.to(DEVICE)
-    print("✅ YOLO model moved to", DEVICE)
-except Exception as e:
-    print("⚠️ تعذر نقل الموديل إلى الجهاز:", e)
-print("📚 Classes:", model.names)
 # =============================
-# ضغط الفيديو قبل المعالجة (دقة 360p تقريباً + تقليل FPS)
 # =============================
 def preprocess_video(input_path: str, target_width: int = 640, target_fps: int = 8) -> str:
@@ -131,7 +145,6 @@ def preprocess_video(input_path: str, target_width: int = 640, target_fps: int =
         frame_step = max(1, int(round(orig_fps / target_fps)))
         out_fps = orig_fps / frame_step
-    # ارتفاع النسخة 360p تقريباً حسب نسبة الأبعاد
     target_height = int(target_width * h / w)
     fd, tmp_path = tempfile.mkstemp(suffix=".mp4")
@@ -146,7 +159,6 @@ def preprocess_video(input_path: str, target_width: int = 640, target_fps: int =
         if not ret:
             break
-        # نأخذ كل frame_step فريم واحد فقط
         if frame_idx % frame_step == 0:
             resized = cv2.resize(frame, (target_width, target_height), interpolation=cv2.INTER_AREA)
             out.write(resized)
@@ -160,17 +172,19 @@ def preprocess_video(input_path: str, target_width: int = 640, target_fps: int =
 # =============================
-# معالجة فريم واحد (YOLO على GPU)
 # =============================
 def detect_frame(frame_bgr):
     frame_rgb = cv2.cvtColor(frame_bgr, cv2.COLOR_BGR2RGB)
     result = model.predict(
         frame_rgb,
         conf=CONF_THRESHOLD,
         imgsz=IMG_SIZE,
         verbose=False,
-        device=DEVICE  # هنا نحدد إنه يشتغل على cuda لو متوفر
     )[0]
     boxes = result.boxes
@@ -222,7 +236,7 @@ def extract_and_render(video_path: str):
     height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
     if fps <= 0:
-        fps = 8.0  # fallback
     out = cv2.VideoWriter(out_path, fourcc, fps, (width, height))
@@ -285,16 +299,16 @@ def extract_and_render(video_path: str):
 # =============================
-# Gradio واجهة كاملة
 # =============================
 def run(file):
     if file is None:
         return "لم يتم رفع فيديو", "", None
     video_path = file.name
-    # خطوة تسريع الفيديو قبل التحليل (360p + ~8fps)
     light_path = preprocess_video(video_path, target_width=640, target_fps=8)
     raw, processed_path = extract_and_render(light_path)
@@ -307,7 +321,7 @@ def run(file):
 with gr.Blocks() as demo:
-    gr.Markdown("## 🤟 ASL → Arabic (YOLO + Gemini) مع إعادة فيديو المعالجة 🎥 — نسخة GPU")
     inp = gr.File(label="ارفع فيديو الإشارة")
     raw = gr.Textbox(label="النص الخام", lines=3)

 from ultralytics import YOLO
 import tempfile
 import torch
+import spaces  # مهم لـ @spaces.GPU
 # =============================
+# إعداد مفتاح Gemini (حطه هنا)
 # =============================
 GEMINI_API_KEY = "AIzaSyAvm28ZnTMaZ1Jtg9sYM-EO4qlAN2W4BIQ"
 )
 def fix_with_gemini(raw_text: str) -> str:
     if not raw_text:
         return ""
 # =============================
+# إعدادات YOLO + متغيرات عامة
 # =============================
 WEIGHTS_PATH = "best.pt"
 IMG_SIZE = 320
+CONF_THRESHOLD = 0.25  # تخفيض للسهولة
 # إعدادات تجميع الحروف
+MIN_STABLE_FRAMES = 1
+FRAME_SKIP = 1
+MAX_FRAMES = 1000
+WORD_GAP_FRAMES = 10
 arabic_map = {
     "aleff": "ا",
     "la": "لا",
 }
+# هنستخدم موديل عالمي لكن نحمّله عند أول استخدام فقط
+yolo_model = None
+DEVICE = "cpu"
+def get_model():
+    """
+    Load the YOLO model once and try to move it to the GPU if one is available.
+
+    Intended to be called from inside a function decorated with @spaces.GPU,
+    after the GPU has actually been brought up.
+
+    Reads and updates the module-level globals ``yolo_model`` (the cached
+    model instance) and ``DEVICE`` ("cuda" or "cpu"), and returns the cached
+    model.
+    """
+    global yolo_model, DEVICE
+    # Lazy initialisation: the weights are only loaded on the first call.
+    if yolo_model is None:
+        print("🔹 Loading YOLO model...")
+        yolo_model = YOLO(WEIGHTS_PATH)
+        print("📚 Classes:", yolo_model.names)
+    # Re-check CUDA here (after the GPU has come up in Spaces)
+    if torch.cuda.is_available():
+        # Only attempt the move the first time CUDA is seen as available.
+        if DEVICE != "cuda":
+            # NOTE(review): DEVICE is switched to "cuda" before the move is
+            # attempted, so it stays "cuda" even if .to() raises below.
+            DEVICE = "cuda"
+            try:
+                yolo_model.to(DEVICE)
+                print("✅ YOLO model moved to cuda")
+            except Exception as e:
+                print("⚠️ تعذر نقل الموديل إلى cuda:", e)
+    else:
+        # NOTE(review): this branch runs (and prints) on every call while
+        # CUDA is unavailable; it does not move the model back to the CPU.
+        DEVICE = "cpu"
+        print("⚠️ CUDA غير متوفر، سيتم استخدام CPU.")
+    return yolo_model
 # =============================
+# ضغط الفيديو قبل المعالجة
 # =============================
 def preprocess_video(input_path: str, target_width: int = 640, target_fps: int = 8) -> str:
         frame_step = max(1, int(round(orig_fps / target_fps)))
         out_fps = orig_fps / frame_step
     target_height = int(target_width * h / w)
     fd, tmp_path = tempfile.mkstemp(suffix=".mp4")
         if not ret:
             break
         if frame_idx % frame_step == 0:
             resized = cv2.resize(frame, (target_width, target_height), interpolation=cv2.INTER_AREA)
             out.write(resized)
 # =============================
+# معالجة فريم واحد
 # =============================
 def detect_frame(frame_bgr):
+    model = get_model()  # نتأكد الموديل جاهز وعلى الجهاز الصحيح
     frame_rgb = cv2.cvtColor(frame_bgr, cv2.COLOR_BGR2RGB)
     result = model.predict(
         frame_rgb,
         conf=CONF_THRESHOLD,
         imgsz=IMG_SIZE,
         verbose=False,
+        device=DEVICE,  # cuda أو cpu حسب المتاح
     )[0]
     boxes = result.boxes
     height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
     if fps <= 0:
+        fps = 8.0
     out = cv2.VideoWriter(out_path, fourcc, fps, (width, height))
 # =============================
+# Gradio + @spaces.GPU
 # =============================
+@spaces.GPU  # هذا اللي يرضي Hugging Face ويشغّل GPU on demand
 def run(file):
     if file is None:
         return "لم يتم رفع فيديو", "", None
     video_path = file.name
     light_path = preprocess_video(video_path, target_width=640, target_fps=8)
     raw, processed_path = extract_and_render(light_path)
 with gr.Blocks() as demo:
+    gr.Markdown("## 🤟 ASL → Arabic (YOLO + Gemini) — نسخة GPU على Hugging Face Spaces")
     inp = gr.File(label="ارفع فيديو الإشارة")
     raw = gr.Textbox(label="النص الخام", lines=3)