Spaces:

FEREYDOONRAH
/

FEREYDOONBER

Runtime error

App Files Files Community

FEREYDOONRAH commited on 11 days ago

Commit

3938eeb

verified ·

1 Parent(s): a1918b1

Update app.py

Browse files

Files changed (1) hide show

app.py +157 -128

app.py CHANGED Viewed

@@ -1,149 +1,178 @@
 import os
-import gc
-import torch
 import requests
 from io import BytesIO
-from PIL import Image
-from transformers import AutoProcessor, VisionEncoderDecoderModel, AutoTokenizer
 import gradio as gr
-# -----------------------
-# مدل‌های انتخابی
-# -----------------------
-# مدل فارسی (قابل اجرا روی CPU 16GB)
-MODEL_FARSI = "arxyzan/Qwen2-VL-2B-Instruct-Farsi"
-# مدل انگلیسی (قابل اجرا روی CPU 16GB)
-MODEL_ENGLISH = "microsoft/git-base-textcaps"
-# انتخاب مدل پیش‌فرض
-MODEL_NAME = MODEL_FARSI  # تغییر بده اگر انگلیسی خواستی
-DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
-# -----------------------
 # مدیریت حافظه
-# -----------------------
-def cleanup_memory():
-    try:
-        if torch.cuda.is_available():
-            torch.cuda.empty_cache()
-    except Exception:
-        pass
-    gc.collect()
-cleanup_memory()
-# -----------------------
-# بارگذاری مدل
-# -----------------------
-try:
-    print(f"در حال بارگذاری مدل: {MODEL_NAME}")
-    processor = AutoProcessor.from_pretrained(MODEL_NAME)
-    model = VisionEncoderDecoderModel.from_pretrained(MODEL_NAME)
-    tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
-    model.to(DEVICE)
-    print("✅ مدل با موفقیت بارگذاری شد!")
-    MODEL_LOADED = True
-except Exception as e:
-    print(f"❌ خطا در بارگذاری مدل: {e}")
-    MODEL_LOADED = False
-# -----------------------
-# توابع کمکی
-# -----------------------
-def _is_garbage_text(s: str) -> bool:
-    if not s or len(s.strip()) <= 2:
-        return True
-    return False
-def _strip_prompt_echo(generated_text: str, prompt: str) -> str:
-    if not generated_text:
-        return ""
-    if not prompt:
-        return generated_text.strip()
-    if generated_text.startswith(prompt):
-        return generated_text[len(prompt):].strip(" :.-\n\t")
-    return generated_text.strip()
-# -----------------------
-# تابع پردازش تصویر
-# -----------------------
-def process_image(image_url: str, prompt_text: str):
-    cleanup_memory()
-    if not MODEL_LOADED:
-        return "❌ مدل بارگذاری نشده است."
-    if not image_url or not image_url.strip():
-        return "❌ لطفاً آدرس تصویر را وارد کنید."
-    if not image_url.startswith("http"):
-        return "❌ آدرس تصویر باید با http یا https شروع شود."
-    # دانلود تصویر
     try:
-        response = requests.get(image_url, timeout=25)
-        response.raise_for_status()
-        image = Image.open(BytesIO(response.content))
-        if image.mode != "RGB":
-            image = image.convert("RGB")
     except Exception as e:
-        return f"❌ خطا در دانلود یا باز کردن تصویر: {e}"
-    # پردازش تصویر
-    try:
-        inputs = processor(images=image, return_tensors="pt").to(DEVICE)
-    except Exception as e:
-        return f"❌ پردازش تصویر با processor ممکن نیست: {e}"
-    # اگر پرامپت موجود است، decoder_input_ids بساز
-    decoder_input_ids = None
-    full_prompt = None
-    if prompt_text and prompt_text.strip():
-        full_prompt = prompt_text.strip()
-        try:
-            tok = tokenizer(full_prompt, return_tensors="pt")
-            decoder_input_ids = tok.input_ids.to(DEVICE)
-        except Exception as e:
-            return f"❌ خطا در توکنایز پرامپت: {e}"
-    # تولید متن
     try:
-        if decoder_input_ids is not None:
-            outputs = model.generate(**inputs, decoder_input_ids=decoder_input_ids,
-                                     max_new_tokens=80, num_beams=3, no_repeat_ngram_size=2)
-        else:
-            outputs = model.generate(**inputs, max_new_tokens=60, num_beams=3, no_repeat_ngram_size=2)
-    except Exception as e:
-        return f"❌ خطا در تولید متن: {e}"
-    # دیکد خروجی
     try:
-        text = tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
-        text = _strip_prompt_echo(text, full_prompt)
-        if _is_garbage_text(text):
-            return "⚠️ مدل خروجی مفیدی تولید نکرد. لطفاً پرامپت واضح یا تصویر دیگری وارد کنید."
     except Exception as e:
-        return f"❌ خطا در دیکد خروجی: {e}"
-    cleanup_memory()
-    return text
-# -----------------------
-# رابط Gradio
-# -----------------------
-with gr.Blocks(title="تبدیل تصویر به متن (CPU-friendly)") as demo:
-    gr.Markdown("# 🖼️ تبدیل تصویر به متن")
-    gr.Markdown("پرامپت را به فارسی یا انگلیسی وارد کنید تا خروجی تولید شود. اگر خالی باشد، مدل متن توصیفی ایجاد می‌کند.")
     with gr.Row():
-        gr.Markdown(f"**مدل:** {MODEL_NAME}")
     with gr.Row():
-        with gr.Column(scale=1):
-            image_url_input = gr.Textbox(label="آدرس تصویر (URL)", value="https://images.unsplash.com/photo-1541963463532-d68292c34b19?w=400")
-            prompt_input = gr.Textbox(label="پرامپت (اختیاری)", placeholder="مثال: این تصویر یک گربه در حال استراحت را نشان می‌دهد")
-            submit_btn = gr.Button("🚀 پردازش تصویر")
-        with gr.Column(scale=1):
-            output_box = gr.Textbox(label="نتیجه", lines=8, show_copy_button=True)
-    submit_btn.click(fn=process_image, inputs=[image_url_input, prompt_input], outputs=[output_box], show_progress="full")
 if __name__ == "__main__":
-    demo.launch(show_error=True, share=False)

 import os
+from huggingface_hub import login, whoami
+from transformers import pipeline
+from PIL import Image
 import requests
 from io import BytesIO
 import gradio as gr
+import torch
 # مدیریت حافظه
+torch.cuda.empty_cache() if torch.cuda.is_available() else None
+# خواندن توکن
+HF_TOKEN = os.environ.get('bermuda')
+# بررسی اتصال
+connection_status = "🔒 حالت عمومی"
+if HF_TOKEN:
     try:
+        login(token=HF_TOKEN)
+        user_info = whoami()
+        connection_status = f"✅ متصل به: {user_info['name']}"
+        print(connection_status)
     except Exception as e:
+        connection_status = f"⚠️ خطا در اتصال: {e}"
+        print(connection_status)
+print("📥 در حال بارگیری بهترین مدل چندزبانه برای CPU...")
+# بهترین انتخاب برای CPU + چندزبانگی
+BEST_MODEL = "microsoft/git-large"  # 🏆 برنده نهایی
+try:
+    print(f"🔍 بارگیری: {BEST_MODEL}")
+    pipe = pipeline(
+        "image-to-text",
+        model=BEST_MODEL,
+        device=-1,  # CPU
+        torch_dtype=torch.float32
+    )
+    print("✅ مدل با موفقیت بارگیری شد!")
+    model_loaded = True
+except Exception as e:
+    print(f"❌ خطا در بارگیری: {e}")
+    # جایگزین
     try:
+        BEST_MODEL = "Salesforce/blip2-opt-2.7b"
+        pipe = pipeline("image-to-text", model=BEST_MODEL, device=-1)
+        model_loaded = True
+        print(f"✅ مدل جایگزین {BEST_MODEL} بارگیری شد!")
+    except:
+        model_loaded = False
+def process_multilingual(image_url, instruction_text, language):
+    """پردازش چندزبانه"""
+    if not model_loaded:
+        return "❌ مدل بارگیری نشده است"
     try:
+        if not image_url.startswith('http'):
+            return "❌ آدرس تصویر نامعتبر"
+        # دانلود تصویر
+        response = requests.get(image_url, timeout=30)
+        image = Image.open(BytesIO(response.content))
+        if image.mode != 'RGB':
+            image = image.convert('RGB')
+        print(f"🌍 پردازش به زبان: {language}")
+        # ساخت دستور با توجه به زبان
+        if language == "فارسی":
+            prompt = instruction_text if instruction_text.strip() else "این تصویر را توصیف کن"
+        elif language == "English":
+            prompt = instruction_text if instruction_text.strip() else "Describe this image"
+        elif language == "العربية":
+            prompt = instruction_text if instruction_text.strip() else "صف هذه الصورة"
+        elif language == "中文":
+            prompt = instruction_text if instruction_text.strip() else "描述这张图片"
+        elif language == "Español":
+            prompt = instruction_text if instruction_text.strip() else "Describe esta imagen"
+        else:
+            prompt = instruction_text if instruction_text.strip() else "Describe this image"
+        # پردازش
+        result = pipe(image, prompt)
+        generated_text = result[0]['generated_text']
+        return f"**زبان: {language}**\n\n{generated_text}"
     except Exception as e:
+        return f"❌ خطا: {str(e)}"
+# رابط چندزبانه
+with gr.Blocks(title="پردازشگر چندزبانه تصویر", theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🌍 پردازشگر چندزبانه تصاویر")
+    gr.Markdown("**پشتیبانی از فارسی، انگلیسی، عربی، چینی و اسپانیایی**")
     with gr.Row():
+        gr.Markdown(f"**وضعیت:** {connection_status}")
+        gr.Markdown(f"**مدل:** {BEST_MODEL}")
+        gr.Markdown("**⚡ بهینه برای CPU**")
     with gr.Row():
+        with gr.Column():
+            image_url = gr.Textbox(
+                label="آدرس تصویر",
+                value="https://images.unsplash.com/photo-1541963463532-d68292c34b19?w=400",
+                lines=2
+            )
+            language = gr.Dropdown(
+                label="زبان خروجی",
+                choices=["فارسی", "English", "العربية", "中文", "Español"],
+                value="فارسی"
+            )
+            instruction_text = gr.Textbox(
+                label="دستور (اختیاری)",
+                placeholder="متن دستور را به زبان انتخاب شده وارد کنی��...",
+                value="",
+                lines=2
+            )
+            submit_btn = gr.Button("🚀 پردازش چندزبانه", variant="primary")
+        with gr.Column():
+            output_text = gr.Markdown(
+                label="نتیجه پردازش"
+            )
+    # اطلاعات مدل
+    with gr.Accordion("🏆 اطلاعات مدل", open=True):
+        gr.Markdown("""
+        **microsoft/git-large - بهترین برای CPU:**
+        - ✅ سبک و سریع (0.4B پارامتر)
+        - 🌍 پشتیبانی از ۱۰۰+ زبان
+        - ⚡ پردازش ۱۰-۳۰ ثانیه‌ای
+        - 🎯 کیفیت عالی در همه زبان‌ها
+        """)
+    # مثال‌های چندزبانه
+    with gr.Accordion("🌐 مثال‌های چندزبانه", open=False):
+        examples = gr.Examples(
+            examples=[
+                [
+                    "https://images.unsplash.com/photo-1541963463532-d68292c34b19?w=400",
+                    "این تصویر را با جزئیات توصیف کن",
+                    "فارسی"
+                ],
+                [
+                    "https://upload.wikimedia.org/wikipedia/commons/thumb/6/68/Orange_tabby_cat_sitting_on_fallen_leaves-Hisashi-01A.jpg/400px-Orange_tabby_cat_sitting_on_fallen_leaves-Hisashi-01A.jpg",
+                    "Describe this cat and its environment",
+                    "English"
+                ],
+                [
+                    "https://images.unsplash.com/photo-1506905925346-21bda4d32df4?w=400",
+                    "صف هذا المنظر الطبيعي",
+                    "العربية"
+                ],
+            ],
+            inputs=[image_url, instruction_text, language],
+            outputs=[output_text]
+        )
+    submit_btn.click(
+        fn=process_multilingual,
+        inputs=[image_url, instruction_text, language],
+        outputs=[output_text],
+        show_progress="full"
+    )
 if __name__ == "__main__":
+    demo.launch()