Spaces:

omar721
/

janus-pro-api

Sleeping

App Files Files Community

omar721 committed 28 days ago

Commit

09aeaac

verified ·

1 Parent(s): 431b26d

update app.py

Browse files

Files changed (1) hide show

app.py +83 -48

app.py CHANGED Viewed

@@ -3,38 +3,61 @@ import requests
 import os
 import time
-# Configuration
 API_TOKEN = os.environ.get("HF_TOKEN", "")
 MODEL_NAME = "deepseek-ai/Janus-Pro-7B"
 API_URL = f"https://api-inference.huggingface.co/models/{MODEL_NAME}"
-headers = {"Authorization": f"Bearer {API_TOKEN}"}
 def query_janus_model(payload):
     """Send request to Hugging Face Inference API"""
     try:
-        response = requests.post(API_URL, headers=headers, json=payload, timeout=30)
         if response.status_code == 503:
-            return {"error": "Model is loading, please try again in 30-60 seconds..."}
         elif response.status_code != 200:
-            return {"error": f"API Error: {response.status_code} - {response.text}"}
         return response.json()
     except requests.exceptions.Timeout:
-        return {"error": "Request timeout - model might be loading"}
     except Exception as e:
-        return {"error": f"Connection error: {str(e)}"}
 def chat_with_janus(message, history):
     """Chat function for Janus-Pro model"""
-    if not API_TOKEN:
-        return "⚠️ Please add your Hugging Face token in Space Settings → Repository secrets → HF_TOKEN"
     # Prepare the payload
     payload = {
         "inputs": message,
         "parameters": {
-            "max_new_tokens": 300,
             "temperature": 0.7,
             "top_p": 0.9,
             "do_sample": True,
@@ -46,19 +69,23 @@ def chat_with_janus(message, history):
     }
     # Show loading message
-    yield "🔄 Processing your request... (Model might take 30-60 seconds to load)"
     # Query the model
     result = query_janus_model(payload)
     # Process the response
     if "error" in result:
-        yield f"❌ {result['error']}"
     elif isinstance(result, list) and len(result) > 0:
         if 'generated_text' in result[0]:
-            yield result[0]['generated_text']
         else:
-            yield str(result[0])
     elif isinstance(result, dict) and 'generated_text' in result:
         yield result['generated_text']
     else:
@@ -68,69 +95,75 @@ def clear_chat():
     """Clear chat history"""
     return [], []
-# Custom CSS for better appearance
-css = """
-.gradio-container {
-    background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
-}
-.chatbot {
-    background: white;
-    border-radius: 10px;
-}
-"""
 # Create the chat interface
-with gr.Blocks(theme=gr.themes.Soft(), css=css) as demo:
     gr.Markdown(
         """
         # 🚀 Janus-Pro-7B Chat API
-        **Multimodal AI Model** - Understanding & Generation Capabilities
-        *Note: First request may take 30-60 seconds while the model loads*
         """
     )
     with gr.Row():
         with gr.Column(scale=1):
-            gr.Markdown("### ℹ️ About Janus-Pro")
             gr.Markdown("""
-            - **Model**: Janus-Pro-7B by DeepSeek
-            - **Capabilities**: Text understanding & generation
             - **License**: MIT
-            - **Framework**: Unified multimodal transformer
             """)
         with gr.Column(scale=2):
             chatbot = gr.Chatbot(
-                label="Chat with Janus-Pro",
                 height=400,
-                show_copy_button=True
             )
             with gr.Row():
                 msg = gr.Textbox(
-                    label="Your message",
-                    placeholder="Type your message here... (Press Enter to send)",
                     scale=4,
-                    container=False
                 )
-                clear_btn = gr.Button("🗑️ Clear", scale=1)
             with gr.Row():
                 gr.Examples(
                     examples=[
-                        "Explain quantum computing in simple terms",
-                        "Write a short poem about artificial intelligence",
-                        "What are the benefits of renewable energy?",
-                        "How does machine learning work?"
                     ],
                     inputs=msg,
-                    label="Try these examples:"
                 )
     # Event handlers
     msg.submit(
-        fn=chat_with_janus,
         inputs=[msg, chatbot],
         outputs=chatbot
     ).then(
@@ -146,10 +179,12 @@ with gr.Blocks(theme=gr.themes.Soft(), css=css) as demo:
     gr.Markdown(
         """
         ---
-        **Tips**:
-        - Be specific in your questions for better responses
-        - The model excels at technical explanations and creative writing
-        - First message may be slow as the model loads
         """
     )

 import os
 import time
+# Get the token from environment variables
 API_TOKEN = os.environ.get("HF_TOKEN", "")
 MODEL_NAME = "deepseek-ai/Janus-Pro-7B"
 API_URL = f"https://api-inference.huggingface.co/models/{MODEL_NAME}"
+headers = {"Authorization": f"Bearer {API_TOKEN}"} if API_TOKEN else {}
+def check_token_setup():
+    """Check if token is properly set up"""
+    if not API_TOKEN:
+        return "❌ HF_TOKEN not found. Please add your Hugging Face token in Space Settings → Secrets → HF_TOKEN"
+    elif not API_TOKEN.startswith("hf_"):
+        return "❌ Invalid token format. Token should start with 'hf_'"
+    else:
+        return "✅ Token is properly configured!"
 def query_janus_model(payload):
     """Send request to Hugging Face Inference API"""
+    if not API_TOKEN:
+        return {"error": "No API token configured"}
     try:
+        response = requests.post(API_URL, headers=headers, json=payload, timeout=60)
         if response.status_code == 503:
+            return {"error": "🔄 Model is loading, please try again in 30-60 seconds..."}
+        elif response.status_code == 401:
+            return {"error": "🔐 Invalid API token. Please check your HF_TOKEN secret."}
+        elif response.status_code == 404:
+            return {"error": "❌ Model not found. The model might be temporarily unavailable."}
         elif response.status_code != 200:
+            return {"error": f"API Error {response.status_code}: {response.text}"}
         return response.json()
     except requests.exceptions.Timeout:
+        return {"error": "⏰ Request timeout - model might be loading"}
     except Exception as e:
+        return {"error": f"🔌 Connection error: {str(e)}"}
 def chat_with_janus(message, history):
     """Chat function for Janus-Pro model"""
+    # First check token setup
+    token_status = check_token_setup()
+    if "❌" in token_status:
+        yield token_status
+        return
+    # Show token status
+    yield "✅ Token configured! Processing your request..."
+    time.sleep(1)
     # Prepare the payload
     payload = {
         "inputs": message,
         "parameters": {
+            "max_new_tokens": 350,
             "temperature": 0.7,
             "top_p": 0.9,
             "do_sample": True,
     }
     # Show loading message
+    yield "🔄 Sending request to Janus-Pro-7B... (First time may take 30-60 seconds)"
     # Query the model
     result = query_janus_model(payload)
     # Process the response
     if "error" in result:
+        yield f"{result['error']}"
     elif isinstance(result, list) and len(result) > 0:
         if 'generated_text' in result[0]:
+            generated_text = result[0]['generated_text']
+            # Clean up the response
+            if generated_text.startswith(message):
+                generated_text = generated_text[len(message):].strip()
+            yield generated_text
         else:
+            yield f"📄 Response: {str(result[0])}"
     elif isinstance(result, dict) and 'generated_text' in result:
         yield result['generated_text']
     else:
     """Clear chat history"""
     return [], []
 # Create the chat interface
+with gr.Blocks(theme=gr.themes.Soft(), title="Janus-Pro-7B API") as demo:
     gr.Markdown(
         """
         # 🚀 Janus-Pro-7B Chat API
+        **Free API for DeepSeek's Multimodal AI Model**
+        *Understanding & Generation Capabilities*
         """
     )
+    # Token status display
+    token_status = gr.Markdown(check_token_setup())
     with gr.Row():
         with gr.Column(scale=1):
+            gr.Markdown("### 📋 Instructions")
             gr.Markdown("""
+            1. **First message may take 30-60 seconds** (model loading)
+            2. **Subsequent messages are faster**
+            3. **Be specific** for better responses
+            4. Model supports **technical explanations** and **creative writing**
+            """)
+            gr.Markdown("### ℹ️ Model Info")
+            gr.Markdown("""
+            - **Name**: Janus-Pro-7B
+            - **Developer**: DeepSeek AI
+            - **Type**: Multimodal (Text + Image)
             - **License**: MIT
             """)
         with gr.Column(scale=2):
             chatbot = gr.Chatbot(
+                label="💬 Chat with Janus-Pro",
                 height=400,
+                show_copy_button=True,
+                placeholder="Your conversation will appear here..."
             )
             with gr.Row():
                 msg = gr.Textbox(
+                    label="Type your message",
+                    placeholder="Ask me anything... (Press Enter to send)",
                     scale=4,
+                    container=False,
+                    autofocus=True
                 )
+                clear_btn = gr.Button("🗑️ Clear Chat", scale=1)
             with gr.Row():
                 gr.Examples(
                     examples=[
+                        "Explain quantum computing like I'm 10 years old",
+                        "Write a short story about a robot learning to paint",
+                        "What are the main differences between AI and human intelligence?",
+                        "How do transformers work in machine learning?"
                     ],
                     inputs=msg,
+                    label="💡 Try these examples:"
                 )
     # Event handlers
+    def respond_and_clear(message, history):
+        for response in chat_with_janus(message, history):
+            yield response
     msg.submit(
+        fn=respond_and_clear,
         inputs=[msg, chatbot],
         outputs=chatbot
     ).then(
     gr.Markdown(
         """
         ---
+        **Note**: This is a free API using Hugging Face's Inference API. There might be rate limits for high usage.
+        **Troubleshooting**:
+        - If you get token errors, check your HF_TOKEN secret in Space Settings
+        - If model is loading, wait 30-60 seconds and try again
+        - For persistent issues, check the Space logs
         """
     )