mokrane25 committed on
Commit 1f848f3 · verified · 1 Parent(s): c1a51db

Update app.py

Files changed (1)
  1. app.py +261 -60
app.py CHANGED
@@ -1,64 +1,265 @@
+# app.py
+
 import gradio as gr
-from huggingface_hub import InferenceClient
-
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
-
-
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-):
-    messages = [{"role": "system", "content": system_message}]
-
-    for val in history:
-        if val[0]:
-            messages.append({"role": "user", "content": val[0]})
-        if val[1]:
-            messages.append({"role": "assistant", "content": val[1]})
-
-    messages.append({"role": "user", "content": message})
-
-    response = ""
-
-    for message in client.chat_completion(
-        messages,
-        max_tokens=max_tokens,
-        stream=True,
-        temperature=temperature,
-        top_p=top_p,
-    ):
-        token = message.choices[0].delta.content
-
-        response += token
-        yield response
-
-
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
-demo = gr.ChatInterface(
-    respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)",
-        ),
-    ],
-)
+import os
+import traceback
+import asyncio
+from dotenv import load_dotenv
+from models.task_prompt import TaskPrompt
+import time
+from llama_index.core import Settings as LlamaSettings  # Import at top level
+from llama_index.llms.anthropic import Anthropic  # Import at top level
+from manager_agent import ManagerAgent  # Ensure this path is correct
+import concurrent.futures  # For running blocking code in a separate thread
+
+# Load environment variables from .env file
+load_dotenv()
+
+# --- Configuration ---
+LLM_MODEL = "claude-sonnet-4-20250514"
+
+# --- Global variables ---
+current_status = "Ready"
+llm_global = None
+manager_agent_global = None
+# Settings_global is not strictly needed as a global if LlamaSettings is imported directly
+
+# Thread pool executor for running blocking agent tasks
+thread_pool_executor = concurrent.futures.ThreadPoolExecutor(max_workers=os.cpu_count() or 1)
+
+
+# --- LlamaIndex LLM Initialization ---
+def initialize_components():
+    global llm_global, manager_agent_global
+
+    api_key = os.environ.get("ANTHROPIC_API_KEY")
+    if not api_key:
+        print("\n" + "="*60)
+        print("⚠️ ERROR: ANTHROPIC_API_KEY not found in environment variables!")
+        print("Please set your API key (e.g., in a .env file).")
+        print("="*60 + "\n")
+        return
+
+    try:
+        llm_global = Anthropic(
+            model=LLM_MODEL,
+            temperature=0.2,
+            max_tokens=4096
+        )
+        LlamaSettings.llm = llm_global  # Use the imported LlamaSettings directly
+        print(f"Successfully initialized LlamaIndex with Anthropic model: {LLM_MODEL} (temperature=0.2)")
+
+        manager_agent_global = ManagerAgent(
+            llm_global,
+            max_iterations=30,  # Keep this reasonable for testing
+            update_callback=update_status_callback
+        )
+        print("✅ ManagerAgent initialized successfully")
+
+    except Exception as e:
+        print(f"Error initializing Anthropic LLM or ManagerAgent: {e}")
+        traceback.print_exc()
+
+# --- Update callback function (called by ManagerAgent) ---
+def update_status_callback(message):
+    global current_status
+    # This function is called from the ManagerAgent's thread (potentially)
+    # or the ReAct agent's execution context.
+    # It needs to update the global variable, which the Gradio polling thread will pick up.
+    current_status = message
+    print(f"✅ UI_STATUS_UPDATE (via callback): {message}")  # Differentiate console log
+
+# --- Status retrieval function for Gradio polling ---
+def get_current_status_for_ui():
+    global current_status
+    timestamp = time.time()
+    return f"{current_status}<span style='display:none;'>{timestamp}</span>"
+
+# --- Gradio Interface Setup ---
+def create_gradio_interface():
+    if "ANTHROPIC_API_KEY" not in os.environ:
+        gr.Warning("ANTHROPIC_API_KEY not found in environment variables! ALITA may not function correctly.")
+
+    with gr.Blocks(theme="soft") as demo:
+        gr.Markdown("# ALITA")
+        gr.Markdown("ALITA is a self-learning AI agent that can search for information, analyze data, create tools, and orchestrate complex tasks.")
+
+        chatbot_component = gr.Chatbot(
+            label="Chat",
+            height=500,
+            show_label=False,
+            # type='messages'  # For Gradio 4.x+
+        )
+        gr.Markdown("Gradio version: " + gr.__version__ + " (Chatbot type defaults to 'tuples' for older versions. Consider `type='messages'` for newer Gradio if issues persist with chat display).")
+
+
+        with gr.Row():
+            message_textbox = gr.Textbox(
+                placeholder="Type your message here...",
+                scale=7,
+                show_label=False,
+                container=False
+            )
+
+        gr.Examples(
+            examples=[
+                "🔍 Search for information on artificial intelligence",
+                "📊 Analyze technology market trends",
+                "⚡ Create a script to automate a repetitive task",
+                "🌐 Find open source resources for machine learning",
+            ],
+            inputs=message_textbox,
+        )
+
+        status_box_component = gr.Textbox(
+            label="Agent Status",
+            value=get_current_status_for_ui(),
+            interactive=False,
+            # elem_id="status_box_alita"  # For potential direct JS manipulation if desperate (avoid)
+        )
 
+        def add_user_msg(user_input_text, chat_history_list):
+            if not user_input_text.strip():
+                return gr.update(), chat_history_list
+            # For older Gradio, history is a list of [user_msg, bot_msg] tuples
+            chat_history_list.append((user_input_text, None))
+            return gr.update(value=""), chat_history_list
 
+        async def generate_bot_reply(chat_history_list):
+            if not chat_history_list or chat_history_list[-1][0] is None:
+                # This case should ideally not be reached if add_user_msg works correctly
+                yield chat_history_list
+                return
+
+            user_message = chat_history_list[-1][0]
+
+            if manager_agent_global is None or LlamaSettings.llm is None:
+                # This update_status_callback will set current_status.
+                # The polling mechanism (continuous_status_updater) should pick it up.
+                update_status_callback("⚠️ Error: Agent or LLM not initialized. Check API key and logs.")
+                # For older Gradio, update the last tuple's second element
+                chat_history_list[-1] = (chat_history_list[-1][0], "❌ Critical Error: ALITA is not properly initialized. Please check server logs and API key.")
+                yield chat_history_list
+                return
+
+            try:
+                print(f"\n🤖 GRADIOLOG: Processing user message: '{user_message[:100]}{'...' if len(user_message) > 100 else ''}'")
+                update_status_callback(f"💬 Processing: '{user_message[:50]}{'...' if len(user_message) > 50 else ''}'")
+                await asyncio.sleep(0.01)  # Allow UI to briefly update with "Processing..."
+
+                task_prompt = TaskPrompt(text=user_message)
+
+                update_status_callback("🔄 Analyzing request and determining optimal workflow...")
+                await asyncio.sleep(0.01)  # Allow UI to briefly update
+
+                # Run the blocking manager_agent_global.run_task in a separate thread
+                loop = asyncio.get_event_loop()
+                response_text_from_agent = await loop.run_in_executor(
+                    thread_pool_executor,
+                    manager_agent_global.run_task,  # The function to run
+                    task_prompt  # Arguments to the function
+                )
+                # By this point, run_task has completed, and all its internal
+                # calls to update_status_callback (via send_update) should have occurred.
+                # The polling mechanism should have picked up these changes.
+
+                update_status_callback("✨ Generating final response stream...")
+                await asyncio.sleep(0.01)
+                final_bot_response = response_text_from_agent
+
+                words = final_bot_response.split()
+                accumulated_response_stream = ""
+                total_words = len(words)
+
+                # Initialize the bot's part of the message in history for older Gradio
+                current_user_message = chat_history_list[-1][0]
+                chat_history_list[-1] = (current_user_message, "")
+
+
+                if not words:
+                    chat_history_list[-1] = (current_user_message, final_bot_response.strip())
+                    yield chat_history_list
+                else:
+                    for i, word in enumerate(words):
+                        accumulated_response_stream += word + " "
+                        # These status updates are for the streaming part;
+                        # the agent's internal updates should have already happened.
+                        if total_words > 0:  # Avoid division by zero
+                            if i == total_words // 4: update_status_callback("🔄 Streaming response (25%)...")
+                            elif i == total_words // 2: update_status_callback("🔄 Streaming response (50%)...")
+                            elif i == (total_words * 3) // 4: update_status_callback("🔄 Streaming response (75%)...")
+
+                        if i % 3 == 0 or i == len(words) - 1:
+                            chat_history_list[-1] = (current_user_message, accumulated_response_stream.strip())
+                            yield chat_history_list
+                            await asyncio.sleep(0.01)  # For streaming effect
+
+                # Ensure the final complete response is set
+                if chat_history_list[-1][1] != final_bot_response.strip():
+                    chat_history_list[-1] = (current_user_message, final_bot_response.strip())
+                    yield chat_history_list
+
+                print("✅ GRADIOLOG: Task processing and streaming completed.")
+                update_status_callback("✅ Ready for your next request")
+
+            except Exception as e:
+                error_message_for_ui = f"❌ Gradio/Agent Error: {str(e)}"
+                print(f"\n🚨 GRADIOLOG: Error in generate_bot_reply: {e}")
+                traceback.print_exc()
+                update_status_callback(f"❌ Error: {str(e)[:100]}...")
+                chat_history_list[-1] = (chat_history_list[-1][0], error_message_for_ui)
+                yield chat_history_list
+
+        message_textbox.submit(
+            add_user_msg,
+            inputs=[message_textbox, chatbot_component],
+            outputs=[message_textbox, chatbot_component],
+            show_progress="hidden",  # Gradio 3.x might not have this; can be ignored
+        ).then(
+            generate_bot_reply,
+            inputs=[chatbot_component],
+            outputs=[chatbot_component],
+            api_name=False,  # Good practice
+            # show_progress="hidden",  # Gradio 3.x might not have this
+        )
+
+        async def continuous_status_updater(update_interval_seconds=0.3):  # Slightly faster poll
+            """Continuously yields status updates for the status_box_component."""
+            print("GRADIOLOG: Starting continuous_status_updater loop.")
+            while True:
+                # print(f"POLL: Fetching status: {current_status}")  # DEBUG: very verbose
+                yield get_current_status_for_ui()
+                await asyncio.sleep(update_interval_seconds)
+
+        demo.load(continuous_status_updater, inputs=None, outputs=status_box_component)
+        print("GRADIOLOG: Continuous status updater loaded.")
+    return demo
+
+# Initialize LLM and Agent components
+initialize_components()
+
+# --- Launch the Application ---
 if __name__ == "__main__":
-    demo.launch()
+    print(f"Gradio version: {gr.__version__}")
+
+    print("🚀 Starting Gradio ALITA Chat Application...")
+    alita_interface = create_gradio_interface()
+
+    try:
+        alita_interface.launch(
+            share=False,
+            server_name="127.0.0.1",
+            server_port=6126,
+            show_error=True,
+            # debug=True  # Can be helpful
+        )
+    except KeyboardInterrupt:
+        print("\n👋 Application stopped by user")
+    except Exception as e:
+        print(f"\n❌ Error launching application: {e}")
+        traceback.print_exc()
+    finally:
+        print("Shutting down thread pool executor...")
+        thread_pool_executor.shutdown(wait=True)  # Clean up threads
+
+    print("✅ Gradio application stopped.")