jesusgj committed on
Commit
892cc72
·
1 Parent(s): 80ef074

Modified files

Browse files
Files changed (1) hide show
  1. agent.py +251 -153
agent.py CHANGED
@@ -1,177 +1,275 @@
1
  import os
2
- import re
3
- import requests
4
- import serpapi
5
  import time
6
- from smolagents import CodeAgent, ToolCallingAgent, WebSearchTool, tool
7
- from smolagents import InferenceClientModel
 
 
 
 
 
 
 
 
8
  from dotenv import load_dotenv
9
- from markdownify import markdownify
10
  from requests.exceptions import RequestException
 
11
  from llama_index.core import VectorStoreIndex, download_loader
12
  from llama_index.core.schema import Document
13
- from youtube_transcript_api import YouTubeTranscriptApi
 
 
14
 
15
- search_cache = {}
16
- webpage_cache = {}
17
- MAX_RETRIES = 3
18
- INITIAL_DELAY = 1 # seconds
19
 
20
- def initialize_agent():
21
- # Load environment variables from .env file
 
 
 
 
 
 
 
 
22
  load_dotenv()
 
 
 
 
 
 
 
23
 
24
- # 1. Load the model
25
- # Make sure to set TOGETHER_API_KEY in your environment variables
26
- model_name = "mistralai/Mixtral-8x7B-Instruct-v0.1"
27
- try:
28
- model = InferenceClientModel(model_id=model_name, token=os.environ.get("TOGETHER_API_KEY"), provider="together")
29
- except Exception as e:
30
- print(f"Error loading model: {e}")
31
- model = None
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
32
 
33
- # 2. Define the tools
34
  @tool
35
  def query_webpage(url: str, query: str) -> str:
36
- """Queries a webpage at the given URL to find specific information and returns a concise answer.
 
 
 
 
 
37
 
38
- Args:
39
- url: The URL of the webpage to query.
40
- query: The specific question to ask about the content of the webpage.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
 
42
- Returns:
43
- A concise answer to the query based on the webpage's content, or an error message.
 
44
  """
45
- if (url, query) in webpage_cache:
46
- return webpage_cache[(url, query)]
47
-
48
- for i in range(MAX_RETRIES):
49
- try:
50
- BeautifulSoupWebReader = download_loader("BeautifulSoupWebReader")
51
- loader = BeautifulSoupWebReader()
52
- documents = loader.load_data(urls=[url])
53
- index = VectorStoreIndex.from_documents(documents)
54
- query_engine = index.as_query_engine()
55
- response = query_engine.query(query)
56
- webpage_cache[(url, query)] = str(response)
57
- return str(response)
58
-
59
- except Exception as e:
60
- if i < MAX_RETRIES - 1:
61
- delay = INITIAL_DELAY * (2 ** i)
62
- print(f"Error querying webpage: {str(e)}. Retrying in {delay} seconds...")
63
- time.sleep(delay)
64
- else:
65
- return f"An unexpected error occurred after multiple retries: {str(e)}"
66
 
 
67
  @tool
68
- def query_youtube_video(video_id: str, query: str) -> str:
69
- """Queries a YouTube video's transcript to find specific information and returns a concise answer.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
 
71
- Args:
72
- video_id: The ID of the YouTube video.
73
- query: The specific question to ask about the content of the video transcript.
 
 
 
 
 
 
 
 
 
74
 
75
- Returns:
76
- A concise answer to the query based on the video transcript, or an error message.
77
- """
78
- if (video_id, query) in webpage_cache: # Using webpage_cache for simplicity
79
- return webpage_cache[(video_id, query)]
80
-
81
- for i in range(MAX_RETRIES):
82
- try:
83
- transcript_list = YouTubeTranscriptApi.get_transcript(video_id)
84
- transcript_text = " ".join([t['text'] for t in transcript_list])
85
-
86
- documents = [Document(text=transcript_text)]
87
- index = VectorStoreIndex.from_documents(documents)
88
- query_engine = index.as_query_engine()
89
- response = query_engine.query(query)
90
- webpage_cache[(video_id, query)] = str(response)
91
- return str(response)
92
-
93
- except Exception as e:
94
- if i < MAX_RETRIES - 1:
95
- delay = INITIAL_DELAY * (2 ** i)
96
- print(f"Error querying YouTube video: {str(e)}. Retrying in {delay} seconds...")
97
- time.sleep(delay)
98
- else:
99
- return f"An unexpected error occurred after multiple retries: {str(e)}"
100
 
101
- @tool
102
- def google_search(query: str) -> str:
103
- """Searches Google for the given query and returns the results.
 
 
 
104
 
105
- Args:
106
- query: The query to search for.
107
 
108
- Returns:
109
- The search results, or an error message if the search fails.
110
- """
111
- if query in search_cache:
112
- return search_cache[query]
113
-
114
- for i in range(MAX_RETRIES):
115
- try:
116
- client = serpapi.Client(api_key=os.environ.get("SERPAPI_API_KEY"))
117
- results = client.search(q=query, engine="google")
118
- if "ai_overview" in results:
119
- ai_overview = results["ai_overview"]
120
- output = ""
121
- for block in ai_overview.get("text_blocks", []):
122
- if block["type"] == "paragraph":
123
- output += block["snippet"] + "\n\n"
124
- elif block["type"] == "heading":
125
- output += f"### {block['snippet']}\n\n"
126
- elif block["type"] == "list":
127
- for item in block["list"]:
128
- output += f"- **{item['title']}** {item['snippet']}\n"
129
- output += "\n"
130
- if "references" in ai_overview:
131
- output += "\n**References:**\n"
132
- for ref in ai_overview["references"]:
133
- output += f"- [{ref['title']}]({ref['link']})\n"
134
- search_cache[query] = output
135
- return output
136
- elif "organic_results" in results:
137
- result = str(results["organic_results"])
138
- search_cache[query] = result
139
- return result
140
- else:
141
- return "No results found."
142
- except Exception as e:
143
- if i < MAX_RETRIES - 1:
144
- delay = INITIAL_DELAY * (2 ** i)
145
- print(f"Error performing Google search: {str(e)}. Retrying in {delay} seconds...")
146
- time.sleep(delay)
147
- else:
148
- return f"Error performing Google search after multiple retries: {str(e)}"
149
-
150
- # 3. Define the agents
151
- if model:
152
- web_agent = ToolCallingAgent(
153
- tools=[WebSearchTool(), query_webpage, query_youtube_video, google_search],
154
- model=model,
155
- max_steps=10,
156
- name="web_search_agent",
157
- description="Runs web searches for you.",
158
- )
159
 
160
- manager_agent = CodeAgent(
161
- tools=[],
162
- model=model,
163
- managed_agents=[web_agent],
164
- additional_authorized_imports=["time", "numpy", "pandas", "requests", "serpapi", "llama_index", "beautifulsoup4", "markdownify", "lxml", "json", "urllib.parse", "youtube_transcript_api", "together"],
165
- instructions='''You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the a new line and the following template: FINAL ANSWER: [YOUR FINAL ANSWER]. YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
166
-
167
- To achieve the best results, follow these steps:
168
- 1. **Understand the Question:** Carefully read and analyze the user's question to identify the core task and any specific constraints (e.g., format, type of answer).
169
- 2. **Formulate a Plan:** Based on the question, devise a step-by-step plan. This might involve using web search, querying webpages, or analyzing YouTube videos. Consider what information is needed and which tool is best suited to obtain it.
170
- 3. **Execute Tools:** Prioritize using `WebSearchTool()` for general web searches. If `WebSearchTool()` fails, or if more specific, structured search results are required (e.g., for AI overviews or specific data points), then use `google_search` (SerpApi). Use `query_webpage` for detailed information extraction from specific URLs and `query_youtube_video` for YouTube transcript analysis. Be mindful of rate limits and use caching effectively.
171
- 4. **Synthesize Information:** Combine and process the information obtained from the tools to formulate a comprehensive answer. If the question requires specific data extraction, ensure accuracy.
172
- 5. **Format the Final Answer:** Adhere strictly to the specified FINAL ANSWER template. Ensure the answer type (number, string, comma-separated list) matches the question's requirement.
173
- 6. **Self-Correction:** If initial attempts fail or produce unsatisfactory results, re-evaluate the plan and try alternative approaches or tools.'''
174
- )
175
- return manager_agent
176
- else:
177
- return None
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import os
 
 
 
2
  import time
3
+ import logging
4
+ import urllib.parse as urlparse
5
+ import io
6
+ import contextlib
7
+ from functools import lru_cache, wraps
8
+
9
+ # Add necessary imports for new tools
10
+ import chess
11
+ from stockfish import Stockfish
12
+
13
  from dotenv import load_dotenv
 
14
  from requests.exceptions import RequestException
15
+ import serpapi
16
  from llama_index.core import VectorStoreIndex, download_loader
17
  from llama_index.core.schema import Document
18
+ from youtube_transcript_api import YouTubeTranscriptApi, YouTubeTranscriptApiError
19
+ from smolagents import CodeAgent, ToolCallingAgent, WebSearchTool, tool
20
+ from smolagents import InferenceClientModel
21
 
22
+ # --- Configuration and Setup ---
 
 
 
23
 
24
def configure_logging():
    """Initialise root-logger formatting for the whole process."""
    log_format = "%(asctime)s [%(levelname)s] %(name)s: %(message)s"
    date_format = "%Y-%m-%d %H:%M:%S"
    logging.basicConfig(level=logging.INFO, format=log_format, datefmt=date_format)
31
+
32
def load_api_keys():
    """Load required API keys from the environment (.env files supported).

    Returns:
        dict: {'together': ..., 'serpapi': ...} with the key values.

    Raises:
        ValueError: naming exactly which key(s) are missing, so the user can
            fix the .env file without guessing.
    """
    load_dotenv()
    keys = {
        'together': os.getenv('TOGETHER_API_KEY'),
        'serpapi': os.getenv('SERPAPI_API_KEY'),
    }
    # Report every missing key by name instead of a generic message.
    missing = [name for name, value in keys.items() if not value]
    if missing:
        raise ValueError(
            f"Missing API key(s): {', '.join(missing)}. Please check your .env file."
        )
    return keys
42
 
43
+ # --- Decorators ---
44
+
45
def _retryable_exceptions():
    """Resolve the exception classes worth retrying, tolerating absent deps.

    The previous code referenced SerpApiClientException as a bare global that
    was only imported inside main(); when initialize_agent() is used from
    app.py that name is undefined and the retry wrapper itself raises
    NameError on the first caught exception. Resolving the classes here, with
    a graceful fallback, fixes that and keeps the decorator usable on its own.
    NOTE(review): `YouTubeTranscriptApiError` may not exist in some versions
    of youtube_transcript_api -- the AttributeError guard covers that too.
    """
    classes = []
    for module_name, attr in (
        ("requests.exceptions", "RequestException"),
        ("serpapi.client", "SerpApiClientException"),
        ("youtube_transcript_api", "YouTubeTranscriptApiError"),
    ):
        try:
            module = __import__(module_name, fromlist=[attr])
            classes.append(getattr(module, attr))
        except (ImportError, AttributeError):
            # Optional dependency (or exception name) unavailable -- skip it.
            pass
    # Always retry plain stdlib network-ish errors as a safety net.
    classes.extend([ConnectionError, TimeoutError])
    return tuple(classes)


def retry(max_retries=3, initial_delay=1, backoff=2):
    """A robust retry decorator with exponential backoff.

    Args:
        max_retries: total number of attempts before giving up.
        initial_delay: seconds to wait after the first failed attempt.
        backoff: multiplier applied to the delay after each failure.

    Retryable (network/API) exceptions are retried and re-raised only after
    the final attempt; everything else is logged and re-raised immediately.
    """
    retryable = _retryable_exceptions()

    def decorator(func):
        @wraps(func)
        def wrapper(*args, **kwargs):
            delay = initial_delay
            for attempt in range(1, max_retries + 1):
                try:
                    return func(*args, **kwargs)
                except retryable as e:
                    if attempt == max_retries:
                        logging.error(f"{func.__name__} failed after {attempt} attempts: {e}")
                        raise
                    logging.warning(
                        f"Attempt {attempt} for {func.__name__} failed: {e}. "
                        f"Retrying in {delay} seconds..."
                    )
                    time.sleep(delay)
                    delay *= backoff
                except Exception as e:
                    logging.error(f"{func.__name__} failed with a non-retryable error: {e}")
                    raise
        return wrapper
    return decorator
68
+
69
+ # --- Main Agent Initialization (as called by app.py) ---
70
+
71
def initialize_agent():
    """Build and return the manager `CodeAgent` used by app.py.

    Wires together:
      * lru-cached LlamaIndex indices for webpages and YouTube transcripts,
      * tools for web search, webpage/video Q&A, code execution and chess,
      * a ToolCallingAgent worker plus a CodeAgent manager that delegates.

    Raises:
        ValueError: if required API keys are missing (via load_api_keys).
        Exception: re-raised if the inference model cannot be loaded.
    """
    api_keys = load_api_keys()

    # --- Caching Layer for LlamaIndex ---
    # lru_cache keys on the URL / video id, so repeated questions about the
    # same source skip re-downloading and re-indexing.
    @lru_cache(maxsize=32)
    @retry()
    def get_webpage_index(url: str) -> VectorStoreIndex:
        """Download a webpage and build (or reuse) a vector index over it."""
        logging.info(f"Indexing webpage: {url}")
        loader_cls = download_loader("BeautifulSoupWebReader")
        loader = loader_cls()
        docs = loader.load_data(urls=[url])
        return VectorStoreIndex.from_documents(docs)

    @lru_cache(maxsize=32)
    @retry()
    def get_youtube_index(video_id: str) -> VectorStoreIndex:
        """Fetch a transcript and build (or reuse) a vector index over it."""
        logging.info(f"Indexing YouTube video: {video_id}")
        transcript = YouTubeTranscriptApi.get_transcript(video_id)
        text = ' '.join([t['text'] for t in transcript])
        doc = Document(text=text, doc_id=f"youtube_{video_id}")
        return VectorStoreIndex.from_documents([doc])

    # --- Specialized Tool Definitions ---

    # 1. Web Search Tools
    @tool
    @retry()
    def google_search(query: str) -> str:
        """Use for general knowledge questions, finding facts, or when you don't have a specific URL."""
        client = serpapi.Client(api_key=api_keys['serpapi'])
        results = client.search(q=query, engine="google")
        if organic_results := results.get('organic_results'):
            md = ["### Top Search Results"]
            for res in organic_results[:5]:
                md.append(f"- **{res.get('title', 'N/A')}**: {res.get('snippet', 'No snippet available.')}\n [Source]({res.get('link', '#')})")
            return "\n\n".join(md)
        return "No results found."

    @tool
    def query_webpage(url: str, query: str) -> str:
        """Use when you need to answer a specific question about the content of a single webpage URL."""
        try:
            index = get_webpage_index(url)
            return str(index.as_query_engine().query(query))
        except Exception as e:
            return f"Error querying webpage {url}: {e}"

    # 2. YouTube Tool
    @tool
    def query_youtube_video(video_url_or_id: str, query: str) -> str:
        """Use for questions about the content of a YouTube video. Accepts a full URL or a video ID."""
        try:
            video_id = video_url_or_id
            if "youtube.com" in video_url_or_id or "youtu.be" in video_url_or_id:
                parsed_url = urlparse.urlparse(video_url_or_id)
                # Standard links carry the id in ?v=...; youtu.be short links
                # carry it in the path instead.
                video_id = urlparse.parse_qs(parsed_url.query).get('v', [None])[0]
                if not video_id:
                    video_id = parsed_url.path.lstrip('/')
            if not video_id:
                return "Error: Could not extract a valid YouTube video ID."
            index = get_youtube_index(video_id)
            return str(index.as_query_engine().query(query))
        except YouTubeTranscriptApiError as e:
            return f"Error fetching transcript for video {video_id}: {e}"
        except Exception as e:
            return f"Error querying YouTube video {video_id}: {e}"

    # 3. Coding Tool
    @tool
    def run_python_code(code: str) -> str:
        """
        Executes a string of Python code and returns its standard output.
        Use this for coding challenges, calculations, or data manipulation.
        WARNING: the code runs with full interpreter privileges in this
        process; it is NOT sandboxed.
        """
        # SECURITY: exec() on LLM-generated text is arbitrary code execution.
        # An empty globals dict does not restrict builtins or file access;
        # harden with a real sandbox (subprocess + resource limits) before
        # exposing this publicly.
        output = io.StringIO()
        try:
            with contextlib.redirect_stdout(output):
                exec(code, {})
            return output.getvalue()
        except Exception as e:
            return f"Error executing code: {e}"

    # 4. Chess Tool
    @tool
    def get_chess_move(fen: str) -> str:
        """
        Finds the best chess move for a given board position in FEN format.
        Use this exclusively for chess-related questions.
        """
        # Path to stockfish can be set via env var for flexibility in HF Spaces
        stockfish_path = os.getenv("STOCKFISH_PATH", "/usr/games/stockfish")
        if not os.path.exists(stockfish_path):
            return f"Error: Stockfish engine not found at {stockfish_path}. Please set STOCKFISH_PATH environment variable."
        try:
            stockfish = Stockfish(path=stockfish_path)
            stockfish.set_fen_position(fen)
            best_move = stockfish.get_best_move()
            return best_move
        except Exception as e:
            return f"Error analyzing chess position: {e}"

    # --- Model and Agent Initialization ---

    try:
        model = InferenceClientModel(
            model_id="mistralai/Mixtral-8x7B-Instruct-v0.1",
            token=api_keys['together'],
            provider="together"
        )
        logging.info("Model loaded successfully.")
    except Exception as e:
        logging.error(f"Failed to load model: {e}")
        raise

    # A single, powerful worker agent with a diverse toolset.
    # WebSearchTool() is included because the manager's instructions tell the
    # model to prefer it for a first search pass.
    worker_agent = ToolCallingAgent(
        tools=[
            WebSearchTool(),
            google_search,
            query_webpage,
            query_youtube_video,
            run_python_code,
            get_chess_move,
        ],
        model=model,
        max_steps=5,  # Sub-tasks should be short and focused
        name="multi_tool_worker",
        description="A specialized worker agent that can search the web, query videos, execute code, and play chess."
    )

    # The manager agent acts as a strategic dispatcher; it holds no tools of
    # its own and delegates everything to the worker.
    manager = CodeAgent(
        tools=[],
        model=model,
        managed_agents=[worker_agent],
        instructions="""
You are a master AI assistant responsible for answering a user's question. Your goal is to provide a single, precise, and final answer.

**Your Strategic Thought Process for GAIA Tasks:**

1. **ANALYZE THE QUESTION (Deep Understanding):**
    * Carefully read and dissect the user's question. Identify all constraints, keywords, and the exact format required for the final answer (e.g., number, string, comma-separated list, specific units).
    * Determine the core task: Is it a factual lookup, data extraction, code execution, video analysis, or a chess problem?

2. **FORMULATE A DETAILED PLAN (Multi-step if needed):**
    * Based on your analysis, outline a step-by-step strategy. For complex questions (Level 2/3 GAIA), this plan might involve multiple tool calls and intermediate reasoning steps.
    * **Prioritize Tools:**
        * For general web searches or initial broad information gathering, prefer `WebSearchTool()`. It's often quicker for a first pass.
        * If `WebSearchTool()` doesn't yield precise results, or if you need structured data (e.g., AI overviews, specific facts from search results), use `google_search` (SerpApi).
        * For extracting specific information from a known webpage URL, use `query_webpage`.
        * For questions about YouTube video content, use `query_youtube_video`.
        * For computational tasks or code generation, use `run_python_code`.
        * For chess problems, use `get_chess_move`.
    * Consider potential pitfalls and how to recover (e.g., if a search yields no results, try a different query).

3. **EXECUTE AND ITERATE (Tool Delegation & Synthesis):**
    * Delegate tasks to the `multi_tool_worker` agent, providing the exact tool and parameters.
    * Carefully evaluate the output from each tool call.
    * If the output is not sufficient, refine your query or try a different tool/approach. This is where iterative refinement and self-correction are crucial.
    * Synthesize information from multiple sources if necessary to build the complete answer.

4. **FORMULATE THE FINAL ANSWER (Precision & Format):**
    * Once you have definitively found the answer, format it *exactly* as requested in the original question.
    * **DO NOT** add any extra text, explanations, or conversational filler. The final answer must be *only* the answer itself.
    * Example: If the question asks for a number and the answer is "123", your output should be `FINAL ANSWER: 123`. If it asks for a string "New York", your output should be `FINAL ANSWER: New York`. If it asks for a comma-separated list "apple,banana", your output should be `FINAL ANSWER: apple,banana`.
"""
    )
    logging.info("Multi-task agent initialized successfully.")
    return manager
243
+
244
+ # --- Main Execution Block for Local Testing ---
245
+
246
def main():
    """Smoke-test the agent locally, one prompt per tool category."""
    configure_logging()
    try:
        # The retry decorator resolves SerpApiClientException as a global;
        # guard the import with a placeholder class so a missing or renamed
        # serpapi package cannot abort the whole test run with ImportError.
        global SerpApiClientException
        try:
            from serpapi.client import SerpApiClientException
        except ImportError:
            class SerpApiClientException(Exception):
                """Placeholder so the retry decorator's except-tuple resolves."""
            logging.warning("serpapi.client.SerpApiClientException unavailable; using placeholder.")

        agent = initialize_agent()
        if agent:
            # Example prompts for each category
            prompts = {
                "Web Search": "Who is the current CEO of OpenAI?",
                "YouTube": "What is the main topic of the video https://www.youtube.com/watch?v=bZQun8Y4L2A regarding AI models?",
                "Coding": "Write a Python script that calculates and prints the factorial of 5.",
                "Chess": "What is the best move for the starting chess position? The FEN is 'rnbqkbnr/pppppppp/8/8/8/8/PPPPPPPP/RNBQKBNR w KQkq - 0 1'."
            }

            for category, prompt in prompts.items():
                logging.info(f"\n--- Testing Category: {category} ---")
                logging.info(f"Prompt: {prompt}")
                response = agent.run(prompt)
                logging.info(f"Agent's Final Answer: {response}")
                logging.info("-" * (30 + len(category)))

    except Exception as e:
        logging.critical(f"An unhandled error occurred during local testing: {e}", exc_info=True)
272
+
273
+ if __name__ == "__main__":
274
+ # This allows you to test the agent's logic by running `python agent.py` locally.
275
+ main()