final-assignment-hf-agent-course

Running

App Files Files Community

Francesco Laiti committed on 2 days ago

Commit

a745ced

1 Parent(s): 2e3fe1a

Add .gitignore, implement AskMeAnythingAgent in agent.py, and update app.py to utilize the new agent. Include instruction prompts in YAML format.

Browse files

Files changed (4) hide show

.gitignore +197 -0
agent.py +104 -0
app.py +17 -15
instruction_prompts.yaml +12 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,197 @@

+# Created by https://www.toptal.com/developers/gitignore/api/visualstudiocode,python
+# Edit at https://www.toptal.com/developers/gitignore?templates=visualstudiocode,python
+media/
+old_agent.py
+### Python ###
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+# C extensions
+*.so
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+# Translations
+*.mo
+*.pot
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+# Flask stuff:
+instance/
+.webassets-cache
+# Scrapy stuff:
+.scrapy
+# Sphinx documentation
+docs/_build/
+# PyBuilder
+.pybuilder/
+target/
+# Jupyter Notebook
+.ipynb_checkpoints
+# IPython
+profile_default/
+ipython_config.py
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+#poetry.lock
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#pdm.lock
+#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
+#   in version control.
+#   https://pdm.fming.dev/#use-with-ide
+.pdm.toml
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+# SageMath parsed files
+*.sage.py
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+# Spyder project settings
+.spyderproject
+.spyproject
+# Rope project settings
+.ropeproject
+# mkdocs documentation
+/site
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+# Pyre type checker
+.pyre/
+# pytype static type analyzer
+.pytype/
+# Cython debug symbols
+cython_debug/
+# PyCharm
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+#.idea/
+### Python Patch ###
+# Poetry local configuration file - https://python-poetry.org/docs/configuration/#local-configuration
+poetry.toml
+# ruff
+.ruff_cache/
+# LSP config files
+pyrightconfig.json
+### VisualStudioCode ###
+.vscode/*
+!.vscode/settings.json
+!.vscode/tasks.json
+!.vscode/launch.json
+!.vscode/extensions.json
+!.vscode/*.code-snippets
+# Local History for Visual Studio Code
+.history/
+# Built Visual Studio Code Extensions
+*.vsix
+### VisualStudioCode Patch ###
+# Ignore all local history of files
+.history
+.ionide
+# End of https://www.toptal.com/developers/gitignore/api/visualstudiocode,python

agent.py ADDED Viewed

	@@ -0,0 +1,104 @@

+import os
+from dotenv import load_dotenv
+import yaml
+import re
+import json
+import pandas as pd
+from pathlib import Path
+import time
+from agno.agent import Agent, RunResponse
+from agno.models.google import Gemini
+from agno.media import Image, Audio, Video, File
+from agno.tools.googlesearch import GoogleSearchTools
+from agno.tools.calculator import CalculatorTools
+URL_BASE_DOWNLOAD = "https://agents-course-unit4-scoring.hf.space/files/"
+load_dotenv()
class AskMeAnythingAgent:
    """Answer questions, optionally about an attached file, with a Gemini agent.

    The agent is an agno ``Agent`` configured from ``instruction_prompts.yaml``
    (keys ``role``, ``goal`` and ``instructions``) and equipped with Google
    search and calculator tools. Calling the instance runs the agent on a
    question and returns the text that follows the ``[[ ## ANSWER ## ]]``
    marker in the model output.
    """

    def __init__(self, model_id: str = "gemini-2.0-flash", debug: bool = False):
        """Load the prompt configuration and build the underlying agent.

        Args:
            model_id: Gemini model identifier passed to ``Gemini(id=...)``.
            debug: Forwarded to the agent as ``debug_mode``.

        Raises:
            OSError: If ``instruction_prompts.yaml`` cannot be opened.
            KeyError: If the YAML lacks ``role``, ``goal`` or ``instructions``.
        """
        with open("instruction_prompts.yaml", "r", encoding="utf-8") as file:
            self.instruction_prompts = yaml.safe_load(file)
        self.main_agent = Agent(
            name="Ask Me Anything",
            model=Gemini(id=model_id),
            # The YAML stores role/goal as one-element lists; flatten them so
            # the agent receives plain text instead of a list object.
            role=self._as_text(self.instruction_prompts["role"]),
            instructions=self.instruction_prompts["instructions"],
            goal=self._as_text(self.instruction_prompts["goal"]),
            tools=[GoogleSearchTools(), CalculatorTools()],
            debug_mode=debug,
        )

    @staticmethod
    def _as_text(value):
        """Join a list/tuple of prompt fragments into one newline-separated string."""
        if isinstance(value, (list, tuple)):
            return "\n".join(str(item) for item in value)
        return value

    def __call__(self, question: str, file_name: str = "", debug: bool = False) -> str:
        """Run the agent on ``question`` and return the parsed final answer.

        Args:
            question: The question text sent to the agent.
            file_name: Name of the attached file; empty or ``None`` when the
                question has no attachment.
            debug: Accepted for interface compatibility; not used here (debug
                mode is fixed when the agent is constructed).

        Returns:
            The extracted answer, or ``"invalid"`` when no answer marker is found.
        """
        payload = self.manage_payload(file_name, question)
        response: RunResponse = self.main_agent.run(message=question, **payload)
        return self.parse_response(response.content)

    def manage_payload(self, file_name: str, question: str) -> dict:
        """Build the media keyword arguments to pass to ``Agent.run``.

        Args:
            file_name: Attachment name (``<task id>.<extension>``), or an empty
                value (``""`` / ``None``) when there is no attachment.
            question: Question text; scanned for a YouTube watch URL when no
                file is attached.

        Returns:
            A dict with one of the keys ``images``, ``audio``, ``files`` or
            ``videos``, or an empty dict when there is nothing to attach.
        """
        # Truthiness check also covers ``None``, which callers obtain from
        # ``item.get("file_name")`` when the key is absent.
        if file_name:
            # The download endpoint is addressed by the part before the first dot.
            file_url = URL_BASE_DOWNLOAD + file_name.split(".")[0]
            lowered = file_name.lower()
            if lowered.endswith(".png"):
                return {"images": [Image(url=file_url, format="png")]}
            if lowered.endswith(".mp3"):
                return {"audio": [Audio(url=file_url, format="mp3")]}
            if lowered.endswith(".xlsx"):
                # Spreadsheets are converted to CSV and attached as a text file.
                csv_path = f"media/{file_name.split('.')[0]}.csv"
                os.makedirs("media", exist_ok=True)  # to_csv does not create it
                pd.read_excel(io=file_url).to_csv(csv_path, index=False)
                return {"files": [File(filepath=csv_path, mime_type="text/csv")]}
            return {"files": [File(url=file_url)]}

        # Only full "watch?v=" links are supported; any other YouTube link is
        # ignored rather than crashing on a failed match.
        watch_url = re.search(r'https://www\.youtube\.com/watch\?v=[\w-]+', question)
        if watch_url is None:
            return {}
        path_to_file = self.download_yt_video(watch_url.group(0))
        return {"videos": [Video(filepath=path_to_file)]}

    def download_yt_video(self, url: str) -> Path:
        """Download a YouTube video into the module's ``media`` folder.

        A file already present in that folder whose stem equals the video id
        is reused instead of downloading again.

        Args:
            url: A YouTube URL carrying the video id in its ``v`` query parameter.

        Returns:
            Path of the downloaded (or previously downloaded) video file.

        Raises:
            ValueError: If ``url`` has no ``v`` query parameter.
        """
        import yt_dlp
        from urllib.parse import parse_qs, urlparse

        video_ids = parse_qs(urlparse(url).query).get("v")
        if not video_ids:
            raise ValueError(f"No video id found in URL: {url}")
        video_id = video_ids[0]

        # Download next to this module so the returned path is valid whatever
        # the current working directory is.
        media_dir = Path(__file__).parent / "media"
        media_dir.mkdir(parents=True, exist_ok=True)

        # The container is not known in advance ('best' is not always mp4), so
        # look for any finished file named after the id. Partial downloads
        # ("<id>.<ext>.part") have a different stem and are skipped.
        for candidate in sorted(media_dir.iterdir()):
            if candidate.is_file() and candidate.stem == video_id:
                return candidate

        ydl_opts = {
            'format': 'best',
            'outtmpl': str(media_dir / '%(id)s.%(ext)s'),
            'quiet': True,
        }
        print(f"Downloading video from {url}")
        with yt_dlp.YoutubeDL(ydl_opts) as ydl:
            info = ydl.extract_info(url, download=True)
            # Ask yt-dlp for the real output name instead of assuming ".mp4".
            return Path(ydl.prepare_filename(info))

    def download_file(self, file_name: str):
        """Download an attachment into ``media/`` unless it is already there.

        Args:
            file_name: Attachment name; the local copy keeps this name.

        Returns:
            The relative path ``media/<file_name>``.

        Raises:
            requests.HTTPError: If the server answers with an error status.
        """
        import requests

        local_path = f"media/{file_name}"
        os.makedirs("media", exist_ok=True)
        # Check the cache first so no request is made for an existing file.
        if not os.path.exists(local_path):
            # Same URL convention as manage_payload: the part before the first dot.
            response = requests.get(URL_BASE_DOWNLOAD + file_name.split(".")[0], timeout=60)
            response.raise_for_status()  # never store an error page as the file
            with open(local_path, 'wb') as file:
                file.write(response.content)
        return local_path

    def parse_response(self, response: str):
        """Extract the final answer that follows the ``[[ ## ANSWER ## ]]`` marker.

        The first line containing the marker wins. The answer is the text after
        the marker on that line, or, when that is empty, the next non-empty line.

        Args:
            response: Raw model output; may be ``None`` or empty.

        Returns:
            The stripped answer text, or ``"invalid"`` when there is no output
            or no marker.
        """
        if not response:
            return "invalid"
        # Tolerate any spacing inside the marker, e.g. "[[## ANSWER ##]]".
        field_header_pattern = re.compile(r"\[\[\s*##\s*ANSWER\s*##\s*\]\]")
        lines = str(response).splitlines()
        for index, line in enumerate(lines):
            # Search and slice the same string so the offset stays valid even
            # when the line is indented.
            match = field_header_pattern.search(line)
            if match is None:
                continue
            answer = line[match.end():].strip()
            if answer:
                return answer
            # Marker alone on its line: the answer is on a following line.
            for following in lines[index + 1:]:
                if following.strip():
                    return following.strip()
            return answer
        return "invalid"
if __name__ == "__main__":
    # Manual smoke run: answer every question listed in questions.json.
    with open("questions.json", "r", encoding="utf-8") as file:
        questions = json.load(file)

    # Build the agent once; re-creating it per question reloads the YAML and
    # reconstructs the model for no benefit (app.py also reuses one agent).
    agent = AskMeAnythingAgent(debug=False)
    total = len(questions)
    for i, question in enumerate(questions, start=1):
        # Entries without an attachment may lack the key or carry None.
        file_name = question.get("file_name") or ""
        print(f"{i}. QUESTION: ", question["question"], "\nFILE: ", file_name)
        print(f"{i}. ANSWER: ", agent(question["question"], file_name), "\n\n")
        # Pause after every fifth question, but not after the final one.
        if i % 5 == 0 and i < total:
            print("Sleeping for 30 seconds to avoid RPM limit from API")
            time.sleep(30)

app.py CHANGED Viewed

@@ -3,21 +3,16 @@ import gradio as gr
 import requests
 import inspect
 import pandas as pd
-# (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-# --- Basic Agent Definition ---
-# ----- THIS IS WERE YOU CAN BUILD WHAT YOU WANT ------
-class BasicAgent:
-    def __init__(self):
-        print("BasicAgent initialized.")
-    def __call__(self, question: str) -> str:
-        print(f"Agent received question (first 50 chars): {question[:50]}...")
-        fixed_answer = "This is a default answer."
-        print(f"Agent returning fixed answer: {fixed_answer}")
-        return fixed_answer
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
@@ -40,7 +35,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     # 1. Instantiate Agent ( modify this part to create your agent)
     try:
-        agent = BasicAgent()
     except Exception as e:
         print(f"Error instantiating agent: {e}")
         return f"Error initializing agent: {e}", None
@@ -76,17 +71,24 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     for item in questions_data:
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or question_text is None:
             print(f"Skipping item with missing task_id or question: {item}")
             continue
         try:
-            submitted_answer = agent(question_text)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
              print(f"Error running agent on task {task_id}: {e}")
              results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
     if not answers_payload:
         print("Agent did not produce any answers to submit.")
         return "Agent did not produce any answers to submit.", pd.DataFrame(results_log)

 import requests
 import inspect
 import pandas as pd
+from agent import AskMeAnythingAgent
+import time
+from tqdm import tqdm
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+RPM_MODEL_LIMIT = 10
+MARGIN_TIME = 15
+MODEL_ID = "gemini-2.5-flash-preview-04-17" # "gemini-2.5-pro-exp-03-25"
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
     # 1. Instantiate Agent ( modify this part to create your agent)
     try:
+        agent = AskMeAnythingAgent(model_id=MODEL_ID, debug=True)
     except Exception as e:
         print(f"Error instantiating agent: {e}")
         return f"Error initializing agent: {e}", None
     for item in questions_data:
         task_id = item.get("task_id")
         question_text = item.get("question")
+        file_name = item.get("file_name")
         if not task_id or question_text is None:
             print(f"Skipping item with missing task_id or question: {item}")
             continue
+        start_time = time.time()
         try:
+            submitted_answer = agent(question_text, file_name)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
              print(f"Error running agent on task {task_id}: {e}")
              results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
+        end_time = time.time()
+        time_taken = end_time - start_time
+        if time_taken < (60 / RPM_MODEL_LIMIT):
+            print(f"Waiting for {60 / RPM_MODEL_LIMIT - time_taken + MARGIN_TIME} seconds to avoid exceeding the free tier rate limit")
+            for _ in tqdm(range(int(60 / RPM_MODEL_LIMIT - time_taken + MARGIN_TIME)), desc="Waiting..."):
+                time.sleep(1)
     if not answers_payload:
         print("Agent did not produce any answers to submit.")
         return "Agent did not produce any answers to submit.", pd.DataFrame(results_log)

instruction_prompts.yaml ADDED Viewed

	@@ -0,0 +1,12 @@

+role:
+ - "You will be given a question, and optionally an attached file (image, audio, video, spreadsheet, or code)"
+goal:
+ - "Produce a correct, concise answer based on the question and file."
+instructions:
+  - "Start your response with a brief explanation of your reasoning unless the question explicitly instructs you to provide only the answer."
+  - "End your response using the following template: [[ ## ANSWER ## ]] {final answer}"
+  - "For number, do not include commas (e.g., write 1042 not 1,042), do not include units (e.g., $, %, etc.) unless explicitly required, do not use scientific notation unless specified."
+  - "For string, do not use articles (e.g., a, an, the), do not use abbreviations (e.g., use 'San Francisco' instead of 'SF'), write digits as plain text (e.g., 'three' instead of '3') unless numeric form is clearly expected (e.g., years, IDs)."
+  - "For list, return items as a comma-separated list, apply the number and string formatting rules to each element, alphabetize the list if the question asks for it, follow any specific structural requirements in the question (e.g., 'last names only')."
+  - "If a file is provided, incorporate relevant content from the file in your answer."
+  - "If the question requires a specific format (e.g., algebraic notation, page numbers), use it exactly as expected."