kfahn's picture
Update app.py
7348fc4 verified
raw
history blame
5.8 kB
from smolagents import CodeAgent,DuckDuckGoSearchTool, HfApiModel,load_tool,tool
import datetime
import requests
import pytz
import yaml
import asyncio
import nest_asyncio
from playwright.async_api import async_playwright
from PIL import Image
import subprocess
import json
import gradio as gr
from tools.final_answer import FinalAnswerTool
from Gradio_UI import GradioUI
# Ensure async works in a Jupyter/Colab/HF Spaces environment by allowing
# nested use of the event loop.
nest_asyncio.apply()

# Start-up provisioning, run in order at import time: refresh the apt index,
# install system libraries (presumably the ones headless Chromium needs), then
# download the Chromium build used by Playwright. Exit codes are not checked,
# so a failing step does not stop the app from starting.
for _setup_command in (
    ["apt-get", "update"],
    [
        "apt-get", "install", "-y",
        "libnss3", "libatk1.0-0", "libatk-bridge2.0-0", "libxcomposite1",
        "libxdamage1", "libcups2",
    ],
    ["playwright", "install", "chromium"],
):
    subprocess.run(_setup_command)
# Below is an example of a tool that does nothing. Amaze us with your creativity!
@tool
def my_custom_tool(arg1: str, arg2: int) -> str:  # it's important to specify the return type
    # Keep this docstring layout (description / Args / one line per argument);
    # the body itself is free to change.
    """A tool that does nothing yet
    Args:
        arg1: the first argument
        arg2: the second argument
    """
    # Neither argument is used yet: the template always answers with the same text.
    placeholder_reply = "What magic will you build ?"
    return placeholder_reply
def load_image_sources():
    """Load the image-source table from ``image_sources.json``.

    The file is read from the current working directory and decoded
    explicitly as UTF-8, so the result does not depend on the platform's
    default locale encoding.

    Returns:
        The parsed JSON document.

    Raises:
        FileNotFoundError: If ``image_sources.json`` does not exist.
        json.JSONDecodeError: If the file is not valid JSON.
    """
    with open("image_sources.json", "r", encoding="utf-8") as file:
        return json.load(file)
# Loaded once at import time; get_image_url() looks image types up in this object.
image_sources = load_image_sources()
def get_image_url(image_type: str):
    """Look up the entry registered for ``image_type`` in ``image_sources``.

    Args:
        image_type: Key to look up.

    Returns:
        The value stored under ``image_type``, or ``None`` when there is no
        such key.
    """
    # ``.get`` already yields None for a missing key.
    return image_sources.get(image_type)
async def capture_screenshot(image_type: str):
    """Open a p5.js sketch in headless Chromium and save a screenshot to ``img.png``.

    Args:
        image_type: Key used to look up the sketch URL via ``get_image_url``.
            When it is empty, or no URL is registered for it, the default
            sketch is opened instead.

    Raises:
        playwright errors: If the browser cannot be launched or the page
            cannot be loaded within the 120 s navigation timeout.
    """
    default_url = "https://editor.p5js.org/kfahn/full/2XD5Y8MiV"

    # Resolve the target before touching the browser. An empty or unknown type
    # falls back to the default sketch rather than passing None to page.goto().
    image_url = (get_image_url(image_type) if image_type else None) or default_url

    print("Launching Playwright...")
    async with async_playwright() as p:
        browser = await p.chromium.launch(headless=True)
        try:
            page = await browser.new_page()
            print(f"Opening image from p5 sketch: {image_url}")
            await page.goto(image_url, timeout=120000)  # Wait for the image page to load
            print("Waiting for image element...")
            # A fixed delay is used instead of waiting for a selector.
            await page.wait_for_timeout(5000)  # Allow sketch to fully render
            print("Capturing screenshot...")
            await page.screenshot(path="img.png")
        finally:
            # Always release the browser, even if navigation or capture failed.
            await browser.close()
    print("Screenshot saved!")
@tool
def grab_image(image_type: str) -> Image:
    """
    Fetches an op art image from a p5.js sketch.
    This function uses Playwright to launch a headless browser and grab a screenshot of a p5.js sketch.
    Args:
        image_type: A generative art type
    Returns:
        image: The screenshot of the p5.js sketch as an image.
    """
    print("Running async Playwright screenshot...")
    # Create a new event loop for this call (fixes issues on HF Spaces) and
    # close it afterwards so its selector and sockets are not leaked per call.
    loop = asyncio.new_event_loop()
    try:
        asyncio.set_event_loop(loop)
        loop.run_until_complete(capture_screenshot(image_type))
    finally:
        # Do not leave a closed loop registered as this thread's current loop.
        asyncio.set_event_loop(None)
        loop.close()
    print("Loading image for Gradio...")
    img = Image.open("img.png")
    # Image.open is lazy: read the pixel data now so the returned image no
    # longer depends on img.png, which the next call overwrites.
    img.load()
    return img
@tool
def get_joke() -> str:
    """
    Fetches a random joke from the JokeAPI.
    This function sends a GET request to the JokeAPI to retrieve a random joke.
    It handles both single jokes and two-part jokes (setup and delivery).
    If the request fails, times out, or the response does not contain a joke, an error message is returned.
    Returns:
        str: The joke as a string, or an error message if the joke could not be fetched.
    """
    url = "https://v2.jokeapi.dev/joke/Any?type=single"
    try:
        # Without a timeout a stalled connection would block the agent forever.
        response = requests.get(url, timeout=10)
        response.raise_for_status()
        data = response.json()
    except (requests.exceptions.RequestException, ValueError) as e:
        # ValueError covers a malformed JSON body on Requests versions whose
        # decode error is not a RequestException subclass.
        return f"Error fetching joke: {e}"

    if "joke" in data:
        return data["joke"]
    if "setup" in data and "delivery" in data:
        return f"{data['setup']} - {data['delivery']}"
    return "Error: Unable to fetch joke."
#https://github.com/huggingface/smolagents/blob/main/examples/multiple_tools.py
@tool
def get_current_time_in_timezone(timezone: str) -> str:
    """A tool that fetches the current local time in a specified timezone.
    Args:
        timezone: A string representing a valid timezone (e.g., 'America/New_York').
    """
    try:
        # Resolve the zone name, then read the clock directly in that zone.
        zone = pytz.timezone(timezone)
        now_in_zone = datetime.datetime.now(zone)
        formatted = now_in_zone.strftime("%Y-%m-%d %H:%M:%S")
    except Exception as e:
        # Any failure (for example an unknown zone name) is reported as text
        # instead of being raised to the caller.
        return f"Error fetching time for timezone '{timezone}': {e}"
    return f"The current local time in {timezone} is: {formatted}"
# Tool instance registered with the agent below (don't remove it from the tool list).
final_answer = FinalAnswerTool()

# If the agent does not answer, the model is overloaded, please use another model or the following Hugging Face Endpoint that also contains qwen2.5 coder:
# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
model = HfApiModel(
    max_tokens=2096,
    temperature=0.5,
    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',  # it is possible that this model may be overloaded
    custom_role_conversions=None,
)

# Import tool from Hub
# NOTE: this tool is loaded but is not included in the agent's tool list below.
image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)

# Read the prompt templates explicitly as UTF-8 so parsing does not depend on
# the platform's default locale encoding.
with open("prompts.yaml", "r", encoding="utf-8") as stream:
    prompt_templates = yaml.safe_load(stream)

agent = CodeAgent(
    model=model,
    tools=[final_answer, get_joke, grab_image],  # add your tools here (don't remove final answer)
    max_steps=6,
    verbosity_level=1,
    grammar=None,
    planning_interval=None,
    name=None,
    description=None,
    prompt_templates=prompt_templates,
)

# Start the Gradio web UI for the agent.
GradioUI(agent).launch()