File size: 8,490 Bytes
9b5b26a
 
 
 
c19d193
9aab3c6
bd61bf6
91298ce
9aab3c6
 
fe2c880
212a11a
aa95680
3fdf8f1
bd61bf6
9aab3c6
6aae614
8fe992b
9b5b26a
 
bd61bf6
 
0f2505a
d6e96a8
8c95909
0f2505a
 
667a8cc
9aab3c6
5df72d6
9b5b26a
3d1237b
9b5b26a
 
 
 
 
 
 
 
f97f98a
aa95680
784bf9c
5375f47
aa95680
 
 
 
cd2ac71
5375f47
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cd2ac71
 
5375f47
cd2ac71
5375f47
cd2ac71
5375f47
 
cd2ac71
5375f47
 
cd2ac71
5375f47
 
 
 
 
 
cd2ac71
5375f47
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
abe7d90
aa95680
5375f47
9aab3c6
 
72153e1
9aab3c6
615ec88
5375f47
 
 
2d91d02
5375f47
 
 
2d91d02
5375f47
 
2d91d02
5375f47
 
2d91d02
5375f47
 
2d91d02
5375f47
 
2d91d02
5375f47
 
2d91d02
cd2ac71
41ed7f9
7348fc4
 
bd61bf6
f0b59ad
 
bd61bf6
7348fc4
f0b59ad
 
9aab3c6
b2876d5
9aab3c6
bd61bf6
5422b86
bd61bf6
 
7348fc4
bd61bf6
9aab3c6
62bdbcb
a3e866a
de3d7c6
 
 
5422b86
369a3f5
1cc5977
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f97f98a
9b5b26a
 
 
 
 
 
 
 
 
 
 
 
 
 
8c01ffb
 
6aae614
ae7a494
 
 
 
e121372
bf6d34c
 
29ec968
fe328e0
13d500a
8c01ffb
 
9b5b26a
 
8c01ffb
861422e
 
9b5b26a
8c01ffb
8fe992b
9aab3c6
8c01ffb
 
 
 
 
 
861422e
8fe992b
 
9b5b26a
8c01ffb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
from smolagents import CodeAgent,DuckDuckGoSearchTool, HfApiModel,load_tool,tool
import datetime
import requests
import pytz
import yaml
import asyncio
import nest_asyncio
#import matplotlib
from playwright.async_api import async_playwright
from PIL import Image
import numpy as np
import subprocess
import json
from rapidfuzz import process
import gradio as gr

from tools.final_answer import FinalAnswerTool

from Gradio_UI import GradioUI

nest_asyncio.apply()  # Ensure async works in a Jupyter/Colab/HF Spaces environment

# Commands executed at import time, in order: refresh the apt index, install
# the shared libraries listed below, then download Playwright's Chromium build.
_SETUP_COMMANDS = (
    ["apt-get", "update"],
    ["apt-get", "install", "-y", "libnss3", "libatk1.0-0", "libatk-bridge2.0-0", "libxcomposite1",
     "libxdamage1", "libcups2"],
    ["playwright", "install", "chromium"],
)

for _command in _SETUP_COMMANDS:
    try:
        _completed = subprocess.run(_command)
    except OSError as exc:
        # Raised when the executable is missing or cannot be started. Setup
        # stays best-effort, so report it and keep going instead of aborting
        # the import.
        print(f"Setup command {' '.join(_command)!r} could not be started: {exc}")
        continue
    if _completed.returncode != 0:
        # Previously a failing command went unnoticed; surface it in the logs.
        print(f"Setup command {' '.join(_command)!r} exited with status {_completed.returncode}")

# Below is an example of a tool that does nothing. Amaze us with your creativity !
# It is important to specify the return type in the signature.
# Keep this format for the description / args / args description, but feel
# free to modify the tool. The docstring text is left exactly as written.
@tool
def my_custom_tool(arg1: str, arg2: int) -> str:
    """A tool that does nothing yet 
    Args:
        arg1: the first argument
        arg2: the second argument
    """
    # Placeholder result: neither argument is used.
    placeholder_reply = "What magic will you build ?"
    return placeholder_reply


def load_image_sources():
    """Load and return the parsed contents of ``expanded.json``.

    The path is relative, so the file is looked up in the current working
    directory. (An earlier version read ``image_sources.json`` instead.)

    Returns:
        Whatever ``json.load`` produces for the file; the rest of this module
        treats it as a dict keyed by image name.

    Raises:
        FileNotFoundError: if ``expanded.json`` does not exist.
        json.JSONDecodeError: if the file is not valid JSON.
    """
    # Decode explicitly as UTF-8 rather than relying on the platform's locale
    # default, which can mis-decode non-ASCII names on some systems.
    with open("expanded.json", "r", encoding="utf-8") as file:
        return json.load(file)

# Module-level copy of the image catalogue, read once at import time.
# NOTE(review): capture_screenshot() re-reads the file itself on every call,
# so this copy appears to be unused within this file - confirm before removing.
image_sources = load_image_sources()


def get_image_url(image_type: str, image_sources: dict):
    """Return the entry whose key best fuzzy-matches ``image_type``.

    Args:
        image_type: Free-text name of the requested image or sketch.
        image_sources: Mapping from known image names to their entry. The
            caller in this file reads ``url``, ``width`` and ``height`` from
            the returned entry.

    Returns:
        ``image_sources[best_key]`` when rapidfuzz finds a key scoring at
        least 60, otherwise a default entry pointing at a fallback sketch
        (800x800).
    """
    choices = list(image_sources.keys())  # Get all available keys

    # extractOne returns None (not a tuple) when no choice reaches
    # score_cutoff or when there are no choices at all. Unpacking the result
    # directly therefore raised TypeError and the fallback was never used.
    match = process.extractOne(image_type, choices, score_cutoff=60)

    if match is None:
        # Default return if no good match is found
        return {
            "url": "https://editor.p5js.org/kfahn/full/2XD5Y8MiV",
            "width": 800,
            "height": 800
        }

    best_match = match[0]  # match is (choice, score, index)
    print(f"Best match found: {best_match}")
    return image_sources[best_match]  # Returns {'url', 'width', 'height', etc.}

# def get_image_url(image_type: str):
#     """Finds the best match for the given image type using fuzzy matching."""
#     choices = list(image_sources.keys())  # Get all available keys
#     best_match, score, *rest = process.extractOne(image_type, choices)  
    
#     if score > 90:  # Set a threshold to ensure a reasonable match
#         print(best_match)
#         return image_sources[best_match]
#     else:
#        #return None  # No good match found
#         return "https://editor.p5js.org/kfahn/full/2XD5Y8MiV"

# async def capture_screenshot(image_type: str):
#     """Launches Playwright and uses user input,  if any, to captures a screenshot of an image from p5.js."""
#     print("Launching Playwright...")
#     async with async_playwright() as p:
#         browser = await p.chromium.launch(headless=True)
#         page = await browser.new_page()

#         #url = "https://openprocessing.org/sketch/2539973"
#         url = "https://editor.p5js.org/kfahn/full/2XD5Y8MiV"
       
#         if image_type: 
#             image_url = get_image_url(image_type)
#         else:
#             image_url = url
        
#         print(f"Opening image from p5 sketch: {image_url}")
#         await page.goto(image_url, timeout=120000)  # Wait for the image page to load

#         print("Waiting for image element...")
#        # await page.wait_for_selector("img", timeout=120000)  # Wait for the <img> to be visible
#         await page.wait_for_timeout(5000)  # Allow sketch to fully render
#         print("Capturing screenshot...")
#         await page.set_viewport_size({"width": 800, "height": 800})
#         await page.locator("iframe").screenshot(path="img.png")
#         await browser.close()
#         print("Screenshot saved!")

async def capture_screenshot(image_type: str):
    """Capture a screenshot of a p5.js sketch and save it as ``img.png``.

    The sketch is chosen by fuzzy-matching ``image_type`` against the entries
    returned by ``load_image_sources()``. The page is opened in headless
    Chromium, given a fixed 5 second pause to render, resized to the entry's
    width/height, and the page's ``iframe`` element is written to ``img.png``
    (relative path, so the current working directory).

    Args:
        image_type: Free-text name of the sketch to capture.

    Returns:
        None. The result is the ``img.png`` file on disk.
    """
    print("Launching Playwright...")
    async with async_playwright() as p:
        browser = await p.chromium.launch(headless=True)
        try:
            page = await browser.new_page()

            # Load image sources from JSON (re-read on every call)
            image_sources = load_image_sources()
            image_data = get_image_url(image_type, image_sources)

            image_url = image_data["url"]
            width = image_data["width"]
            height = image_data["height"]

            print(f"Opening image: {image_url}")
            await page.goto(image_url, timeout=120000)  # Load page (timeout in ms)

            print("Waiting for render...")
            await page.wait_for_timeout(5000)

            print(f"Setting viewport to {width}x{height}...")
            await page.set_viewport_size({"width": width, "height": height})

            print("Capturing screenshot...")
            await page.locator("iframe").screenshot(path="img.png")
        finally:
            # Close the browser even when navigation or the screenshot fails,
            # so a failed capture does not leave it running.
            await browser.close()

        print("Screenshot saved!")


     
# NOTE: the docstring below is kept exactly as written because the @tool
# decorator consumes it (see the "keep this format" note on my_custom_tool).
@tool
def grab_image(image_type: str) -> Image:
    """
    Fetches an user specified image or generative object from a p5.js sketch.
    This tool can be used to show a user what the generative art looks like.
    This function sends uses Playwright to launch a headless server and grab a screenshot of a p5.js sketch.
    Args:
        image_type: The art type or generative object. 
        
    Returns:
        image: The screen shot of the p5.js sketch as an image.
    """
    print("Running async Playwright screenshot...")

    loop = asyncio.new_event_loop()  # Create a new event loop (Fixes issues on HF Spaces)
    asyncio.set_event_loop(loop)
    try:
        loop.run_until_complete(capture_screenshot(image_type))
    finally:
        # A fresh loop is created on every call, so release it here instead of
        # leaving it open. Clearing the current loop first mirrors what
        # asyncio.run() does and avoids leaving a closed loop installed.
        asyncio.set_event_loop(None)
        loop.close()

    print("Loading image for Gradio...")

    # Image.open is lazy and keeps img.png open. Read the pixels now and close
    # the file, so the returned image does not depend on a file that the next
    # call overwrites.
    with Image.open("img.png") as img:
        img.load()

    return img

# NOTE: the docstring below is kept exactly as written because the @tool
# decorator consumes it (see the "keep this format" note on my_custom_tool).
@tool
def get_joke() -> str:
    """
    Fetches a random joke from the JokeAPI.
    This function sends a GET request to the JokeAPI to retrieve a random joke.
    It handles both single jokes and two-part jokes (setup and delivery).
    If the request fails or the response does not contain a joke, an error message is returned.
    Returns:
        str: The joke as a string, or an error message if the joke could not be fetched.
    """
    url = "https://v2.jokeapi.dev/joke/Any?type=single"

    try:
        # Without a timeout requests waits indefinitely on a stalled server,
        # which would hang the agent step. A timeout raises
        # requests.exceptions.Timeout, handled below.
        response = requests.get(url, timeout=10)
        response.raise_for_status()

        data = response.json()

        if "joke" in data:
            return data["joke"]
        elif "setup" in data and "delivery" in data:
            return f"{data['setup']} - {data['delivery']}"
        else:
            return "Error: Unable to fetch joke."

    except (requests.exceptions.RequestException, ValueError) as e:
        # ValueError covers a non-JSON body on requests versions whose
        # .json() error is not a RequestException subclass.
        return f"Error fetching joke: {str(e)}"

#https://github.com/huggingface/smolagents/blob/main/examples/multiple_tools.py
# NOTE: the docstring below is kept exactly as written because the @tool
# decorator consumes it (see the "keep this format" note on my_custom_tool).
@tool
def get_current_time_in_timezone(timezone: str) -> str:
    """A tool that fetches the current local time in a specified timezone.
    Args:
        timezone: A string representing a valid timezone (e.g., 'America/New_York').
    """
    try:
        # Resolve the zone name, take "now" in that zone, then format it.
        zone = pytz.timezone(timezone)
        now_in_zone = datetime.datetime.now(zone)
        formatted = now_in_zone.strftime("%Y-%m-%d %H:%M:%S")
    except Exception as e:
        # Any failure (e.g. an unknown zone name) is reported as text rather
        # than raised.
        return f"Error fetching time for timezone '{timezone}': {str(e)}"
    else:
        return f"The current local time in {timezone} is: {formatted}"


# Registered in the agent's tool list further down.
final_answer = FinalAnswerTool()

# If the agent does not answer, the model is probably overloaded. In that case
# use another model, or the following Hugging Face Endpoint, which also serves
# qwen2.5 coder:
# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'

model = HfApiModel(
    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',  # it is possible that this model may be overloaded
    max_tokens=2096,
    temperature=0.5,
    custom_role_conversions=None,
)


# Import tool from Hub. It is loaded at import time but is not included in the
# agent's tool list below.
image_generation_tool = load_tool(
    "agents-course/text-to-image",
    trust_remote_code=True,
)

# Prompt templates passed to the agent, read from prompts.yaml.
with open("prompts.yaml", 'r') as stream:
    prompt_templates = yaml.safe_load(stream)

agent = CodeAgent(
    model=model,
    # Add your tools here (don't remove final_answer).
    tools=[
        final_answer,
        get_joke,
        grab_image,
    ],
    prompt_templates=prompt_templates,
    max_steps=6,
    verbosity_level=1,
    grammar=None,
    planning_interval=None,
    name=None,
    description=None,
)


# Start the Gradio front end for the agent.
GradioUI(agent).launch()