File size: 6,873 Bytes
9b5b26a
 
 
 
c19d193
9aab3c6
bd61bf6
9aab3c6
 
212a11a
bd61bf6
9aab3c6
6aae614
8fe992b
9b5b26a
 
bd61bf6
 
0f2505a
d6e96a8
 
0f2505a
 
667a8cc
9aab3c6
136b2bd
 
 
 
 
 
 
 
 
 
5df72d6
9b5b26a
3d1237b
9b5b26a
 
 
 
 
 
 
 
5422b86
 
 
 
 
 
 
 
 
9aab3c6
72153e1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9aab3c6
41ed7f9
9aab3c6
 
72153e1
9aab3c6
615ec88
41ed7f9
ee1f53a
 
d0feb1f
2f991ca
72153e1
41ed7f9
 
5422b86
41ed7f9
d40b66d
 
9aab3c6
 
 
 
41ed7f9
9aab3c6
cf1e144
bd61bf6
 
 
9aab3c6
b2876d5
9aab3c6
bd61bf6
5422b86
bd61bf6
 
 
 
9aab3c6
 
 
5422b86
bd61bf6
21aafa2
369a3f5
1cc5977
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9b5b26a
 
 
 
 
 
 
 
 
 
 
 
 
 
8c01ffb
 
6aae614
ae7a494
 
 
 
e121372
bf6d34c
 
29ec968
fe328e0
13d500a
8c01ffb
 
9b5b26a
 
8c01ffb
861422e
 
9b5b26a
8c01ffb
8fe992b
9aab3c6
8c01ffb
 
 
 
 
 
861422e
8fe992b
 
9b5b26a
8c01ffb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
from smolagents import CodeAgent,DuckDuckGoSearchTool, HfApiModel,load_tool,tool
import datetime
import requests
import pytz
import yaml
import asyncio
import nest_asyncio
from playwright.async_api import async_playwright
from PIL import Image
import subprocess
import gradio as gr

from tools.final_answer import FinalAnswerTool

from Gradio_UI import GradioUI

# Patch asyncio to permit nested event loops (needed in Jupyter/Colab/HF Spaces environments).
nest_asyncio.apply()


def _run_setup_command(command):
    """Run one environment-setup command and report a non-zero exit status.

    Setup stays best-effort: a failing command is reported on stdout but does
    not stop the app from starting.

    Args:
        command: The program and its arguments as a list of strings.

    Returns:
        The subprocess.CompletedProcess describing the finished command.
    """
    completed = subprocess.run(command)
    if completed.returncode != 0:
        # Previously the exit status was dropped, so a failed install only
        # surfaced later as an unrelated-looking browser launch error.
        print(f"Warning: {' '.join(command)!r} exited with status {completed.returncode}")
    return completed


# System packages installed ahead of the Chromium download below.
_run_setup_command(["apt-get", "update"])
_run_setup_command(["apt-get", "install", "-y", "libnss3", "libatk1.0-0", "libatk-bridge2.0-0", "libxcomposite1",
                    "libxdamage1"])

# Fetch the Chromium build that capture_screenshot() launches through Playwright.
_run_setup_command(["playwright", "install", "chromium"])

# def install_playwright_and_deps():
#     try:
#         # Install Playwright
#         subprocess.check_call(["pip", "install", "playwright"])
#         subprocess.check_call(["apt-get", "playwright", "install-deps"])
#     except subprocess.CalledProcessError as e:
#         print(f"Error installing Playwright or dependencies: {e}")

# install_playwright_and_deps()

# Below is an example of a tool that does nothing. Amaze us with your creativity !
@tool
def my_custom_tool(arg1: str, arg2: int) -> str:  # it's important to specify the return type
    # Keep the description / Args / per-argument description layout of this
    # docstring, but feel free to change what the tool does.
    """A tool that does nothing yet
    Args:
        arg1: the first argument
        arg2: the second argument
    Returns:
        A fixed placeholder message; both arguments are ignored.
    """
    placeholder_message = "What magic will you build ?"
    return placeholder_message

#https://huggingface.co/black-forest-labs/FLUX.1-dev
#@tool
# def image_generation_tool = Tool.from_space(
#     "black-forest-labs/FLUX.1-schnell",
#     name="image_generator",
#     description="Generate an image from a prompt"
# )


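# Earlier version of capture_screenshot (p5.js editor target), kept commented out for reference.
# Its print statements trace execution for debugging.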
# async def capture_screenshot():
#     print("Launching Playwright...")
#     async with async_playwright() as p:
#         browser = await p.chromium.launch(headless=True)  
#         page = await browser.new_page()
#         print("Opening the p5.js sketch...")
#         await page.goto("https://editor.p5js.org/kfahn/full/2XD5Y8MiV", timeout=6000)

#         print("Waiting for canvas element...")
#         await page.wait_for_selector("canvas")  # Ensure p5.js has loaded
#         await page.wait_for_timeout(5000)  # Additional wait

#         print("Capturing screenshot...")
#         await page.screenshot(path="img.png")
#         await browser.close()
#         print("Screenshot saved!")

async def capture_screenshot(
    url: str = "https://openprocessing.org/sketch/2539973",
    output_path: str = "img.png",
    render_wait_ms: float = 5000,
    navigation_timeout_ms: float = 120000,
) -> None:
    """Open a page in headless Chromium and save a screenshot of it.

    Called without arguments this behaves as before: it opens the
    OpenProcessing sketch 2539973 and writes the screenshot to ``img.png``.

    Args:
        url: Address of the page to open.
        output_path: File the screenshot is written to.
        render_wait_ms: Fixed pause, in milliseconds, between navigation and
            the screenshot so the sketch has time to draw.
        navigation_timeout_ms: Timeout, in milliseconds, passed to the page
            navigation.

    Raises:
        Errors raised by Playwright during launch, navigation or capture are
        not caught here and propagate to the caller.
    """
    # Other targets that were tried previously:
    #   https://thecodingtrain.com/showcase/author/kathy-mcguiness
    #   https://huggingface.co/datasets/hf-vision/course-assets/raw/main/feature-extraction-feature-matching/Flow-Chart-for-SURF-Feature-Detection.png
    print("Launching Playwright...")
    async with async_playwright() as p:
        browser = await p.chromium.launch(headless=True)
        try:
            page = await browser.new_page()

            print(f"Opening page: {url}")
            await page.goto(url, timeout=navigation_timeout_ms)

            # No selector is awaited (the old wait on "img" is disabled);
            # a fixed pause gives the sketch time to render instead.
            print("Waiting for the page to render...")
            await page.wait_for_timeout(render_wait_ms)

            print("Capturing screenshot...")
            await page.screenshot(path=output_path)
        finally:
            # Close the browser explicitly on the failure path as well.
            await browser.close()
        print("Screenshot saved!")
     
@tool
def grab_image() -> Image:
    """
    Fetches an op art image from a p5.js sketch.
    This function uses Playwright to launch a headless browser and grab a screenshot of a p5.js sketch.
    Returns:
        image: The screenshot of the p5.js sketch as an image.
    """
    # NOTE(review): `Image` in the annotation is the PIL.Image module, not the
    # Image.Image class; left unchanged because the @tool decorator reads the
    # annotation -- confirm which one it expects before changing it.
    print("Running async Playwright screenshot...")

    # Create a new event loop for this call (fixes issues on HF Spaces).
    loop = asyncio.new_event_loop()
    try:
        asyncio.set_event_loop(loop)
        loop.run_until_complete(capture_screenshot())
    finally:
        # Do not leave a finished loop installed or open: every tool call
        # creates its own loop, so unclosed ones would pile up.
        asyncio.set_event_loop(None)
        loop.close()

    print("Loading image for Gradio...")
    img = Image.open("img.png")
    # Image.open is lazy: read the pixel data now so the returned image no
    # longer depends on img.png, which the next call overwrites.
    img.load()
    return img


#https://github.com/huggingface/smolagents/blob/main/examples/multiple_tools.py
@tool
def get_joke() -> str:
    """
    Fetches a random joke from the JokeAPI.
    This function sends a GET request to the JokeAPI to retrieve a random joke.
    It handles both single jokes and two-part jokes (setup and delivery).
    If the request fails or the response does not contain a joke, an error message is returned.
    Returns:
        str: The joke as a string, or an error message if the joke could not be fetched.
    """
    # The query asks for single-part jokes; the setup/delivery branch below is
    # kept as a fallback should a two-part joke come back anyway.
    url = "https://v2.jokeapi.dev/joke/Any?type=single"

    try:
        # requests applies no timeout by default, so an unresponsive server
        # would otherwise block the agent step indefinitely.
        response = requests.get(url, timeout=10)
        response.raise_for_status()
        data = response.json()
    except (requests.exceptions.RequestException, ValueError) as e:
        # ValueError covers a non-JSON body on requests versions whose JSON
        # decode error is not a RequestException.
        return f"Error fetching joke: {str(e)}"

    # Anything other than a JSON object cannot carry a joke.
    if not isinstance(data, dict):
        return "Error: Unable to fetch joke."

    if "joke" in data:
        return data["joke"]
    if "setup" in data and "delivery" in data:
        return f"{data['setup']} - {data['delivery']}"
    return "Error: Unable to fetch joke."


@tool
def get_current_time_in_timezone(timezone: str) -> str:
    """A tool that fetches the current local time in a specified timezone.
    Args:
        timezone: A string representing a valid timezone (e.g., 'America/New_York').
    Returns:
        A sentence stating the current local time, or an error message if the lookup fails.
    """
    try:
        # Resolve the zone name, then format the current moment in that zone.
        zone = pytz.timezone(timezone)
        now_in_zone = datetime.datetime.now(zone)
        stamp = now_in_zone.strftime("%Y-%m-%d %H:%M:%S")
    except Exception as err:
        # Failures are handed back as text rather than raised.
        return f"Error fetching time for timezone '{timezone}': {str(err)}"
    return f"The current local time in {timezone} is: {stamp}"


# Final-answer tool; it is registered with the agent further down and must stay in its tool list.
final_answer = FinalAnswerTool()

# If the agent does not answer, the model may be overloaded. Use another model, or this
# Hugging Face endpoint, which also serves Qwen2.5 Coder:
# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'

model = HfApiModel(
    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',  # this model may be overloaded at times
    max_tokens=2096,
    temperature=0.5,
    custom_role_conversions=None,
)


# Import tool from Hub
# NOTE(review): image_generation_tool is loaded but is not in the agent's tool list in this file.
image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)

# Read the prompt templates as UTF-8 explicitly, so that parsing does not
# depend on the platform's default text encoding.
with open("prompts.yaml", 'r', encoding="utf-8") as stream:
    prompt_templates = yaml.safe_load(stream)
    
# Assemble the agent from the model, the registered tools and the YAML prompt templates.
agent = CodeAgent(
    tools=[final_answer, get_joke, grab_image],  # add your tools here (don't remove final answer)
    model=model,
    prompt_templates=prompt_templates,
    max_steps=6,
    verbosity_level=1,
    planning_interval=None,
    grammar=None,
    name=None,
    description=None,
)


# Start the Gradio front end for the agent.
GradioUI(agent).launch()