Spaces:

fdaudens
/

perspicacity

Running

App Files Files Community

fdaudens HF Staff committed on May 2

Commit

4c2fdec

verified ·

1 Parent(s): 71dd8bc

Update app.py

Browse files

update chatbot

Files changed (1) hide show

app.py +57 -65

app.py CHANGED Viewed

@@ -1,4 +1,3 @@
-# app.py
 import os
 import logging
 import asyncio
@@ -19,13 +18,10 @@ from llama_index.llms.huggingface_api import HuggingFaceInferenceAPI
 from llama_index.core.memory import ChatMemoryBuffer
 from llama_index.readers.web import RssReader
-import subprocess
-subprocess.run(["playwright", "install"])
-# allow nested loops in Spaces
-nest_asyncio.apply()
-# --- Llangfuse ---
 instrumentor = LlamaIndexInstrumentor(
     public_key=os.environ.get("LANGFUSE_PUBLIC_KEY"),
     secret_key=os.environ.get("LANGFUSE_SECRET_KEY"),
@@ -33,84 +29,80 @@ instrumentor = LlamaIndexInstrumentor(
 )
 instrumentor.start()
-# --- Secrets via env vars ---
-HF_TOKEN            = os.getenv("HF_TOKEN")
-# OPENAI_API_KEY      = os.getenv("OPENAI_API_KEY")
-OPENWEATHERMAP_KEY  = os.getenv("OPENWEATHERMAP_API_KEY")
-SERPER_API_KEY      = os.getenv("SERPER_API_KEY")
-# --- LLMs ---
 llm = HuggingFaceInferenceAPI(
     model_name="Qwen/Qwen2.5-Coder-32B-Instruct",
-    token=HF_TOKEN,
     task="conversational"
 )
-memory = ChatMemoryBuffer.from_defaults(token_limit=8192)
 today_str = datetime.now().strftime("%B %d, %Y")
 ANON_USER_ID = os.environ.get("ANON_USER_ID", uuid.uuid4().hex)
-# # OpenAI for pure function-calling
-# openai_llm = OpenAI(
-#     model="gpt-4o",
-#     api_key=OPENAI_API_KEY,
-#     temperature=0.0,
-#     streaming=False,
-# )
-# --- Tools Setup ---
-# DuckDuckGo
-duck_spec = DuckDuckGoSearchToolSpec()
-search_tool = FunctionTool.from_defaults(duck_spec.duckduckgo_full_search)
-# Weather
-openweather_api_key=OPENWEATHERMAP_KEY
-weather_tool_spec = OpenWeatherMapToolSpec(key=openweather_api_key)
-weather_tool_spec = OpenWeatherMapToolSpec(key=openweather_api_key)
 weather_tool = FunctionTool.from_defaults(
-    weather_tool_spec.weather_at_location,
     name="current_weather",
-    description="Get the current weather at a specific location (city, country)."
 )
 forecast_tool = FunctionTool.from_defaults(
-    weather_tool_spec.forecast_tommorrow_at_location,
     name="weather_forecast",
-    description="Get tomorrow's weather forecast for a specific location (city, country)."
 )
-# Playwright (synchronous start)
-async def _start_browser():
-    return await PlaywrightToolSpec.create_async_playwright_browser(headless=True)
-browser = asyncio.get_event_loop().run_until_complete(_start_browser())
 playwright_tool_spec = PlaywrightToolSpec.from_async_browser(browser)
 navigate_tool = FunctionTool.from_defaults(
     playwright_tool_spec.navigate_to,
     name="web_navigate",
-    description="Navigate to a specific URL."
 )
 extract_text_tool = FunctionTool.from_defaults(
     playwright_tool_spec.extract_text,
     name="web_extract_text",
-    description="Extract all text from the current page."
 )
 extract_links_tool = FunctionTool.from_defaults(
     playwright_tool_spec.extract_hyperlinks,
     name="web_extract_links",
-    description="Extract all hyperlinks from the current page."
 )
-# Google News RSS
 def fetch_google_news_rss():
-    docs = RssReader(html_to_text=True).load_data(["https://news.google.com/rss"])
-    return [{"title":d.metadata.get("title",""), "url":d.metadata.get("link","")} for d in docs]
 google_rss_tool = FunctionTool.from_defaults(
-    fn=fetch_google_news_rss,
     name="fetch_google_news_rss",
-    description="Fetch latest headlines and URLs from Google News RSS."
 )
-# Serper
 async def fetch_serper_news(query: str):
     if not serper_api_key:
         raise ValueError("Missing SERPER_API_KEY environment variable")
@@ -124,12 +116,12 @@ async def fetch_serper_news(query: str):
 serper_news_tool = FunctionTool.from_defaults(
     fetch_serper_news,
     name="fetch_news_from_serper",
-    description="Fetch news articles on a given topic via the Serper API."
 )
 # Create the agent workflow
 tools = [
-    search_tool,
     navigate_tool,
     extract_text_tool,
     extract_links_tool,
@@ -162,26 +154,26 @@ async def run_query(query: str):
 # Gradio interface function
 async def gradio_query(user_input, chat_history=None):
-    chat_history = chat_history or []
     result = await run_query(user_input)
-    response = result.response
-    chat_history.append((user_input, response))
-    return chat_history, chat_history
 # Build and launch Gradio app
 grb = gr.Blocks()
 with grb:
-    gr.Markdown("## Perspicacity")
-    gr.Markdown(
-        "This bot can check the news, tell you the weather, and even browse websites to answer follow-up questions — all powered by a team of tiny AI agents working behind the scenes.\n\n"
-        "🧪 Built for fun during the [AI Agents course](https://huggingface.co/learn/agents-course/unit0/introduction) — it's just a demo to show what agents can do.  \n"
-        "🙌 Got ideas or improvements? PRs welcome!  \n\n"
-        "👉 _Try asking “What’s the weather in Montreal?” or “What’s in the news today?”_"
-    )
-    chatbot = gr.Chatbot()  # conversation UI
     txt = gr.Textbox(placeholder="Ask me anything...", show_label=False)
     txt.submit(gradio_query, [txt, chatbot], [chatbot, chatbot])
     gr.Button("Send").click(gradio_query, [txt, chatbot], [chatbot, chatbot])
 if __name__ == "__main__":
-    grb.launch()

 import os
 import logging
 import asyncio
 from llama_index.core.memory import ChatMemoryBuffer
 from llama_index.readers.web import RssReader
+# Configure logging
+logging.getLogger("langfuse").setLevel(logging.WARNING)
+# Initialize Langfuse instrumentor
 instrumentor = LlamaIndexInstrumentor(
     public_key=os.environ.get("LANGFUSE_PUBLIC_KEY"),
     secret_key=os.environ.get("LANGFUSE_SECRET_KEY"),
 )
 instrumentor.start()
+# Environment variables
+hf_token = os.environ.get("HF_TOKEN")
+openweather_api_key = os.environ.get("OPENWEATHER_API_KEY")
+serper_api_key = os.environ.get("SERPER_API_KEY")
+# Initialize LLM and conversation memory
 llm = HuggingFaceInferenceAPI(
     model_name="Qwen/Qwen2.5-Coder-32B-Instruct",
+    token=hf_token,
     task="conversational"
 )
+memory = ChatMemoryBuffer.from_defaults(token_limit=4096)
 today_str = datetime.now().strftime("%B %d, %Y")
 ANON_USER_ID = os.environ.get("ANON_USER_ID", uuid.uuid4().hex)
+# Define tools
+# DuckDuckGo web search
+duckduckgo_tool = FunctionTool.from_defaults(
+    DuckDuckGoSearchToolSpec().duckduckgo_full_search
+)
+# Weather tools
 weather_tool = FunctionTool.from_defaults(
+    OpenWeatherMapToolSpec(key=openweather_api_key).weather_at_location,
     name="current_weather",
+    description="Get the current weather for a city/country."
 )
 forecast_tool = FunctionTool.from_defaults(
+    OpenWeatherMapToolSpec(key=openweather_api_key).forecast_tommorrow_at_location,
     name="weather_forecast",
+    description="Get tomorrow's weather forecast for a city/country."
 )
+# Playwright tools setup
+nest_asyncio.apply()
+browser = asyncio.get_event_loop().run_until_complete(
+    PlaywrightToolSpec.create_async_playwright_browser(
+        headless=True,
+        args=["--no-sandbox", "--disable-setuid-sandbox"]
+    )
+)
 playwright_tool_spec = PlaywrightToolSpec.from_async_browser(browser)
 navigate_tool = FunctionTool.from_defaults(
     playwright_tool_spec.navigate_to,
     name="web_navigate",
+    description="Navigate to a URL."
 )
 extract_text_tool = FunctionTool.from_defaults(
     playwright_tool_spec.extract_text,
     name="web_extract_text",
+    description="Extract text from the current page."
 )
 extract_links_tool = FunctionTool.from_defaults(
     playwright_tool_spec.extract_hyperlinks,
     name="web_extract_links",
+    description="Extract hyperlinks from the current page."
 )
+# Google News RSS tool
 def fetch_google_news_rss():
+    reader = RssReader(html_to_text=True)
+    docs = reader.load_data(["https://news.google.com/rss"])
+    return [
+        {"title": doc.metadata.get("title", "").strip(), "url": doc.metadata.get("link", "")} for doc in docs
+    ]
 google_rss_tool = FunctionTool.from_defaults(
+    fetch_google_news_rss,
     name="fetch_google_news_rss",
+    description="Get latest headlines and URLs from Google News RSS feed."
 )
+# Serper news API tool
 async def fetch_serper_news(query: str):
     if not serper_api_key:
         raise ValueError("Missing SERPER_API_KEY environment variable")
 serper_news_tool = FunctionTool.from_defaults(
     fetch_serper_news,
     name="fetch_news_from_serper",
+    description="Fetch news articles on a topic via Serper API."
 )
 # Create the agent workflow
 tools = [
+    duckduckgo_tool,
     navigate_tool,
     extract_text_tool,
     extract_links_tool,
 # Gradio interface function
 async def gradio_query(user_input, chat_history=None):
+    history = chat_history or []
     result = await run_query(user_input)
+    # Ensure text-only content and strip any role prefix
+    resp_text = str(result.response)
+    if resp_text.lower().startswith("assistant:"):
+        resp_text = resp_text.split(":", 1)[1].strip()
+    # Append OpenAI-style message dicts
+    history.append({"role": "user", "content": user_input})
+    history.append({"role": "assistant", "content": resp_text})
+    return history, history
 # Build and launch Gradio app
 grb = gr.Blocks()
 with grb:
+    gr.Markdown("## AI Web Agent")
+    chatbot = gr.Chatbot(type="messages")  # use openai-style messages
     txt = gr.Textbox(placeholder="Ask me anything...", show_label=False)
     txt.submit(gradio_query, [txt, chatbot], [chatbot, chatbot])
     gr.Button("Send").click(gradio_query, [txt, chatbot], [chatbot, chatbot])
 if __name__ == "__main__":
+    # share=True if you want a public Space link
+    grb.launch()