Final_Assignment_Template

Sleeping

App Files Files Community

tatianija committed on Jul 3

Commit

adacbb6

verified ·

1 Parent(s): d6efa0a

Update app.py

Browse files

Files changed (1) hide show

app.py +59 -1

app.py CHANGED Viewed

@@ -28,6 +28,64 @@ cached_answers = {}
 cached_questions = []
 processing_status = {"is_processing": False, "progress": 0, "total": 0}
 # --- Web Content Fetcher ---
 class WebContentFetcher:
     def __init__(self, debug: bool = True):
@@ -389,7 +447,7 @@ class AudioTranscriptionTool:
 # --- Enhanced Intelligent Agent with Direct Attachment Processing ---
 class IntelligentAgent:
     def __init__(self, debug: bool = True, model_name: str = "meta-llama/Llama-3.1-8B-Instruct"):
-        self.search_tool = DuckDuckGoSearchTool()
         self.client = InferenceClient(model=model_name, provider="sambanova")
         self.image_tool = ImageAnalysisTool()
         self.audio_tool = AudioTranscriptionTool()

 cached_questions = []
 processing_status = {"is_processing": False, "progress": 0, "total": 0}
+# Simple search tool used instead of DuckDuckGoSearchTool:
+class SimpleSearchTool:
+    """
+    Simple search tool that scrapes DuckDuckGo HTML results.
+    Drop-in replacement for DuckDuckGoSearchTool.
+
+    ``run(query)`` returns a plain-text, numbered list of up to
+    ``MAX_RESULTS`` results (title, URL and optional snippet). It does not
+    raise: any failure is reported as a ``"Search failed: ..."`` string.
+    """
+
+    # Upper bound on the number of results included in the output.
+    MAX_RESULTS = 5
+    # Seconds to wait for the search page before giving up.
+    TIMEOUT = 10
+
+    def __init__(self):
+        # A single session so the browser-like User-Agent below is sent with
+        # every request made by this tool.
+        self.session = requests.Session()
+        self.session.headers.update({
+            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36'
+        })
+
+    @staticmethod
+    def _resolve_url(href: str) -> str:
+        """Return the real target URL for a result link.
+
+        The HTML endpoint commonly wraps result links in a redirect of the
+        form ``//duckduckgo.com/l/?uddg=<encoded target>``. When that shape
+        is detected the decoded target is returned; otherwise the link is
+        returned as-is (with ``https:`` added to protocol-relative links).
+        """
+        if href.startswith('//'):
+            href = 'https:' + href
+        parts = urllib.parse.urlsplit(href)
+        on_ddg = not parts.netloc or parts.netloc.endswith('duckduckgo.com')
+        if on_ddg and parts.path.rstrip('/') == '/l':
+            # parse_qs already percent-decodes the value.
+            targets = urllib.parse.parse_qs(parts.query).get('uddg')
+            if targets:
+                return targets[0]
+        return href
+
+    def _format_result(self, container, index: int) -> str:
+        """Format one result container as a numbered entry.
+
+        Returns an empty string when the container has no usable title/URL,
+        which tells the caller to skip it.
+        """
+        title_elem = container.find('a', class_='result__a')
+        if not title_elem:
+            return ''
+        title = title_elem.get_text().strip()
+        target = self._resolve_url(title_elem.get('href', ''))
+        if not (title and target):
+            return ''
+        snippet_elem = container.find('a', class_='result__snippet')
+        snippet = snippet_elem.get_text().strip() if snippet_elem else ''
+        entry = f"{index}. {title}\n   URL: {target}\n"
+        if snippet:
+            entry += f"   Snippet: {snippet}\n"
+        return entry
+
+    def run(self, query: str) -> str:
+        """Search and return formatted results.
+
+        Args:
+            query: Free-text search query.
+
+        Returns:
+            The formatted results joined by newlines, ``"No search results
+            found."`` when nothing usable was parsed, or ``"Search failed:
+            <error>"`` if the request or parsing raised.
+        """
+        try:
+            # Encode query for URL
+            encoded_query = urllib.parse.quote_plus(query)
+            search_url = f"https://html.duckduckgo.com/html/?q={encoded_query}"
+            response = self.session.get(search_url, timeout=self.TIMEOUT)
+            response.raise_for_status()
+            soup = BeautifulSoup(response.content, 'html.parser')
+            results = []
+            # Walk every result container until MAX_RESULTS usable entries
+            # are collected, so skipped containers neither shrink the list
+            # nor leave gaps in the numbering.
+            for container in soup.find_all('div', class_='result__body'):
+                if len(results) >= self.MAX_RESULTS:
+                    break
+                try:
+                    entry = self._format_result(container, len(results) + 1)
+                except (AttributeError, TypeError, ValueError):
+                    # Best effort: one malformed result must not sink the rest.
+                    continue
+                if entry:
+                    results.append(entry)
+            return "\n".join(results) if results else "No search results found."
+        except Exception as e:
+            # Boundary of the tool: callers expect a string, never an exception.
+            return f"Search failed: {str(e)}"
 # --- Web Content Fetcher ---
 class WebContentFetcher:
     def __init__(self, debug: bool = True):
 # --- Enhanced Intelligent Agent with Direct Attachment Processing ---
 class IntelligentAgent:
     def __init__(self, debug: bool = True, model_name: str = "meta-llama/Llama-3.1-8B-Instruct"):
+        self.search_tool = SimpleSearchTool()
         self.client = InferenceClient(model=model_name, provider="sambanova")
         self.image_tool = ImageAnalysisTool()
         self.audio_tool = AudioTranscriptionTool()