First_agent_template

Sleeping

dygoo committed on Feb 14

Commit

29ebc9b

verified ·

1 Parent(s): 6fd9231

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -22,7 +22,7 @@ site_config = {
 @tool
-def get_latest_news(news_sites: List[str]) -> Dict[str,List[str]]:
     """
     Tool returns news headlines from multiple news sites.
@@ -31,19 +31,26 @@ def get_latest_news(news_sites: List[str]) -> Dict[str,List[str]]:
     Returns:
         Dict[str, List[str]]: A dictionary where the keys are the news site URLs and the values are lists of headlines.
     """
     headlines = {}
     for site in news_sites:
         try:
-            config = site_config.get(site,{'tag': 'h2', 'class':'headline'})
             response = requests.get(site)
             response.raise_for_status()
             soup = BeautifulSoup(response.content, 'html.parser')
-            site_headlines=soup.find_all(config['tag'], class_ = config['class'])
             headlines[site] = [headline.text for headline in site_headlines]
         except requests.RequestException as e:
-            headlines[site] = f"Error fetching news:{e}"
     return headlines

 @tool
def get_latest_news(news_sites: List[str]) -> Dict[str, List[str]]:
    """
    Tool returns news headlines from multiple news sites.

    Args:
        news_sites: URLs of the news sites to fetch headlines from.

    Returns:
        Dict[str, List[str]]: A dictionary where the keys are the news site URLs and the values are lists of headlines.
        If a site cannot be fetched, its value is a single-element list holding the error message,
        so every value has the same type.

    Notes:
        The function uses a predefined `site_config` dictionary to determine the HTML tag and class to extract headlines from each site.
        The `site_config` dictionary should have the following structure:
        {
            "site_url": {'tag': 'html_tag', 'class': 'css_class'}
        }
        If a site is not found in `site_config`, it defaults to {'tag': 'h2', 'class': 'headline'}.
    """
    # Fallback selector for sites without an entry in `site_config`; built once, not per site.
    default_config = {'tag': 'h2', 'class': 'headline'}
    # Without a timeout a single unresponsive site would block the whole tool call.
    request_timeout_seconds = 10

    headlines: Dict[str, List[str]] = {}
    for site in news_sites:
        config = site_config.get(site, default_config)
        try:
            response = requests.get(site, timeout=request_timeout_seconds)
            # Turn HTTP error statuses into RequestException so they reach the handler below.
            response.raise_for_status()
        except requests.RequestException as e:
            # Keep the declared List[str] value type: wrap the message instead of storing a bare str.
            headlines[site] = [f"Error fetching news: {e}"]
            continue

        soup = BeautifulSoup(response.content, 'html.parser')
        site_headlines = soup.find_all(config['tag'], class_=config['class'])
        headlines[site] = [headline.text for headline in site_headlines]
    return headlines