Spaces:
Running
Running
File size: 3,006 Bytes
372531f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 |
# Tavily API Retriever
# libraries
import os
import requests
import json
class GoogleSearch:
"""
Google API Retriever
"""
def __init__(self, query, headers=None):
"""
Initializes the TavilySearch object
Args:
query:
"""
self.query = query
self.headers = headers or {}
self.api_key = self.headers.get("google_api_key") or self.get_api_key() # Use the passed api_key or fallback to environment variable
self.cx_key = self.headers.get("google_cx_key") or self.get_cx_key() # Use the passed cx_key or fallback to environment variable
def get_api_key(self):
"""
Gets the Google API key
Returns:
"""
# Get the API key
try:
api_key = os.environ["GOOGLE_API_KEY"]
except:
raise Exception("Google API key not found. Please set the GOOGLE_API_KEY environment variable. "
"You can get a key at https://developers.google.com/custom-search/v1/overview")
return api_key
def get_cx_key(self):
"""
Gets the Google CX key
Returns:
"""
# Get the API key
try:
api_key = os.environ["GOOGLE_CX_KEY"]
except:
raise Exception("Google CX key not found. Please set the GOOGLE_CX_KEY environment variable. "
"You can get a key at https://developers.google.com/custom-search/v1/overview")
return api_key
def search(self, max_results=7):
"""
Searches the query
Returns:
"""
"""Useful for general internet search queries using the Google API."""
print("Searching with query {0}...".format(self.query))
url = f"https://www.googleapis.com/customsearch/v1?key={self.api_key}&cx={self.cx_key}&q={self.query}&start=1"
resp = requests.get(url)
if resp.status_code < 200 or resp.status_code >= 300:
print("Google search: unexpected response status: ", resp.status_code)
if resp is None:
return
try:
search_results = json.loads(resp.text)
except Exception:
return
if search_results is None:
return
results = search_results.get("items", [])
search_results = []
# Normalizing results to match the format of the other search APIs
for result in results:
# skip youtube results
if "youtube.com" in result["link"]:
continue
try:
search_result = {
"title": result["title"],
"href": result["link"],
"body": result["snippet"],
}
except:
continue
search_results.append(search_result)
return search_results[:max_results]
|