File size: 4,325 Bytes
09ebcd0
 
eec4d01
efb5f18
09ebcd0
6097fb2
1b298f9
34db24b
 
 
 
 
 
 
 
 
 
 
6097fb2
1b298f9
eec4d01
6097fb2
2efa0ec
eec4d01
 
 
 
 
 
 
 
 
 
 
 
1b298f9
6097fb2
 
eec4d01
 
 
6097fb2
 
eec4d01
6097fb2
 
 
 
 
1b298f9
6097fb2
efb5f18
 
 
a4f4206
 
 
efb5f18
 
a4f4206
 
efb5f18
 
 
a4f4206
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6097fb2
a4f4206
efb5f18
 
158b524
eec4d01
34db24b
 
eec4d01
6097fb2
68a8b0c
a4f4206
6097fb2
ab30506
6097fb2
34db24b
6097fb2
 
 
ad0f104
efb5f18
a4f4206
 
ad0f104
 
94b1606
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
import gradio as gr
import requests
import json
from datetime import datetime, timedelta

API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6"

MAJOR_COUNTRIES = [
    "United States", "United Kingdom", "Canada", "Australia", "Germany", 
    "France", "Japan", "South Korea", "China", "India", 
    "Brazil", "Mexico", "Russia", "Italy", "Spain", 
    "Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", 
    "Finland", "Belgium", "Austria", "New Zealand", "Ireland", 
    "Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", 
    "South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", 
    "Hungary", "Greece", "Portugal", "Argentina", "Chile", 
    "Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", 
    "Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh"
]

def search_serphouse(query, country, verbatim, page, num_result):
    url = "https://api.serphouse.com/serp/live"
    
    payload = {
        "data": {
            "q": query,
            "domain": "google.com",
            "loc": country,
            "lang": "en",
            "device": "desktop",
            "serp_type": "news",
            "page": str(page),
            "verbatim": verbatim,
            "num": str(num_result)
        }
    }
    
    headers = {
        "accept": "application/json",
        "content-type": "application/json",
        "authorization": f"Bearer {API_KEY}"
    }
    
    response = requests.post(url, json=payload, headers=headers)
    
    if response.status_code == 200:
        return response.json()
    else:
        return f"Error: {response.status_code} - {response.text}"

def format_results(results):
    now = datetime.now()
    html_output = "<h2>Search Results</h2>"
    
    # 디버깅: API 응답 전체를 출력
    html_output += f"<pre>{json.dumps(results, indent=2)}</pre>"
    
    if isinstance(results, dict) and "results" in results:
        news_results = results["results"].get("news", [])
        if not news_results:
            html_output += "<p>No news results found in the API response.</p>"
        for result in news_results:
            time_str = result.get("time", "").strip()
            if time_str.endswith("ago"):
                time_parts = time_str.split()
                if len(time_parts) >= 2:
                    try:
                        time_value = int(time_parts[0])
                        time_unit = time_parts[1]
                        
                        if time_unit in ["minute", "minutes", "hour", "hours"] and time_value <= 24:
                            html_output += f"""
                            <div style='border: 1px solid #ddd; padding: 10px; margin-bottom: 10px;'>
                                <h3><a href='{result.get('url', '#')}'>{result.get('title', 'No Title')}</a></h3>
                                <p>{result.get('snippet', 'No Snippet')}</p>
                                <p><small>Source: {result.get('channel', 'Unknown')} - {result.get('time', 'Unknown time')}</small></p>
                            </div>
                            """
                    except ValueError:
                        html_output += f"<p>Error parsing time: {time_str}</p>"
                else:
                    html_output += f"<p>Invalid time format: {time_str}</p>"
            else:
                html_output += f"<p>Unexpected time format: {time_str}</p>"
    else:
        html_output += "<p>Unexpected response format or no results found.</p>"
    
    return html_output

def serphouse_search(query, country, verbatim, page, num_result):
    verbatim = "1" if verbatim else "0"
    
    results = search_serphouse(query, country, verbatim, page, num_result)
    return format_results(results)

iface = gr.Interface(
    fn=serphouse_search,
    inputs=[
        gr.Textbox(label="Search Query"),
        gr.Dropdown(MAJOR_COUNTRIES, label="Country"),
        gr.Checkbox(label="Verbatim"),
        gr.Slider(1, 10, 1, label="Page"),
        gr.Slider(1, 100, 10, label="Number of Results")
    ],
    outputs="html",
    title="SERPHouse News Search Interface",
    description="Enter your search query and select a country to get news results from the SERPHouse API. Only articles from the last 24 hours will be displayed."
)

iface.launch()