Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -1,11 +1,9 @@
|
|
|
|
1 |
import requests
|
|
|
2 |
from requests.adapters import HTTPAdapter
|
3 |
from requests.packages.urllib3.util.retry import Retry
|
4 |
-
from
|
5 |
-
import gradio as gr
|
6 |
-
import datetime
|
7 |
-
import pandas as pd
|
8 |
-
import xlsxwriter
|
9 |
|
10 |
def setup_session():
|
11 |
session = requests.Session()
|
@@ -21,17 +19,18 @@ def generate_naver_search_url(query):
|
|
21 |
return url
|
22 |
|
23 |
def crawl_naver_search_results(url):
|
24 |
-
|
|
|
25 |
soup = BeautifulSoup(response.text, "html.parser")
|
26 |
results = []
|
27 |
-
for li in soup.find_all("li", class_="bx"):
|
28 |
for div in li.find_all("div", class_="detail_box"):
|
29 |
-
for div2 in div.find_all("div", class_
|
30 |
title = div2.text.strip()
|
31 |
for a in div2.find_all("a", href=True):
|
32 |
link = a["href"]
|
33 |
-
results.append(
|
34 |
-
return "
|
35 |
|
36 |
with gr.Interface(
|
37 |
fn=lambda query: crawl_naver_search_results(generate_naver_search_url(query)),
|
|
|
1 |
+
import gradio as gr
|
2 |
import requests
|
3 |
+
from bs4 import BeautifulSoup
|
4 |
from requests.adapters import HTTPAdapter
|
5 |
from requests.packages.urllib3.util.retry import Retry
|
6 |
+
from tabulate import tabulate
|
|
|
|
|
|
|
|
|
7 |
|
8 |
def setup_session():
|
9 |
session = requests.Session()
|
|
|
19 |
return url
|
20 |
|
21 |
def crawl_naver_search_results(url):
|
22 |
+
session = setup_session()
|
23 |
+
response = session.get(url)
|
24 |
soup = BeautifulSoup(response.text, "html.parser")
|
25 |
results = []
|
26 |
+
for li in soup.find_all("li", class_="bx")[:10]:
|
27 |
for div in li.find_all("div", class_="detail_box"):
|
28 |
+
for div2 in div.find_all("div", class_="title_area"):
|
29 |
title = div2.text.strip()
|
30 |
for a in div2.find_all("a", href=True):
|
31 |
link = a["href"]
|
32 |
+
results.append([title, link])
|
33 |
+
return tabulate(results, headers=["제목", "링크"], tablefmt="grid")
|
34 |
|
35 |
with gr.Interface(
|
36 |
fn=lambda query: crawl_naver_search_results(generate_naver_search_url(query)),
|