Spaces:

AIRider
/

Youtube_Anal_v1

Sleeping

App Files Community

AIRider committed on Jul 25, 2024

Commit

b6549ee

verified ·

1 Parent(s): a629f01

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -18

app.py CHANGED Viewed

@@ -8,15 +8,19 @@ from sklearn.feature_extraction.text import TfidfVectorizer
 from sklearn.cluster import KMeans
 from datetime import datetime, timedelta
 import os
-from transformers import InferenceClient  # 가정: transformers 모듈 사용
 def create_client(model_name):
-    return InferenceClient(model_name, token=os.getenv("HF_TOKEN"))
 client = create_client("CohereForAI/c4ai-command-r-plus")
-def get_video_stats(api_key, video_id):
-    youtube = build("youtube", "v3", developerKey=api_key)
     video_response = youtube.videos().list(
         part="snippet,statistics",
         id=video_id
@@ -40,8 +44,8 @@ def get_video_stats(api_key, video_id):
         "Comment Count": comment_count
     }
-def get_channel_stats(api_key, channel_id):
-    youtube = build("youtube", "v3", developerKey=api_key)
     channel_response = youtube.channels().list(
         part="statistics",
         id=channel_id
@@ -55,8 +59,8 @@ def get_channel_stats(api_key, channel_id):
     return subscriber_count
-def get_video_data(api_key, query, max_results, published_after, published_before):
-    youtube = build("youtube", "v3", developerKey=api_key)
     video_ids = []
     next_page_token = None
@@ -82,9 +86,9 @@ def get_video_data(api_key, query, max_results, published_after, published_befor
     video_stats = []
     for video_id in video_ids:
-        stats = get_video_stats(api_key, video_id)
         channel_id = stats["Channel ID"]
-        subscriber_count = get_channel_stats(api_key, channel_id)
         stats["Subscriber Count"] = subscriber_count
         video_stats.append(stats)
@@ -130,14 +134,11 @@ def analyze_titles(video_stats_df, n_clusters=5):
     return cluster_summary_df
 def summarize_cluster(cluster_text, cluster_num):
-    response = client.generate(
-        prompt=f"다음 동영상을 분석하여 요약하고, 500자 이내로 동영상의 특징 및 인기 요인을 설명해주세요: {cluster_text}",
-        max_tokens=500
-    )
-    summary = response['choices'][0]['text'].strip()
     return summary
-def main(api_key, query, max_results, period, page, n_clusters=5):
     if query:
         #  기간 설정
         now = datetime.utcnow()
@@ -151,7 +152,7 @@ def main(api_key, query, max_results, period, page, n_clusters=5):
         else:
             published_after = (now - timedelta(days=30)).isoformat("T") + "Z"  # 기본값 1개월
-        video_stats_df = get_video_data(api_key, query, max_results, published_after, published_before)
         if page == "Video Ranking":
             video_stats_df, fig, csv_download_link = visualize_video_ranking(video_stats_df)
@@ -164,7 +165,6 @@ def main(api_key, query, max_results, period, page, n_clusters=5):
 iface = gr.Interface(
     fn=main,
     inputs=[
-        gr.components.Textbox(label="YouTube API Key를 입력하세요", type="password"),
         gr.components.Textbox(label="검색 쿼리"),
         gr.components.Slider(minimum=1, maximum=1000, value=5, label="최대 결과 수"),
         gr.components.Dropdown(["1주일", "1개월", "3개월"], label="기간"),

 from sklearn.cluster import KMeans
 from datetime import datetime, timedelta
 import os
+from huggingface_hub import InferenceApi  # Hugging Face Hub API 사용
+# 여기에 YouTube API 키를 입력하세요
+YOUTUBE_API_KEY = "YOUR_YOUTUBE_API_KEY"
 def create_client(model_name):
+    token = os.getenv("HF_TOKEN")
+    return InferenceApi(repo_id=model_name, token=token)
 client = create_client("CohereForAI/c4ai-command-r-plus")
+def get_video_stats(video_id):
+    youtube = build("youtube", "v3", developerKey=YOUTUBE_API_KEY)
     video_response = youtube.videos().list(
         part="snippet,statistics",
         id=video_id
         "Comment Count": comment_count
     }
+def get_channel_stats(channel_id):
+    youtube = build("youtube", "v3", developerKey=YOUTUBE_API_KEY)
     channel_response = youtube.channels().list(
         part="statistics",
         id=channel_id
     return subscriber_count
+def get_video_data(query, max_results, published_after, published_before):
+    youtube = build("youtube", "v3", developerKey=YOUTUBE_API_KEY)
     video_ids = []
     next_page_token = None
     video_stats = []
     for video_id in video_ids:
+        stats = get_video_stats(video_id)
         channel_id = stats["Channel ID"]
+        subscriber_count = get_channel_stats(channel_id)
         stats["Subscriber Count"] = subscriber_count
         video_stats.append(stats)
     return cluster_summary_df
 def summarize_cluster(cluster_text, cluster_num):
+    response = client(inputs=cluster_text)
+    summary = response[0]["generated_text"].strip()
     return summary
+def main(query, max_results, period, page, n_clusters=5):
     if query:
         #  기간 설정
         now = datetime.utcnow()
         else:
             published_after = (now - timedelta(days=30)).isoformat("T") + "Z"  # 기본값 1개월
+        video_stats_df = get_video_data(query, max_results, published_after, published_before)
         if page == "Video Ranking":
             video_stats_df, fig, csv_download_link = visualize_video_ranking(video_stats_df)
 iface = gr.Interface(
     fn=main,
     inputs=[
         gr.components.Textbox(label="검색 쿼리"),
         gr.components.Slider(minimum=1, maximum=1000, value=5, label="최대 결과 수"),
         gr.components.Dropdown(["1주일", "1개월", "3개월"], label="기간"),