kai-ytb-private-reply

Build error

App Files Files Community

seawolf2357 committed on Sep 18, 2024

Commit

7524905

verified ·

1 Parent(s): b17754f

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -53

app.py CHANGED Viewed

@@ -5,9 +5,10 @@ import re
 import asyncio
 import subprocess
 import aiohttp
 from huggingface_hub import InferenceClient
 from googleapiclient.discovery import build
-from youtube_transcript_api import YouTubeTranscriptApi
 from youtube_transcript_api.formatters import TextFormatter
 from dotenv import load_dotenv
@@ -26,7 +27,6 @@ intents.guild_messages = True
 # 추론 API 클라이언트 설정
 hf_client = InferenceClient("CohereForAI/c4ai-command-r-plus-08-2024", token=os.getenv("HF_TOKEN"))
-#hf_client = InferenceClient("CohereForAI/aya-23-35B", token=os.getenv("HF_TOKEN"))
 # YouTube API 설정
 API_KEY = os.getenv("YOUTUBE_API_KEY")
@@ -35,9 +35,6 @@ youtube_service = build('youtube', 'v3', developerKey=API_KEY)
 # 특정 채널 ID
 SPECIFIC_CHANNEL_ID = int(os.getenv("DISCORD_CHANNEL_ID"))
-# 웹훅 URL 설정
-#WEBHOOK_URL = "https://connect.pabbly.com/workflow/sendwebhookdata/IjU3NjUwNTY1MDYzMjA0MzA1MjY4NTUzMDUxMzUi_pc"
 # 전송 실패 시 재시도 횟수
 MAX_RETRIES = 3
@@ -109,26 +106,34 @@ def extract_video_id(url):
     logging.debug(f'추출된 비디오 ID: {video_id}')
     return video_id
-async def get_best_available_transcript(video_id):
-    try:
-        transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['ko'])
-    except Exception as e:
-        logging.warning(f'한국어 자막 가져오기 오류: {e}')
         try:
-            transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['en'])
         except Exception as e:
-            logging.warning(f'영어 자막 가져오기 오류: {e}')
             try:
-                transcripts = YouTubeTranscriptApi.list_transcripts(video_id)
-                transcript = transcripts.find_manually_created_transcript().fetch()
             except Exception as e:
-                logging.error(f'대체 자막 가져오기 오류: {e}')
-                return None
-    formatter = TextFormatter()
-    transcript_text = formatter.format_transcript(transcript)
-    logging.debug(f'가져온 자막: {transcript_text}')
-    return transcript_text
 async def get_video_comments(video_id):
     comments = []
@@ -150,7 +155,7 @@ async def generate_replies(comments, transcript):
     replies = []
     for comment, _ in comments:
         messages = [
-            {"role": "system", "content": """너의 이름은 OpenFreeAI이다. 답글 생성후 가장 마지막에 너의 이름을 밝히고 공손하게 인사하라. 비디오 자막: {transcript}"""},
             {"role": "user", "content": comment}
         ]
         loop = asyncio.get_event_loop()
@@ -166,43 +171,13 @@ async def generate_replies(comments, transcript):
     logging.debug(f'생성된 답글: {replies}')
     return replies
-async def send_webhook_data(session, chunk_data, chunk_number):
-    for attempt in range(MAX_RETRIES):
-        try:
-            async with session.post(WEBHOOK_URL, json=chunk_data) as resp:
-                if resp.status == 200:
-                    logging.info(f"웹훅으로 데이터 전송 성공: {chunk_number} 번째 시도")
-                    return True  # 성공 시 종료
-                else:
-                    logging.error(f"웹훅으로 데이터 전송 실패: {resp.status}, {chunk_number} 번째 시도")
-        except aiohttp.ClientError as e:
-            logging.error(f"웹훅 전송 중 오류 발생: {e}, {chunk_number} 번째 시도")
-        await asyncio.sleep(1)  # 재시도 전에 잠시 대기
-    return False  # 재시도 횟수 초과 시 실패로 간주
 async def create_thread_and_send_replies(message, video_id, comments, replies, session):
     thread = await message.channel.create_thread(name=f"{message.author.name}의 댓글 답글", message=message)
-    webhook_data = {"video_id": video_id, "replies": []}
     for (comment, comment_id), reply in zip(comments, replies):
         embed = discord.Embed(description=f"**댓글**: {comment}\n**답글**: {reply}")
         await thread.send(embed=embed)
-        # 웹훅 데이터 준비 (comment id 포함)
-        webhook_data["replies"].append({"comment": comment, "reply": reply, "comment_id": comment_id})
-    # 데이터를 여러 번 나누어 전송
-    chunk_size = 1  # 전송할 데이터의 개수를 1로 설정하여 각 데이터를 별도로 전송
-    for i in range(0, len(webhook_data["replies"]), chunk_size):
-        chunk = webhook_data["replies"][i:i+chunk_size]
-        chunk_data = {"video_id": video_id, "replies": chunk}
-        success = await send_webhook_data(session, chunk_data, i // chunk_size + 1)
-        if not success:
-            logging.error(f"데이터 전송 실패: {i // chunk_size + 1} 번째 청크")
 if __name__ == "__main__":
     discord_client = MyClient(intents=intents)
-    discord_client.run(os.getenv('DISCORD_TOKEN'))

 import asyncio
 import subprocess
 import aiohttp
+import time
 from huggingface_hub import InferenceClient
 from googleapiclient.discovery import build
+from youtube_transcript_api import YouTubeTranscriptApi, TranscriptsDisabled, NoTranscriptFound
 from youtube_transcript_api.formatters import TextFormatter
 from dotenv import load_dotenv
 # 추론 API 클라이언트 설정
 hf_client = InferenceClient("CohereForAI/c4ai-command-r-plus-08-2024", token=os.getenv("HF_TOKEN"))
 # YouTube API 설정
 API_KEY = os.getenv("YOUTUBE_API_KEY")
 # 특정 채널 ID
 SPECIFIC_CHANNEL_ID = int(os.getenv("DISCORD_CHANNEL_ID"))
 # 전송 실패 시 재시도 횟수
 MAX_RETRIES = 3
     logging.debug(f'추출된 비디오 ID: {video_id}')
     return video_id
+async def get_best_available_transcript(video_id, max_retries=3, delay=5):
+    """Fetch a transcript for a YouTube video and return it as plain text.
+
+    Each round tries the Korean transcript, then the English one, then the
+    first transcript the library lists for the video. A round that fails
+    completely is retried after ``delay`` seconds, for at most
+    ``max_retries`` rounds in total.
+
+    Args:
+        video_id: ID of the YouTube video.
+        max_retries: Maximum number of rounds to attempt.
+        delay: Seconds to wait between failed rounds.
+
+    Returns:
+        The transcript formatted with ``TextFormatter``, or ``None`` when
+        every round failed (or ``max_retries`` is 0).
+    """
+    def fetch_transcript():
+        # Blocking HTTP calls; executed in a worker thread by the caller below.
+        for language, label in (('ko', '한국어'), ('en', '영어')):
+            try:
+                return YouTubeTranscriptApi.get_transcript(video_id, languages=[language])
+            except Exception as e:
+                logging.warning(f'{label} 자막 가져오기 오류: {e}')
+        # find_manually_created_transcript() requires a list of language codes;
+        # calling it with no arguments always raised TypeError, so this fallback
+        # never worked. Take the first transcript the listing yields instead.
+        for candidate in YouTubeTranscriptApi.list_transcripts(video_id):
+            return candidate.fetch()
+        raise LookupError('사용 가능한 자막이 없습니다')
+
+    loop = asyncio.get_event_loop()
+    for attempt in range(max_retries):
+        try:
+            # Run the synchronous requests off the event loop so the bot stays
+            # responsive while the transcript downloads.
+            transcript = await loop.run_in_executor(None, fetch_transcript)
+        except Exception as e:
+            if attempt < max_retries - 1:
+                logging.error(f'대체 자막 가져오기 오류: {e}')
+                await asyncio.sleep(delay)
+                continue
+            logging.error(f'모든 자막 가져오기 시도 실패: {e}')
+            return None
+        transcript_text = TextFormatter().format_transcript(transcript)
+        logging.debug(f'가져온 자막: {transcript_text}')
+        return transcript_text
+    return None
 async def get_video_comments(video_id):
     comments = []
     replies = []
     for comment, _ in comments:
         messages = [
+            {"role": "system", "content": f"""너의 이름은 OpenFreeAI이다. 답글 생성후 가장 마지막에 너의 이름을 밝히고 공손하게 인사하라. 비디오 자막: {transcript}"""},
             {"role": "user", "content": comment}
         ]
         loop = asyncio.get_event_loop()
     logging.debug(f'생성된 답글: {replies}')
     return replies
 async def create_thread_and_send_replies(message, video_id, comments, replies, session):
     thread = await message.channel.create_thread(name=f"{message.author.name}의 댓글 답글", message=message)
     for (comment, comment_id), reply in zip(comments, replies):
         embed = discord.Embed(description=f"**댓글**: {comment}\n**답글**: {reply}")
         await thread.send(embed=embed)
 if __name__ == "__main__":
     discord_client = MyClient(intents=intents)
+    discord_client.run(os.getenv('DISCORD_TOKEN'))