kai-ytb-private-reply

Build error

App Files Files Community

seawolf2357 committed on Jun 26, 2024

Commit

3cbcff7

verified ·

1 Parent(s): 829fd20

Update app.py

Browse files

Files changed (1) hide show

app.py +70 -19

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ import os
 import re
 import asyncio
 import subprocess
 from huggingface_hub import InferenceClient
 from googleapiclient.discovery import build
 from youtube_transcript_api import YouTubeTranscriptApi
@@ -33,17 +34,27 @@ youtube_service = build('youtube', 'v3', developerKey=API_KEY)
 # 특정 채널 ID
 SPECIFIC_CHANNEL_ID = int(os.getenv("DISCORD_CHANNEL_ID"))
 class MyClient(discord.Client):
     def __init__(self, *args, **kwargs):
         super().__init__(*args, **kwargs)
         self.is_processing = False
     async def on_ready(self):
         logging.info(f'{self.user}로 로그인되었습니다!')
         # web.py 파일 실행
         subprocess.Popen(["python", "web.py"])
-        logging.info("Web.py server has been started.")
         # 봇이 시작될 때 안내 메시지를 전송
         channel = self.get_channel(SPECIFIC_CHANNEL_ID)
@@ -65,7 +76,7 @@ class MyClient(discord.Client):
                 comments = await get_video_comments(video_id)
                 if comments and transcript:
                     replies = await generate_replies(comments, transcript)
-                    await create_thread_and_send_replies(message, video_id, comments, replies)
                 else:
                     await message.channel.send("자막이나 댓글을 가져올 수 없습니다.")
             else:
@@ -78,6 +89,12 @@ class MyClient(discord.Client):
             isinstance(message.channel, discord.Thread) and message.channel.parent_id == SPECIFIC_CHANNEL_ID
         )
 def extract_video_id(url):
     video_id = None
     youtube_regex = (
@@ -88,28 +105,28 @@ def extract_video_id(url):
     match = re.match(youtube_regex, url)
     if match:
         video_id = match.group(6)
-    logging.debug(f'Extracted video ID: {video_id}')
     return video_id
 async def get_best_available_transcript(video_id):
     try:
         transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['ko'])
     except Exception as e:
-        logging.warning(f'Error fetching Korean transcript: {e}')
         try:
             transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['en'])
         except Exception as e:
-            logging.warning(f'Error fetching English transcript: {e}')
             try:
                 transcripts = YouTubeTranscriptApi.list_transcripts(video_id)
                 transcript = transcripts.find_manually_created_transcript().fetch()
             except Exception as e:
-                logging.error(f'Error fetching alternative transcript: {e}')
                 return None
     formatter = TextFormatter()
     transcript_text = formatter.format_transcript(transcript)
-    logging.debug(f'Fetched transcript: {transcript_text}')
     return transcript_text
 async def get_video_comments(video_id):
@@ -125,7 +142,7 @@ async def get_video_comments(video_id):
         comment_id = item['snippet']['topLevelComment']['id']
         comments.append((comment, comment_id))
-    logging.debug(f'Fetched comments: {comments}')
     return comments
 async def generate_replies(comments, transcript):
@@ -135,25 +152,59 @@ async def generate_replies(comments, transcript):
             {"role": "system", "content": f"비디오 자막: {transcript}"},
             {"role": "user", "content": comment}
         ]
-        loop = asyncio.get_event_loop()
-        response = await loop.run_in_executor(None, lambda: hf_client.chat_completion(
-            messages, max_tokens=400, temperature=0.7, top_p=0.85))
-        if response.choices and response.choices[0].message:
-            reply = response.choices[0].message['content'].strip()
-        else:
-            reply = "답글을 생성할 수 없습니다."
         replies.append(reply)
-    logging.debug(f'Generated replies: {replies}')
     return replies
-async def create_thread_and_send_replies(message, video_id, comments, replies):
     thread = await message.channel.create_thread(name=f"{message.author.name}의 댓글 답글", message=message)
-    for (comment, _), reply in zip(comments, replies):
         embed = discord.Embed(description=f"**댓글**: {comment}\n**답글**: {reply}")
         await thread.send(embed=embed)
 if __name__ == "__main__":
     discord_client = MyClient(intents=intents)
     discord_client.run(os.getenv('DISCORD_TOKEN'))

 import re
 import asyncio
 import subprocess
+import aiohttp
 from huggingface_hub import InferenceClient
 from googleapiclient.discovery import build
 from youtube_transcript_api import YouTubeTranscriptApi
 # 특정 채널 ID
 SPECIFIC_CHANNEL_ID = int(os.getenv("DISCORD_CHANNEL_ID"))
# Webhook endpoint that receives the generated replies.
# It can be overridden with the WEBHOOK_URL environment variable so the
# endpoint does not have to live in source control; the literal below is kept
# only as a backward-compatible fallback.
# NOTE(review): this URL acts as a credential - consider rotating it and
# supplying it through the environment only.
WEBHOOK_URL = os.getenv("WEBHOOK_URL") or (
    "https://connect.pabbly.com/workflow/sendwebhookdata/"
    "IjU3NjUwNTY1MDYzMjA0MzA1MjY4NTUzMDUxMzUi_pc"
)
# Number of delivery attempts made for one webhook payload before giving up.
MAX_RETRIES = 3
 class MyClient(discord.Client):
     def __init__(self, *args, **kwargs):
         super().__init__(*args, **kwargs)
         self.is_processing = False
+        self.session = None
     async def on_ready(self):
         logging.info(f'{self.user}로 로그인되었습니다!')
         # web.py 파일 실행
         subprocess.Popen(["python", "web.py"])
+        logging.info("Web.py 서버가 시작되었습니다.")
+        # aiohttp 클라이언트 세션 생성
+        self.session = aiohttp.ClientSession()
         # 봇이 시작될 때 안내 메시지를 전송
         channel = self.get_channel(SPECIFIC_CHANNEL_ID)
                 comments = await get_video_comments(video_id)
                 if comments and transcript:
                     replies = await generate_replies(comments, transcript)
+                    await create_thread_and_send_replies(message, video_id, comments, replies, self.session)
                 else:
                     await message.channel.send("자막이나 댓글을 가져올 수 없습니다.")
             else:
             isinstance(message.channel, discord.Thread) and message.channel.parent_id == SPECIFIC_CHANNEL_ID
         )
+    async def close(self):
+        # aiohttp 클라이언트 세션 종료
+        if self.session:
+            await self.session.close()
+        await super().close()
 def extract_video_id(url):
     video_id = None
     youtube_regex = (
     match = re.match(youtube_regex, url)
     if match:
         video_id = match.group(6)
+    logging.debug(f'추출된 비디오 ID: {video_id}')
     return video_id
 async def get_best_available_transcript(video_id):
     """Return the transcript of a video as plain text, or None if unavailable.

     Korean is tried first, then English, and finally the first transcript
     that YouTube lists for the video in any language.

     Args:
         video_id: YouTube video ID to fetch the transcript for.

     Returns:
         The transcript rendered by ``TextFormatter``, or ``None`` when no
         transcript could be fetched.
     """
     # NOTE(review): the transcript calls below are not awaited, so they
     # presumably block the event loop while they run - confirm.
     # Preferred languages in priority order, each paired with the warning
     # that is logged when that language cannot be fetched.
     preferred = (
         (['ko'], '한국어 자막 가져오기 오류'),
         (['en'], '영어 자막 가져오기 오류'),
     )
     transcript = None
     for languages, failure_message in preferred:
         try:
             transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=languages)
             break
         except Exception as e:
             logging.warning(f'{failure_message}: {e}')
     if transcript is None:
         try:
             available = YouTubeTranscriptApi.list_transcripts(video_id)
             # find_manually_created_transcript() needs a list of language
             # codes, so calling it without arguments always raised and this
             # fallback could never succeed. Take the first listed transcript
             # instead; an empty listing raises and is reported below.
             transcript = next(iter(available)).fetch()
         except Exception as e:
             logging.error(f'대체 자막 가져오기 오류: {e}')
             return None
     formatter = TextFormatter()
     transcript_text = formatter.format_transcript(transcript)
     logging.debug(f'가져온 자막: {transcript_text}')
     return transcript_text
 async def get_video_comments(video_id):
         comment_id = item['snippet']['topLevelComment']['id']
         comments.append((comment, comment_id))
+    logging.debug(f'가져온 댓글: {comments}')
     return comments
 async def generate_replies(comments, transcript):
             {"role": "system", "content": f"비디오 자막: {transcript}"},
             {"role": "user", "content": comment}
         ]
+        try:
+            loop = asyncio.get_event_loop()
+            response = await loop.run_in_executor(None, lambda: hf_client.chat_completion(
+                messages, max_tokens=250, temperature=0.7, top_p=0.85))
+            if response.choices and response.choices[0].message:
+                reply = response.choices[0].message['content'].strip()
+            else:
+                reply = "답글을 생성할 수 없습니다."
+        except Exception as e:
+            logging.error(f"API 호출 중 오류 발생: {e}")
+            reply = "서버 오류로 인해 답글을 생성할 수 없습니다."
         replies.append(reply)
+    logging.debug(f'생성된 답글: {replies}')
     return replies
async def send_webhook_data(session, chunk_data, chunk_number):
    """POST one chunk of reply data to the webhook, retrying on failure.

    Args:
        session: HTTP client session used for the POST (its ``post`` is used
            as an async context manager).
        chunk_data: JSON-serializable payload to send.
        chunk_number: 1-based index of the chunk, used only in log messages.

    Returns:
        True as soon as the webhook answers with HTTP 200, False once
        ``MAX_RETRIES`` attempts have failed.
    """
    for attempt in range(1, MAX_RETRIES + 1):
        try:
            async with session.post(WEBHOOK_URL, json=chunk_data) as resp:
                if resp.status == 200:
                    logging.info(
                        f"웹훅으로 데이터 전송 성공: {chunk_number} 번째 청크, {attempt} 번째 시도"
                    )
                    return True
                logging.error(
                    f"웹훅으로 데이터 전송 실패: {resp.status}, "
                    f"{chunk_number} 번째 청크, {attempt} 번째 시도"
                )
        except (aiohttp.ClientError, asyncio.TimeoutError) as e:
            # Timeouts are retried too; they surface as asyncio.TimeoutError
            # and are not guaranteed to be aiohttp.ClientError subclasses.
            logging.error(
                f"웹훅 전송 중 오류 발생: {e}, {chunk_number} 번째 청크, {attempt} 번째 시도"
            )
        # Pause before the next attempt, but not after the last one.
        if attempt < MAX_RETRIES:
            await asyncio.sleep(1)
    return False
async def create_thread_and_send_replies(message, video_id, comments, replies, session):
    """Post each comment/reply pair to a new thread and forward it to the webhook.

    A thread is created on ``message``; every pair is sent there as an embed.
    Afterwards each pair is delivered to the webhook in its own request via
    ``send_webhook_data``; a failed delivery is logged and the next one is
    still attempted.

    Args:
        message: Discord message the thread is attached to.
        video_id: YouTube video ID included in every webhook payload.
        comments: Sequence of ``(comment_text, comment_id)`` tuples.
        replies: Generated replies, paired with ``comments`` by position.
        session: HTTP client session passed through to ``send_webhook_data``.
    """
    # Discord rejects embeds whose description exceeds this many characters.
    max_description_length = 4096

    thread = await message.channel.create_thread(name=f"{message.author.name}의 댓글 답글", message=message)
    reply_records = []
    for (comment, comment_id), reply in zip(comments, replies):
        description = f"**댓글**: {comment}\n**답글**: {reply}"
        # Truncate so one over-long comment cannot make the send fail and
        # abort the remaining replies and the webhook delivery.
        embed = discord.Embed(description=description[:max_description_length])
        await thread.send(embed=embed)
        # The webhook receives the untruncated texts plus the comment id.
        reply_records.append({"comment": comment, "reply": reply, "comment_id": comment_id})

    # Each record is sent in a separate request (chunk size of 1).
    chunk_size = 1
    for start in range(0, len(reply_records), chunk_size):
        chunk_number = start // chunk_size + 1
        chunk_data = {"video_id": video_id, "replies": reply_records[start:start + chunk_size]}
        success = await send_webhook_data(session, chunk_data, chunk_number)
        if not success:
            logging.error(f"데이터 전송 실패: {chunk_number} 번째 청크")
 # Script entry point: create the Discord client with the `intents` object
 # defined elsewhere in this file and run it with the bot token read from the
 # DISCORD_TOKEN environment variable.
 if __name__ == "__main__":
     discord_client = MyClient(intents=intents)
     discord_client.run(os.getenv('DISCORD_TOKEN'))