AGAZO_Final_Assignment

Sleeping

agazo committed on Jun 5

Commit

e83c110

verified ·

1 Parent(s): ecf342c

Update audio_to_text_tool.py

Files changed (1) hide show

audio_to_text_tool.py CHANGED Viewed

@@ -64,19 +64,17 @@ def audio_to_text_from_youtube(youtube_url: str) -> str:
     """
     try:
         with tempfile.TemporaryDirectory() as tmpdir:
-            audio_output_path = os.path.join(tmpdir, "audio.mp3")
             BASE_DIR = os.path.dirname(os.path.abspath(__file__))
             cookies_path = os.path.join(BASE_DIR, 'files', 'cookies.txt')
-            plain_txt_file = get_text_file_contents(cookies_path)
-            print('cookies: \n' + plain_txt_file)
-            # Download best audio using yt-dlp
             ydl_opts = {
                 "format": "bestaudio/best",
-                "outtmpl": audio_output_path,
                 "quiet": True,
                 "cookiefile": cookies_path,
                 "postprocessors": [{
@@ -89,6 +87,10 @@ def audio_to_text_from_youtube(youtube_url: str) -> str:
             with yt_dlp.YoutubeDL(ydl_opts) as ydl:
                 ydl.download([youtube_url])
             # Transcribe with OpenAI Whisper
             with open(audio_output_path, "rb") as audio_file:
                 transcript = client.audio.transcriptions.create(

     """
     try:
         with tempfile.TemporaryDirectory() as tmpdir:
+            audio_stem = os.path.join(tmpdir, "audio")
+            audio_output_path = audio_stem + ".mp3"
             BASE_DIR = os.path.dirname(os.path.abspath(__file__))
             cookies_path = os.path.join(BASE_DIR, 'files', 'cookies.txt')
+            print('cookies: \n' + get_text_file_contents(cookies_path))
             ydl_opts = {
                 "format": "bestaudio/best",
+                "outtmpl": audio_stem,
                 "quiet": True,
                 "cookiefile": cookies_path,
                 "postprocessors": [{
             with yt_dlp.YoutubeDL(ydl_opts) as ydl:
                 ydl.download([youtube_url])
+            # Ensure file exists
+            if not os.path.exists(audio_output_path):
+                raise FileNotFoundError(f"Audio file not created: {audio_output_path}")
             # Transcribe with OpenAI Whisper
             with open(audio_output_path, "rb") as audio_file:
                 transcript = client.audio.transcriptions.create(