gaia-agent

Running

Daniel Amendoeira committed 23 days ago

Commit

104dc35

verified ·

1 Parent(s): 77866f8

Update tools.py

Files changed (1) hide show

tools.py CHANGED Viewed

@@ -5,6 +5,7 @@ import openai
 import os
 import tempfile
 from urllib.parse import urlparse
 def current_date(_):
     return datetime.datetime.now().strftime("%Y-%m-%d")
@@ -56,20 +57,20 @@ def transcribe_audio(audio_input: str) -> str:
         if is_url:
             parsed = urlparse(audio_input)  # breaks down the URL into components (scheme, netloc, path, params, etc.)
-            path_extracted = os.path.splitext(parsed.path)[1] or ".mp3"  # get the actual file extension from the URL path or define it to .mp3 if no extension is found
             # Download to temporary file
-            with tempfile.NamedTemporaryFile(suffix=ext, delete=False) as tmp_file:
-                response = requests.get(audio_input)
-                response.raise_for_status()
-                tmp_file.write(response.content)
                 file_path = tmp_file.name
         else:
             file_path = audio_input
-        # Transcribe using OpenAI Whisper
-        client = openai.OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
-        with open(file_path, "rb") as audio_file:
             transcription = client.audio.transcriptions.create(
                 model="whisper-1",
                 file=audio_file

 import os
 import tempfile
 from urllib.parse import urlparse
+from openai import OpenAI
 def current_date(_):
     return datetime.datetime.now().strftime("%Y-%m-%d")
         if is_url:
             parsed = urlparse(audio_input)  # breaks down the URL into components (scheme, netloc, path, params, etc.)
+            extension = os.path.splitext(parsed.path)[1] or ".mp3"  # get the actual file extension from the URL path or define it to .mp3 if no extension is found
             # Download to temporary file
+            with tempfile.NamedTemporaryFile(suffix=extension, delete=False) as tmp_file:  # creates a temporary file
+                response = requests.get(audio_input)  # downloads the content
+                response.raise_for_status()  # checks if the http request was successful
+                tmp_file.write(response.content)  # saves the file to disk
                 file_path = tmp_file.name
         else:
             file_path = audio_input
+        # Transcribing audio using OpenAI Whisper
+        client = OpenAI()
+        with open(file_path, "rb") as audio_file:  # opens the audio file from disk in binary mode (rb); the "with" block ensures the file is automatically closed afterward
             transcription = client.audio.transcriptions.create(
                 model="whisper-1",
                 file=audio_file