gaia-agent

Running

App Files Files Community

Daniel Amendoeira committed 21 days ago

Commit

77866f8

verified ·

1 Parent(s): ffff64a

Update tools.py

Browse files

Files changed (1) hide show

tools.py +51 -1

tools.py CHANGED Viewed

@@ -1,5 +1,10 @@
 from langchain.tools import Tool
 import datetime
 def current_date(_):
     """Return today's date (local clock) as a YYYY-MM-DD string; the argument is ignored."""
     today = datetime.datetime.now()
     return today.strftime("%Y-%m-%d")
@@ -33,4 +38,49 @@ datetime_tools = [
         func=days_until,
         description="Returns the number of days from today until a given date (input format: YYYY-MM-DD)."
     )
-]

 from langchain.tools import Tool
 import datetime
+import requests
+import openai
+import os
+import tempfile
+from urllib.parse import urlparse
 def current_date(_):
     """Return today's date (local clock) as a YYYY-MM-DD string; the argument is ignored."""
     today = datetime.datetime.now()
     return today.strftime("%Y-%m-%d")
         func=days_until,
         description="Returns the number of days from today until a given date (input format: YYYY-MM-DD)."
     )
+]
def transcribe_audio(audio_input: str) -> str:
    """
    Transcribe an audio file given as a local path or an http(s) URL.

    A URL is downloaded to a temporary file first (keeping the extension found
    in the URL path, or ".mp3" when the path has none). That temporary file is
    removed again once transcription has finished or failed.

    Args:
        audio_input (str): A local file path or a direct URL to the audio file (.mp3, .m4a, etc.)

    Returns:
        str: The transcribed text, or a message starting with
        "Transcription failed:" if any step raised an exception.
    """
    downloaded_path = None  # set only when this call created a temp file it must delete
    try:
        if audio_input.startswith(("http://", "https://")):
            # Take the extension from the URL path only, so a query string
            # does not end up in the suffix; default to .mp3 when absent.
            ext = os.path.splitext(urlparse(audio_input).path)[1] or ".mp3"
            # Download before creating the temp file so a failed request
            # leaves nothing behind; the timeout keeps a dead server from
            # blocking the agent forever.
            response = requests.get(audio_input, timeout=60)
            response.raise_for_status()
            with tempfile.NamedTemporaryFile(suffix=ext, delete=False) as tmp_file:
                downloaded_path = tmp_file.name
                tmp_file.write(response.content)
            file_path = downloaded_path
        else:
            file_path = audio_input

        # Open the audio first so a bad path is reported directly, without
        # building an API client that would never be used.
        with open(file_path, "rb") as audio_file:
            client = openai.OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
            transcription = client.audio.transcriptions.create(
                model="whisper-1",
                file=audio_file,
            )
        return transcription.text
    except Exception as e:
        # Tool boundary: report the failure as text instead of raising into the agent.
        return f"Transcription failed: {e}"
    finally:
        if downloaded_path is not None:
            try:
                os.remove(downloaded_path)
            except OSError:
                pass  # best-effort cleanup; the result has already been decided
# LangChain tool wrapper that exposes transcribe_audio to the agent.
transcribe_audio_tool = Tool(
    name="transcribe_audio",
    description="Transcribes an audio file from a local file or a URL",
    func=transcribe_audio,
)