Spaces:

Gigaverse
/

ivrit-ai-streaming

Sleeping

App Files Community

AshDavid12 committed on Sep 10, 2024

Commit

6465ad1

1 Parent(s): 860f8a3

hf home change

Browse files

Files changed (2) hide show

infer.py +22 -24
requirements.txt +2 -0

infer.py CHANGED Viewed

@@ -1,8 +1,10 @@
 import torch
 from transformers import WhisperProcessor, WhisperForConditionalGeneration
 import soundfile as sf
-from fastapi import FastAPI, File, UploadFile
 import uvicorn
 import os
 from datetime import datetime
@@ -30,33 +32,36 @@ model.to(device)
 print(f"Model is using device: {device}")
-@app.post("/transcribe/")
-async def transcribe_audio(file: UploadFile = File(...)):
-    # Print file upload start
-    print(f"Received audio file: {file.filename}")
-    # Save the uploaded file
-    file_location = f"temp_{file.filename}"
     try:
-        with open(file_location, "wb+") as f:
-            f.write(await file.read())
-        print(f"File saved to: {file_location}")
     except Exception as e:
-        print(f"Error saving the file: {e}")
-        return {"error": f"Error saving the file: {e}"}
-    # Load the audio file and preprocess it
     try:
-        audio_input, _ = sf.read(file_location)
-        print(f"Audio file {file.filename} successfully read.")
         inputs = processor(audio_input, return_tensors="pt", sampling_rate=16000)
         print(f"Audio file preprocessed for transcription.")
     except Exception as e:
         print(f"Error processing the audio file: {e}")
         return {"error": f"Error processing the audio file: {e}"}
-    # Move inputs to the same device as the model
     inputs = {key: value.to(device) for key, value in inputs.items()}
     print("Inputs moved to the appropriate device.")
@@ -77,13 +82,6 @@ async def transcribe_audio(file: UploadFile = File(...)):
         print(f"Error decoding the transcription: {e}")
         return {"error": f"Error decoding the transcription: {e}"}
-    # Clean up the temporary file
-    try:
-        os.remove(file_location)
-        print(f"Temporary file {file_location} deleted.")
-    except Exception as e:
-        print(f"Error deleting the temporary file: {e}")
     return {"transcription": transcription}
 @app.get("/")

 import torch
 from transformers import WhisperProcessor, WhisperForConditionalGeneration
 import soundfile as sf
+from fastapi import FastAPI, File, UploadFile, Form
 import uvicorn
+import requests
+import io
 import os
 from datetime import datetime
 print(f"Model is using device: {device}")
+@app.post("/transcribe-url/")
+def transcribe_audio_url(audio_url: str = Form(...)):
+    # Download the audio file from the provided URL
     try:
+        response = requests.get(audio_url)
+        if response.status_code != 200:
+            return {"error": f"Failed to download audio from URL. Status code: {response.status_code}"}
+        print(f"Successfully downloaded audio from URL: {audio_url}")
+        audio_data = io.BytesIO(response.content)  # Store audio data in memory
     except Exception as e:
+        print(f"Error downloading the audio file: {e}")
+        return {"error": f"Error downloading the audio file: {e}"}
+    # Process the audio
     try:
+        audio_input, _ = sf.read(audio_data)  # Read the audio from the in-memory BytesIO
+        print(f"Audio file from URL successfully read.")
+    except Exception as e:
+        print(f"Error reading the audio file: {e}")
+        return {"error": f"Error reading the audio file: {e}"}
+    # Preprocess the audio for Whisper
+    try:
         inputs = processor(audio_input, return_tensors="pt", sampling_rate=16000)
         print(f"Audio file preprocessed for transcription.")
     except Exception as e:
         print(f"Error processing the audio file: {e}")
         return {"error": f"Error processing the audio file: {e}"}
+    # Move inputs to the appropriate device
     inputs = {key: value.to(device) for key, value in inputs.items()}
     print("Inputs moved to the appropriate device.")
         print(f"Error decoding the transcription: {e}")
         return {"error": f"Error decoding the transcription: {e}"}
     return {"transcription": transcription}
 @app.get("/")

requirements.txt CHANGED Viewed

@@ -3,5 +3,7 @@ uvicorn
 torch
 whisper
 python-multipart
 transformers
 soundfile

 torch
 whisper
 python-multipart
+requests
+io
 transformers
 soundfile