Spaces:

Athspi
/

Ai-audio

Running

Athspi committed on Jan 11

Commit

49d93f9

verified ·

1 Parent(s): d93d8a9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,39 +1,25 @@
-# Install required libraries
-# Uncomment the line below if you are running locally to install dependencies
-# !pip install gradio openai-whisper
 import gradio as gr
-import whisper
-# Load Whisper model
-model = whisper.load_model("large")
-# Define transcription function
-def transcribe_audio(audio):
-    """
-    Transcribes the uploaded audio file into text.
-    """
-    try:
-        # Transcribe the audio
-        result = model.transcribe(audio)
-        transcription = result["text"]
-        return transcription
-    except Exception as e:
-        return f"Error transcribing audio: {str(e)}"
-# Gradio Interface
-interface = gr.Interface(
     fn=transcribe_audio,
-    inputs=gr.Audio(type="filepath", label="Upload your audio file"),
-    outputs=gr.Textbox(label="Transcribed Text"),
-    title="AI Audio Transcriber",
-    description=(
-        "Upload an audio file, and this AI will transcribe the content into text. "
-        "Powered by OpenAI Whisper, it supports most languages."
-    ),
-    theme="compact"
 )
-# Launch the interface
-if __name__ == "__main__":
-    interface.launch(share=True)

 import gradio as gr
+from transformers import pipeline
+# Load the Whisper model for speech recognition
+model = pipeline("automatic-speech-recognition", model="openai/whisper-medium")
+def transcribe_audio(audio_file, language="english"):
+    # Transcribe the audio file
+    transcription = model(audio_file, generate_kwargs={"language": language})
+    return transcription["text"]
+# Define the Gradio interface
+iface = gr.Interface(
     fn=transcribe_audio,
+    inputs=[
+        gr.Audio(type="filepath", label="Upload Audio File"),
+        gr.Dropdown(choices=["english", "spanish", "french", "german", "chinese", "japanese", "korean", "hindi"], label="Select Language", value="english")
+    ],
+    outputs=gr.Textbox(label="Transcription"),
+    title="Multi-Language Audio Transcription",
+    description="Upload an audio file and select the language to transcribe it."
 )
+# Launch the Gradio interface
+iface.launch()