Update app.py
app.py
CHANGED
@@ -21,25 +21,34 @@ def transcribe_audio(audio_file):
     # Split the audio into chunks
     chunks = split_audio(audio_file)
 
-    # Transcribe each chunk
+    # Transcribe each chunk and collect results
     transcriptions = []
+    detected_languages = set()
+
     for chunk in chunks:
-
+        # Enable language detection and transcription
+        result = model(chunk, return_timestamps=False, generate_kwargs={"task": "transcribe"})
         transcriptions.append(result["text"])
+        detected_languages.add(result.get("language", "unknown"))  # Extract detected language
         os.remove(chunk)  # Clean up chunk files
 
     # Combine all transcriptions into one
     full_transcription = " ".join(transcriptions)
-
+
+    # Get the detected language (use the first detected language if multiple are found)
+    detected_language = detected_languages.pop() if detected_languages else "unknown"
+
+    # Return transcription and detected language
+    return f"Detected Language: {detected_language}\n\nTranscription:\n{full_transcription}"
 
 # Define the Gradio interface
 iface = gr.Interface(
     fn=transcribe_audio,
     inputs=gr.Audio(type="filepath", label="Upload Audio File"),
-    outputs=gr.Textbox(label="Transcription"),
-    title="
-    description="Upload an audio file, and the system will automatically detect the language and transcribe it
+    outputs=gr.Textbox(label="Transcription and Detected Language"),
+    title="Audio Transcription with Automatic Language Detection",
+    description="Upload an audio file, and the system will automatically detect the language and transcribe it."
 )
 
 # Launch the Gradio interface
-iface.launch(
+iface.launch()
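For context, the hunk assumes that split_audio, model, os, and gr are defined earlier in app.py, which this diff does not show. A minimal sketch of that surrounding setup, assuming the transformers automatic-speech-recognition pipeline and pydub for chunking (the model checkpoint, chunk length, and helper signature below are illustrative assumptions, not taken from the Space):

import os
import gradio as gr
from pydub import AudioSegment     # assumption: pydub handles chunking
from transformers import pipeline  # assumption: a transformers ASR pipeline serves as `model`

# Illustrative model choice; the Space's actual checkpoint is not shown in this diff
model = pipeline("automatic-speech-recognition", model="openai/whisper-small")

def split_audio(audio_file, chunk_ms=30_000):
    # Split the input into ~30-second WAV chunks and return their file paths
    audio = AudioSegment.from_file(audio_file)
    paths = []
    for i, start in enumerate(range(0, len(audio), chunk_ms)):
        path = f"chunk_{i}.wav"
        audio[start:start + chunk_ms].export(path, format="wav")
        paths.append(path)
    return paths

Note that the stock transformers ASR pipeline typically returns only a "text" key, so the result.get("language", "unknown") fallback in the hunk would usually report "unknown" unless the pipeline is configured to surface the detected language.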