Athspi committed on
Commit
3b2b2f2
·
verified ·
1 Parent(s): 8ff4639

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -5
app.py CHANGED
@@ -23,20 +23,25 @@ def transcribe_audio(audio_file):
23
 
24
  # Transcribe each chunk and collect results
25
  transcriptions = []
26
- detected_languages = set()
27
 
28
  for chunk in chunks:
29
  # Enable language detection and transcription
30
- result = model(chunk, return_timestamps=False, generate_kwargs={"task": "transcribe"})
31
  transcriptions.append(result["text"])
32
- detected_languages.add(result.get("language", "unknown")) # Extract detected language
 
 
 
 
33
  os.remove(chunk) # Clean up chunk files
34
 
35
  # Combine all transcriptions into one
36
  full_transcription = " ".join(transcriptions)
37
 
38
- # Get the detected language (use the first detected language if multiple are found)
39
- detected_language = detected_languages.pop() if detected_languages else "unknown"
 
40
 
41
  # Return transcription and detected language
42
  return f"Detected Language: {detected_language}\n\nTranscription:\n{full_transcription}"
 
23
 
24
  # Transcribe each chunk and collect results
25
  transcriptions = []
26
+ detected_language = None
27
 
28
  for chunk in chunks:
29
  # Enable language detection and transcription
30
+ result = model(chunk, generate_kwargs={"task": "transcribe", "language": None}) # Let Whisper detect language
31
  transcriptions.append(result["text"])
32
+
33
+ # Extract detected language from the result (if available)
34
+ if "language" in result:
35
+ detected_language = result["language"]
36
+
37
  os.remove(chunk) # Clean up chunk files
38
 
39
  # Combine all transcriptions into one
40
  full_transcription = " ".join(transcriptions)
41
 
42
+ # If no language was detected, set a default message
43
+ if detected_language is None:
44
+ detected_language = "unknown (language not detected)"
45
 
46
  # Return transcription and detected language
47
  return f"Detected Language: {detected_language}\n\nTranscription:\n{full_transcription}"