Spaces:
Paused
Paused
Update stt/stt_deepgram.py
Browse files
- stt/stt_deepgram.py +15 -1
stt/stt_deepgram.py
CHANGED
|
@@ -32,21 +32,35 @@ class DeepgramSTT(STTInterface):
|
|
| 32 |
"""Map language codes to Deepgram format"""
|
| 33 |
# Deepgram uses different language codes
|
| 34 |
language_map = {
|
|
|
|
| 35 |
"tr-TR": "tr",
|
|
|
|
| 36 |
"en-US": "en-US",
|
| 37 |
"en-GB": "en-GB",
|
|
|
|
| 38 |
"de-DE": "de",
|
|
|
|
| 39 |
"fr-FR": "fr",
|
|
|
|
| 40 |
"es-ES": "es",
|
|
|
|
| 41 |
"it-IT": "it",
|
|
|
|
| 42 |
"pt-BR": "pt-BR",
|
|
|
|
| 43 |
"ru-RU": "ru",
|
|
|
|
| 44 |
"ja-JP": "ja",
|
|
|
|
| 45 |
"ko-KR": "ko",
|
|
|
|
| 46 |
"zh-CN": "zh-CN",
|
|
|
|
| 47 |
"ar-SA": "ar",
|
| 48 |
}
|
| 49 |
-
|
|
|
|
|
|
|
| 50 |
|
| 51 |
async def transcribe(self, audio_data: bytes, config: STTConfig) -> Optional[TranscriptionResult]:
|
| 52 |
"""Transcribe audio data using Deepgram API"""
|
|
|
|
| 32 |
"""Map language codes to Deepgram format"""
|
| 33 |
# Deepgram uses different language codes
|
| 34 |
language_map = {
|
| 35 |
+
"tr": "tr",
|
| 36 |
"tr-TR": "tr",
|
| 37 |
+
"en": "en-US",
|
| 38 |
"en-US": "en-US",
|
| 39 |
"en-GB": "en-GB",
|
| 40 |
+
"de": "de",
|
| 41 |
"de-DE": "de",
|
| 42 |
+
"fr": "fr",
|
| 43 |
"fr-FR": "fr",
|
| 44 |
+
"es": "es",
|
| 45 |
"es-ES": "es",
|
| 46 |
+
"it": "it",
|
| 47 |
"it-IT": "it",
|
| 48 |
+
"pt": "pt-BR",
|
| 49 |
"pt-BR": "pt-BR",
|
| 50 |
+
"ru": "ru",
|
| 51 |
"ru-RU": "ru",
|
| 52 |
+
"ja": "ja",
|
| 53 |
"ja-JP": "ja",
|
| 54 |
+
"ko": "ko",
|
| 55 |
"ko-KR": "ko",
|
| 56 |
+
"zh": "zh-CN",
|
| 57 |
"zh-CN": "zh-CN",
|
| 58 |
+
"ar": "ar",
|
| 59 |
"ar-SA": "ar",
|
| 60 |
}
|
| 61 |
+
|
| 62 |
+
# Default to the language itself if not in map
|
| 63 |
+
return language_map.get(language, language)
|
| 64 |
|
| 65 |
async def transcribe(self, audio_data: bytes, config: STTConfig) -> Optional[TranscriptionResult]:
|
| 66 |
"""Transcribe audio data using Deepgram API"""
|