Spaces:
Building
Building
Update stt/stt_deepgram.py
Browse files - stt/stt_deepgram.py (+15 -1)
stt/stt_deepgram.py
CHANGED
@@ -32,21 +32,35 @@ class DeepgramSTT(STTInterface):
|
|
32 |
"""Map language codes to Deepgram format"""
|
33 |
# Deepgram uses different language codes
|
34 |
language_map = {
|
|
|
35 |
"tr-TR": "tr",
|
|
|
36 |
"en-US": "en-US",
|
37 |
"en-GB": "en-GB",
|
|
|
38 |
"de-DE": "de",
|
|
|
39 |
"fr-FR": "fr",
|
|
|
40 |
"es-ES": "es",
|
|
|
41 |
"it-IT": "it",
|
|
|
42 |
"pt-BR": "pt-BR",
|
|
|
43 |
"ru-RU": "ru",
|
|
|
44 |
"ja-JP": "ja",
|
|
|
45 |
"ko-KR": "ko",
|
|
|
46 |
"zh-CN": "zh-CN",
|
|
|
47 |
"ar-SA": "ar",
|
48 |
}
|
49 |
-
|
|
|
|
|
50 |
|
51 |
async def transcribe(self, audio_data: bytes, config: STTConfig) -> Optional[TranscriptionResult]:
|
52 |
"""Transcribe audio data using Deepgram API"""
|
|
|
32 |
"""Map language codes to Deepgram format"""
|
33 |
# Deepgram uses different language codes
|
34 |
language_map = {
|
35 |
+
"tr": "tr",
|
36 |
"tr-TR": "tr",
|
37 |
+
"en": "en-US",
|
38 |
"en-US": "en-US",
|
39 |
"en-GB": "en-GB",
|
40 |
+
"de": "de",
|
41 |
"de-DE": "de",
|
42 |
+
"fr": "fr",
|
43 |
"fr-FR": "fr",
|
44 |
+
"es": "es",
|
45 |
"es-ES": "es",
|
46 |
+
"it": "it",
|
47 |
"it-IT": "it",
|
48 |
+
"pt": "pt-BR",
|
49 |
"pt-BR": "pt-BR",
|
50 |
+
"ru": "ru",
|
51 |
"ru-RU": "ru",
|
52 |
+
"ja": "ja",
|
53 |
"ja-JP": "ja",
|
54 |
+
"ko": "ko",
|
55 |
"ko-KR": "ko",
|
56 |
+
"zh": "zh-CN",
|
57 |
"zh-CN": "zh-CN",
|
58 |
+
"ar": "ar",
|
59 |
"ar-SA": "ar",
|
60 |
}
|
61 |
+
|
62 |
+
# Default to the language itself if not in map
|
63 |
+
return language_map.get(language, language)
|
64 |
|
65 |
async def transcribe(self, audio_data: bytes, config: STTConfig) -> Optional[TranscriptionResult]:
|
66 |
"""Transcribe audio data using Deepgram API"""
|