Spaces:
Building
Building
Update stt_google.py
Browse files
- stt_google.py +26 -9
stt_google.py
CHANGED
@@ -40,20 +40,37 @@ class GoogleCloudSTT(STTInterface):
|
|
40 |
async def start_streaming(self, config: STTConfig) -> None:
|
41 |
"""Initialize streaming session"""
|
42 |
try:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
43 |
recognition_config = speech.RecognitionConfig(
|
44 |
-
encoding=self._get_encoding(
|
45 |
-
sample_rate_hertz=
|
46 |
-
language_code=
|
47 |
-
enable_automatic_punctuation=
|
48 |
-
enable_word_time_offsets=
|
49 |
-
model=
|
50 |
-
use_enhanced=
|
51 |
)
|
52 |
|
53 |
self.streaming_config = speech.StreamingRecognitionConfig(
|
54 |
config=recognition_config,
|
55 |
-
interim_results=
|
56 |
-
single_utterance=
|
57 |
)
|
58 |
|
59 |
self.is_streaming = True
|
|
|
40 |
async def start_streaming(self, config: STTConfig) -> None:
|
41 |
"""Initialize streaming session"""
|
42 |
try:
|
43 |
+
# Config'in dict mi STTConfig objesi mi olduğunu kontrol et
|
44 |
+
if isinstance(config, dict):
|
45 |
+
# Dict ise STTConfig objesine çevir
|
46 |
+
stt_config = STTConfig(
|
47 |
+
language=config.get("language", "tr-TR"),
|
48 |
+
sample_rate=config.get("sample_rate", 16000),
|
49 |
+
encoding=config.get("encoding", "WEBM_OPUS"),
|
50 |
+
enable_punctuation=config.get("enable_punctuation", True),
|
51 |
+
enable_word_timestamps=config.get("enable_word_timestamps", False),
|
52 |
+
model=config.get("model", "latest_long"),
|
53 |
+
use_enhanced=config.get("use_enhanced", True),
|
54 |
+
interim_results=config.get("interim_results", True),
|
55 |
+
single_utterance=config.get("single_utterance", False)
|
56 |
+
)
|
57 |
+
else:
|
58 |
+
stt_config = config
|
59 |
+
|
60 |
recognition_config = speech.RecognitionConfig(
|
61 |
+
encoding=self._get_encoding(stt_config.encoding),
|
62 |
+
sample_rate_hertz=stt_config.sample_rate,
|
63 |
+
language_code=stt_config.language,
|
64 |
+
enable_automatic_punctuation=stt_config.enable_punctuation,
|
65 |
+
enable_word_time_offsets=stt_config.enable_word_timestamps,
|
66 |
+
model=stt_config.model,
|
67 |
+
use_enhanced=stt_config.use_enhanced
|
68 |
)
|
69 |
|
70 |
self.streaming_config = speech.StreamingRecognitionConfig(
|
71 |
config=recognition_config,
|
72 |
+
interim_results=stt_config.interim_results,
|
73 |
+
single_utterance=stt_config.single_utterance
|
74 |
)
|
75 |
|
76 |
self.is_streaming = True
|