Spaces:
Building
Building
Update stt/stt_google.py
Browse files- stt/stt_google.py +17 -6
stt/stt_google.py
CHANGED
@@ -361,12 +361,23 @@ class GoogleCloudSTT(STTInterface):
|
|
361 |
sample_rate_hertz=stt_config.sample_rate,
|
362 |
language_code=stt_config.language,
|
363 |
enable_automatic_punctuation=stt_config.enable_punctuation,
|
364 |
-
model=
|
365 |
-
use_enhanced=
|
366 |
-
|
367 |
-
#
|
368 |
-
|
369 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
370 |
|
371 |
self.streaming_config = speech.StreamingRecognitionConfig(
|
372 |
config=recognition_config,
|
|
|
361 |
sample_rate_hertz=stt_config.sample_rate,
|
362 |
language_code=stt_config.language,
|
363 |
enable_automatic_punctuation=stt_config.enable_punctuation,
|
364 |
+
model=config.model,
|
365 |
+
use_enhanced=config.use_enhanced,
|
366 |
+
max_alternatives=1,
|
367 |
+
# Metadata for better recognition
|
368 |
+
metadata=speech.RecognitionMetadata(
|
369 |
+
interaction_type=speech.RecognitionMetadata.InteractionType.VOICE_SEARCH,
|
370 |
+
microphone_distance=speech.RecognitionMetadata.MicrophoneDistance.NEARFIELD,
|
371 |
+
recording_device_type=speech.RecognitionMetadata.RecordingDeviceType.PC,
|
372 |
+
)
|
373 |
+
),
|
374 |
+
interim_results=config.interim_results, # ✅ Bu zaten True
|
375 |
+
single_utterance=config.single_utterance, # ✅ Bu False
|
376 |
+
enable_voice_activity_events=True, # ✅ VAD events'leri de açalım
|
377 |
+
|
378 |
+
log_info(f"📋 Streaming config created: interim_results={config.interim_results}, "
|
379 |
+
f"single_utterance={config.single_utterance}, "
|
380 |
+
f"VAD_events=True")
|
381 |
|
382 |
self.streaming_config = speech.StreamingRecognitionConfig(
|
383 |
config=recognition_config,
|