Spaces:

UcsTurkey
/

flare

Building

App Files Community

ciyidogan committed 11 days ago

Commit

bdc222a

verified ·

1 Parent(s): 48cbaf2

Update stt/stt_google.py

Browse files

Files changed (1) hide show

stt/stt_google.py +74 -65

stt/stt_google.py CHANGED Viewed

@@ -322,73 +322,81 @@ class GoogleCloudSTT(STTInterface):
     async def start_streaming(self, config: STTConfig) -> None:
         """Initialize streaming session with clean state"""
         try:
-            # Clean up any existing stream
-            if self.is_streaming or self.stream_thread:
-                log_warning("⚠️ Previous stream still active, stopping it first")
-                await self.stop_streaming()
-                await asyncio.sleep(0.5)
-            # Reset session
-            self._reset_session()
-            self.single_utterance = config.single_utterance
-            log_info(f"🎤 Starting Google STT streaming session #{self.session_id} with config: {config}")
-            # Create fresh queues
-            self._create_fresh_queues()
-            self.stop_event.clear()
-            self.should_stop = False
-            # Create new client
-            self.client = speech.SpeechClient()
-            log_info("✅ Created new Google Speech client")
-            # Create recognition config
-            recognition_config = speech.RecognitionConfig(
-                encoding=speech.RecognitionConfig.AudioEncoding.WEBM_OPUS,
-                sample_rate_hertz=16000,
-                language_code="tr-TR",
-                enable_automatic_punctuation=True,
-                model="latest_long",
-                use_enhanced=True,
-                max_alternatives=1,
-                metadata=speech.RecognitionMetadata(
-                    interaction_type=speech.RecognitionMetadata.InteractionType.VOICE_SEARCH,
-                    microphone_distance=speech.RecognitionMetadata.MicrophoneDistance.NEARFIELD,
-                    recording_device_type=speech.RecognitionMetadata.RecordingDeviceType.PC,
                 )
-            )
-            # Create streaming config with VAD
-            self.streaming_config = speech.StreamingRecognitionConfig(
-                config=recognition_config,
-                interim_results=True,
-                single_utterance=False,
-                enable_voice_activity_events=True  # ✅ VAD events enabled
-            )
-            self.is_streaming = True
-            self.stop_event.clear()
-            # Start streaming thread
-            self.stream_thread = threading.Thread(target=self._run_stream)
-            self.stream_thread.start()
-            log_info(f"📋 Streaming config created: interim_results={config.interim_results}, "
-                     f"single_utterance={config.single_utterance}, "
-                     f"VAD_events=True")
-            self.is_streaming = True
-            # Start streaming thread
-            self.stream_thread = threading.Thread(
-                target=self._run_stream,
-                name=f"GoogleSTT-Session-{self.session_id}"
-            )
-            self.stream_thread.daemon = True
-            self.stream_thread.start()
-            log_info(f"✅ Google STT streaming session #{self.session_id} started successfully")
         except Exception as e:
             log_error(f"❌ Failed to start Google STT streaming", error=str(e))
@@ -400,13 +408,14 @@ class GoogleCloudSTT(STTInterface):
     def _run_stream(self):
         """Run the streaming recognition loop in a separate thread"""
         try:
-            log_info(f"🎤 Google STT stream thread started - Single utterance mode: {self.single_utterance}")
             # Create request generator
             requests = self._request_generator()
             # Create streaming client
-            log_info("🎤 Creating Google STT streaming client...")
             # Get responses (no timeout parameter!)
             responses = self.client.streaming_recognize(self.streaming_config, requests)

     async def start_streaming(self, config: STTConfig) -> None:
         """Initialize streaming session with clean state"""
         try:
+            # Thread safety için lock kullan
+            async with asyncio.Lock():
+                # Clean up any existing stream
+                if self.is_streaming or self.stream_thread:
+                    log_warning("⚠️ Previous stream still active, stopping it first")
+                    await self.stop_streaming()
+                    await asyncio.sleep(0.5)
+                # Double-check after cleanup
+                if self.stream_thread and self.stream_thread.is_alive():
+                    log_error(f"❌ Stream thread STILL running after cleanup! Thread: {self.stream_thread.name}")
+                    raise Exception("Failed to stop previous stream thread")
+                # Reset session
+                self._reset_session()
+                self.single_utterance = config.single_utterance
+                self.current_encoding = config.encoding
+                log_info(f"🎤 Starting Google STT streaming session #{self.session_id} with config: {config}")
+                # Create fresh queues
+                self._create_fresh_queues()
+                self.stop_event.clear()
+                self.should_stop = False
+                # Create new client
+                self.client = speech.SpeechClient()
+                log_info("✅ Created new Google Speech client")
+                # Create recognition config
+                recognition_config = speech.RecognitionConfig(
+                    encoding=speech.RecognitionConfig.AudioEncoding.WEBM_OPUS,
+                    sample_rate_hertz=16000,
+                    language_code="tr-TR",
+                    enable_automatic_punctuation=True,
+                    model="latest_long",
+                    use_enhanced=True,
+                    max_alternatives=1,
+                    metadata=speech.RecognitionMetadata(
+                        interaction_type=speech.RecognitionMetadata.InteractionType.VOICE_SEARCH,
+                        microphone_distance=speech.RecognitionMetadata.MicrophoneDistance.NEARFIELD,
+                        recording_device_type=speech.RecognitionMetadata.RecordingDeviceType.PC,
+                    )
                 )
+                # Create streaming config with VAD
+                self.streaming_config = speech.StreamingRecognitionConfig(
+                    config=recognition_config,
+                    interim_results=True,
+                    single_utterance=False,
+                    enable_voice_activity_events=True  # ✅ VAD events enabled
+                )
+                self.is_streaming = True
+                self.stop_event.clear()
+                # Thread başlatmadan önce son kontrol
+                if self.stream_thread is not None:
+                    log_error("❌ stream_thread should be None at this point!")
+                    self.stream_thread = None
+                self.is_streaming = True
+                # Start streaming thread with unique ID
+                thread_id = f"GoogleSTT-Session-{self.session_id}-{int(time.time()*1000)}"
+                self.stream_thread = threading.Thread(
+                    target=self._run_stream,
+                    name=thread_id
+                )
+                self.stream_thread.daemon = True
+                log_info(f"🚀 Starting thread: {thread_id}")
+                self.stream_thread.start()
+                log_info(f"✅ Google STT streaming session #{self.session_id} started successfully")
         except Exception as e:
             log_error(f"❌ Failed to start Google STT streaming", error=str(e))
     def _run_stream(self):
         """Run the streaming recognition loop in a separate thread"""
         try:
+            thread_id = threading.current_thread().ident
+            log_info(f"🎤 Google STT stream thread started - Thread ID: {thread_id}, Session: {self.session_id}")
             # Create request generator
             requests = self._request_generator()
             # Create streaming client
+            log_info(f"🎤 Creating Google STT streaming client... Thread ID: {thread_id}")
             # Get responses (no timeout parameter!)
             responses = self.client.streaming_recognize(self.streaming_config, requests)