Spaces:

UcsTurkey
/

flare

Building

App Files Community

ciyidogan committed 17 days ago

Commit

641d903

verified ·

1 Parent(s): 668e7b4

Update stt_google.py

Browse files

Files changed (1) hide show

stt_google.py +127 -100

stt_google.py CHANGED Viewed

@@ -110,120 +110,147 @@ class GoogleCloudSTT(STTInterface):
             log_error(f"❌ Error queuing result: {e}")
     def _run_stream(self):
-            """Run the streaming recognition in a separate thread"""
-            try:
-                log_info("🎤 Google STT stream thread started")
-                def request_generator():
-                    """Generate streaming requests"""
-                    chunk_count = 0
-                    start_time = datetime.now()
-                    while not self.stop_event.is_set():
-                        try:
-                            # 5 dakika sınırına yaklaşıyorsak stream'i sonlandır
-                            elapsed = (datetime.now() - start_time).total_seconds()
-                            if elapsed > 280:  # 4 dakika 40 saniye - güvenli margin
-                                log_warning(f"⚠️ Approaching 5-minute limit ({elapsed:.1f}s), ending stream gracefully")
-                                break
-                            # Get audio chunk with timeout
-                            chunk = self.audio_queue.get(timeout=0.1)
-                            if chunk is None:  # Poison pill
-                                log_info("📛 Poison pill received, stopping request generator")
-                                break
-                            chunk_count += 1
-                            # Sadece önemli milestone'larda logla
-                            if chunk_count == 1:
-                                log_info(f"📤 First chunk sent to Google STT, size: {len(chunk)} bytes")
-                            elif chunk_count % 100 == 0:
-                                log_info(f"📤 Sent {chunk_count} chunks to Google STT (elapsed: {elapsed:.1f}s)")
-                            yield speech.StreamingRecognizeRequest(audio_content=chunk)
-                        except queue.Empty:
-                            continue
-                        except Exception as e:
-                            log_error(f"❌ Error in request generator: {e}")
                             break
-                # Create streaming client
-                requests = request_generator()
-                log_info("🎤 Creating Google STT streaming client...")
-                try:
-                    responses = self.client.streaming_recognize(self.streaming_config, requests)
-                    log_info("✅ Google STT streaming client created")
-                    # Process responses
-                    response_count = 0
-                    empty_response_count = 0
-                    for response in responses:
-                        response_count += 1
-                        if self.stop_event.is_set():
-                            log_info("🛑 Stop event detected, breaking response loop")
-                            break
-                        # Boş response'ları say ama loglama
-                        if not response.results:
-                            empty_response_count += 1
-                            if empty_response_count % 50 == 0:
-                                log_warning(f"⚠️ Received {empty_response_count} empty responses from Google STT")
                             continue
-                        for result in response.results:
-                            if not result.alternatives:
-                                continue
-                            # İlk alternatifi al
-                            alternative = result.alternatives[0]
-                            # Sadece anlamlı text'leri işle
-                            if alternative.transcript.strip():
-                                # Create transcription result
-                                transcription = TranscriptionResult(
-                                    text=alternative.transcript,
-                                    is_final=result.is_final,
-                                    confidence=alternative.confidence if hasattr(alternative, 'confidence') and alternative.confidence else 0.0,
-                                    timestamp=datetime.now().timestamp()
-                                )
-                                # Put result in queue
-                                self._put_result(transcription)
-                                # SADECE final result'ları logla
-                                if result.is_final:
-                                    log_info(f"🎯 GOOGLE STT FINAL: '{alternative.transcript}'")
-                    log_info(f"📊 Google STT stream ended. Total responses: {response_count}, Empty: {empty_response_count}")
-                except Exception as e:
-                    error_msg = str(e)
-                    # Detaylı hata mesajları
-                    if "Exceeded maximum allowed stream duration" in error_msg:
-                        log_warning("⚠️ Stream duration limit exceeded (5 minutes). This is expected for long sessions.")
-                    elif "Bad language code" in error_msg:
-                        log_error(f"❌ Invalid language code in STT config. Check locale settings.")
-                    elif "invalid_argument" in error_msg:
-                        log_error(f"❌ Invalid STT configuration. Check encoding and sample rate.")
-                    elif "Deadline Exceeded" in error_msg:
-                        log_error(f"❌ Google STT timeout - possibly network issue or slow connection")
-                    elif "503" in error_msg or "Service Unavailable" in error_msg:
-                        log_error(f"❌ Google STT service temporarily unavailable. Will retry...")
-                    else:
-                        log_error(f"❌ Google STT stream error: {error_msg}")
             except Exception as e:
-                import traceback
-                log_error(f"❌ Fatal error in STT stream thread", error=str(e), traceback=traceback.format_exc())
-            finally:
-                log_info("🎤 Google STT stream thread ended")
-                # Thread bittiğinde streaming flag'ini kapat
-                self.is_streaming = False
     async def stream_audio(self, audio_chunk: bytes) -> AsyncIterator[TranscriptionResult]:
         """Stream audio chunk and get transcription results"""

             log_error(f"❌ Error queuing result: {e}")
     def _run_stream(self):
+        """Run the streaming recognition in a separate thread"""
+        try:
+            log_info("🎤 Google STT stream thread started")
+            def request_generator():
+                """Generate streaming requests"""
+                chunk_count = 0
+                total_bytes = 0  # Toplam byte sayısı
+                while not self.stop_event.is_set():
+                    try:
+                        chunk = self.audio_queue.get(timeout=0.1)
+                        if chunk is None:
+                            log_info("📛 Poison pill received, stopping request generator")
                             break
+                        chunk_count += 1
+                        total_bytes += len(chunk)
+                        # İlk chunk'ta audio format kontrolü
+                        if chunk_count == 1:
+                            log_info(f"📤 First chunk - size: {len(chunk)} bytes")
+                            # Audio header kontrolü (WEBM magic bytes)
+                            if chunk[:4] == b'\x1a\x45\xdf\xa3':
+                                log_info("✅ Valid WEBM header detected")
+                            else:
+                                log_warning(f"⚠️ Unknown audio format, first 4 bytes: {chunk[:4].hex()}")
+                        # Her 100 chunk'ta durum raporu
+                        if chunk_count % 100 == 0:
+                            avg_chunk_size = total_bytes / chunk_count
+                            log_info(f"📤 Progress: {chunk_count} chunks, {total_bytes/1024:.1f}KB total, avg {avg_chunk_size:.0f} bytes/chunk")
+                        yield speech.StreamingRecognizeRequest(audio_content=chunk)
+                    except queue.Empty:
+                        continue
+                    except Exception as e:
+                        log_error(f"❌ Error in request generator: {e}")
+                        break
+            # Create streaming client
+            requests = request_generator()
+            log_info("🎤 Creating Google STT streaming client...")
+            try:
+                responses = self.client.streaming_recognize(
+                    self.streaming_config,
+                    requests,
+                    timeout=300 # 5 dakika timeout
+                )
+                log_info("✅ Google STT streaming client created")
+                # Response timeout kontrolü
+                last_response_time = time.time()
+                RESPONSE_TIMEOUT = 30  # 30 saniye içinde response gelmezse
+                # Process responses
+                response_count = 0
+                empty_response_count = 0
+                for response in responses:
+                    last_response_time = time.time()
+                    response_count += 1
+                    # Response type'ı logla
+                    if response_count == 1:
+                        log_info(f"📨 First response received from Google STT")
+                    if self.stop_event.is_set():
+                        log_info("🛑 Stop event detected, breaking response loop")
+                        break
+                    # Response içeriğini kontrol et
+                    if not response.results:
+                        empty_response_count += 1
+                        if empty_response_count == 1:
+                            log_debug("📭 Received empty response (no results)")
+                        continue
+                    for i, result in enumerate(response.results):
+                        log_debug(f"📋 Result {i}: is_final={result.is_final}, alternatives={len(result.alternatives)}")
+                        if not result.alternatives:
+                            log_debug(f"📋 Result {i} has no alternatives")
                             continue
+                        # İlk alternatifi al
+                        alternative = result.alternatives[0]
+                        # Sadece anlamlı text'leri işle
+                        if alternative.transcript.strip():
+                            # Create transcription result
+                            transcription = TranscriptionResult(
+                                text=alternative.transcript,
+                                is_final=result.is_final,
+                                confidence=alternative.confidence if hasattr(alternative, 'confidence') and alternative.confidence else 0.0,
+                                timestamp=datetime.now().timestamp()
+                            )
+                            # Put result in queue
+                            self._put_result(transcription)
+                            # SADECE final result'ları logla
+                            if result.is_final:
+                                log_info(f"🎯 GOOGLE STT FINAL: '{alternative.transcript}'")
+                        else:
+                            log_debug(f"📋 Result {i} has empty transcript")
+                            continue
+                if time.time() - last_response_time > RESPONSE_TIMEOUT:
+                    log_error(f"❌ No response from Google STT for {RESPONSE_TIMEOUT} seconds")
+                log_info(f"📊 Google STT stream ended. Total responses: {response_count}, Empty: {empty_response_count}")
             except Exception as e:
+                error_msg = str(e)
+                # Detaylı hata mesajları
+                if "Exceeded maximum allowed stream duration" in error_msg:
+                    log_warning("⚠️ Stream duration limit exceeded (5 minutes). This is expected for long sessions.")
+                elif "Bad language code" in error_msg:
+                    log_error(f"❌ Invalid language code in STT config. Check locale settings.")
+                elif "invalid_argument" in error_msg:
+                    log_error(f"❌ Invalid STT configuration. Check encoding and sample rate.")
+                elif "Deadline Exceeded" in error_msg:
+                    log_error(f"❌ Google STT response timeout - possibly network issue or slow connection")
+                elif "503" in error_msg or "Service Unavailable" in error_msg:
+                    log_error(f"❌ Google STT service temporarily unavailable. Will retry...")
+                else:
+                    log_error(f"❌ Google STT stream error: {error_msg}")
+        except Exception as e:
+            import traceback
+            log_error(f"❌ Fatal error in STT stream thread", error=str(e), traceback=traceback.format_exc())
+        finally:
+            log_info("🎤 Google STT stream thread ended")
+            # Thread bittiğinde streaming flag'ini kapat
+            self.is_streaming = False
     async def stream_audio(self, audio_chunk: bytes) -> AsyncIterator[TranscriptionResult]:
         """Stream audio chunk and get transcription results"""