Spaces:

UcsTurkey
/

flare

Building

App Files Community

ciyidogan committed 14 days ago

Commit

6472323

verified ·

1 Parent(s): 1340afa

Update stt/stt_deepgram.py

Browse files

Files changed (1) hide show

stt/stt_deepgram.py +25 -25

stt/stt_deepgram.py CHANGED Viewed

@@ -262,49 +262,49 @@ class DeepgramSTT(STTInterface):
         """Stream audio chunk and get transcription results"""
         if not self.is_streaming or not self.live_connection:
             raise RuntimeError("Streaming not started. Call start_streaming() first.")
-        # Don't send audio if final result already received
-        if self.final_result_received:
-            log_debug("Final result already received, ignoring audio chunk")
-            return
         try:
-            # ✅ İlk birkaç chunk için audio formatını analiz et
             if self.total_chunks < 3:
-                # Linear16 formatı kontrolü
                 if len(audio_chunk) >= 4:
-                    # İlk 2 byte'ı int16 olarak oku
                     import struct
                     try:
-                        # Linear16 ise ilk sample'ı okuyabilmeliyiz
                         first_sample = struct.unpack('<h', audio_chunk[:2])[0]
                         log_info(f"🔊 Audio format check - Chunk #{self.total_chunks}: First sample={first_sample}, Size={len(audio_chunk)} bytes")
-                        # Eğer WebM/Opus ise magic bytes farklı olur
-                        if audio_chunk[:4] == b'webm' or audio_chunk[:4] == b'\x1a\x45\xdf\xa3':
-                            log_error("❌ WebM format detected instead of Linear16!")
                     except:
                         log_warning("⚠️ Could not parse as Linear16")
-            # Send audio to Deepgram
-            self.live_connection.send(audio_chunk)
-            self.total_chunks += 1
-            self.total_audio_bytes += len(audio_chunk)
-            # Log progress
-            if self.total_chunks % 50 == 0:
-                log_debug(f"📊 Listening... {self.total_chunks} chunks, {self.total_audio_bytes/1024:.1f}KB")
-            # Check for final results
             while True:
                 try:
                     result = self.responses_queue.get_nowait()
                     if result.is_final:
                         yield result
                 except queue.Empty:
                     break
         except Exception as e:
             log_error(f"❌ Error streaming audio", error=str(e))
             self.is_streaming = False

         """Stream audio chunk and get transcription results"""
         if not self.is_streaming or not self.live_connection:
             raise RuntimeError("Streaming not started. Call start_streaming() first.")
         try:
+            # İlk birkaç chunk için audio formatını analiz et
             if self.total_chunks < 3:
                 if len(audio_chunk) >= 4:
                     import struct
                     try:
                         first_sample = struct.unpack('<h', audio_chunk[:2])[0]
                         log_info(f"🔊 Audio format check - Chunk #{self.total_chunks}: First sample={first_sample}, Size={len(audio_chunk)} bytes")
                     except:
                         log_warning("⚠️ Could not parse as Linear16")
+            # ✅ Final result geldiyse audio gönderme ama queue'yu kontrol et
+            if not self.final_result_received:
+                # Send audio to Deepgram
+                self.live_connection.send(audio_chunk)
+                self.total_chunks += 1
+                self.total_audio_bytes += len(audio_chunk)
+                # Log progress
+                if self.total_chunks % 50 == 0:
+                    log_debug(f"📊 Listening... {self.total_chunks} chunks, {self.total_audio_bytes/1024:.1f}KB")
+            # ✅ Her zaman queue'yu kontrol et ve result'ları yield et
             while True:
                 try:
                     result = self.responses_queue.get_nowait()
+                    # Log for debugging
+                    log_debug(f"🎯 Yielding result: is_final={result.is_final}, text='{result.text}'")
                     if result.is_final:
+                        self.final_result_received = True
+                        yield result  # ✅ Final result'ı yield et
+                        # Artık yeni audio kabul etme
+                    elif not self.final_result_received:
+                        # Final gelmeden önce interim'leri yield et
                         yield result
                 except queue.Empty:
                     break
         except Exception as e:
             log_error(f"❌ Error streaming audio", error=str(e))
             self.is_streaming = False