Spaces:

UcsTurkey
/

flare

Running

App Files Community

ciyidogan committed 16 days ago

Commit

1340afa

verified ·

1 Parent(s): fe3edc5

Update stt/stt_deepgram.py

Browse files

Files changed (1) hide show

stt/stt_deepgram.py +29 -0

stt/stt_deepgram.py CHANGED Viewed

@@ -178,7 +178,19 @@ class DeepgramSTT(STTInterface):
             if not result:
                 log_warning("⚠️ No result in transcript event")
                 return
             # Access properties directly from the result object
             is_final = result.is_final if hasattr(result, 'is_final') else False
@@ -257,6 +269,23 @@ class DeepgramSTT(STTInterface):
             return
         try:
             # Send audio to Deepgram
             self.live_connection.send(audio_chunk)

             if not result:
                 log_warning("⚠️ No result in transcript event")
                 return
+            # ✅ Debug için result objesini detaylı inceleyin
+            if self.total_chunks < 5:  # İlk birkaç event için
+                log_debug(f"🔍 Result object type: {type(result)}")
+                log_debug(f"🔍 Result dir: {[attr for attr in dir(result) if not attr.startswith('_')]}")
+                # Result'un tüm property'lerini logla
+                try:
+                    if hasattr(result, '__dict__'):
+                        log_debug(f"🔍 Result dict: {result.__dict__}")
+                except:
+                    pass
             # Access properties directly from the result object
             is_final = result.is_final if hasattr(result, 'is_final') else False
             return
         try:
+            # ✅ İlk birkaç chunk için audio formatını analiz et
+            if self.total_chunks < 3:
+                # Linear16 formatı kontrolü
+                if len(audio_chunk) >= 4:
+                    # İlk 2 byte'ı int16 olarak oku
+                    import struct
+                    try:
+                        # Linear16 ise ilk sample'ı okuyabilmeliyiz
+                        first_sample = struct.unpack('<h', audio_chunk[:2])[0]
+                        log_info(f"🔊 Audio format check - Chunk #{self.total_chunks}: First sample={first_sample}, Size={len(audio_chunk)} bytes")
+                        # Eğer WebM/Opus ise magic bytes farklı olur
+                        if audio_chunk[:4] == b'webm' or audio_chunk[:4] == b'\x1a\x45\xdf\xa3':
+                            log_error("❌ WebM format detected instead of Linear16!")
+                    except:
+                        log_warning("⚠️ Could not parse as Linear16")
             # Send audio to Deepgram
             self.live_connection.send(audio_chunk)