Spaces:

UcsTurkey
/

flare

Building

App Files Community

ciyidogan committed 16 days ago

Commit

9c4de2d

verified ·

1 Parent(s): 61eaacc

Update websocket_handler.py

Browse files

Files changed (1) hide show

websocket_handler.py +6 -9

websocket_handler.py CHANGED Viewed

@@ -491,7 +491,7 @@ async def handle_audio_chunk(websocket: WebSocket, session: RealtimeSession, mes
         # Decode for processing
         decoded_audio = base64.b64decode(audio_data)
-        # Check silence - LOGLAMA YAPMA
         silence_duration = session.silence_detector.update(decoded_audio)
         # Stream to STT if available
@@ -510,7 +510,7 @@ async def handle_audio_chunk(websocket: WebSocket, session: RealtimeSession, mes
                     return
             try:
-                # Chunk counter - sadece önemli milestone'larda logla
                 if not hasattr(session, 'chunk_counter'):
                     session.chunk_counter = 0
                 session.chunk_counter += 1
@@ -522,7 +522,7 @@ async def handle_audio_chunk(websocket: WebSocket, session: RealtimeSession, mes
                 # STT'ye gönder ve sonuçları bekle
                 async for result in session.stt_manager.stream_audio(decoded_audio):
-                    # SADECE FINAL RESULT'LARI LOGLA VE GÖNDER
                     if result.is_final:
                         log_info(f"✅ FINAL TRANSCRIPTION: '{result.text}'", session_id=session.session.session_id)
@@ -549,14 +549,11 @@ async def handle_audio_chunk(websocket: WebSocket, session: RealtimeSession, mes
                             # Process user input
                             await process_user_input(websocket, session)
-                            # STT'den final result geldiğinde audio buffer'ı ve transcription'ı resetle
                             await session.reset_for_new_utterance()
-                            return  # Bu audio chunk için işlem tamamlandı
-                    # Interim result'ları SADECE ilk kelimede logla (konuşma başlangıcı)
-                    elif result.text.strip() and not hasattr(session, 'speech_started'):
-                        session.speech_started = True
-                        log_info(f"🎤 User started speaking", session_id=session.session.session_id)
             except Exception as e:
                 log_error(f"❌ STT streaming error", error=str(e), traceback=traceback.format_exc(), session_id=session.session.session_id)

         # Decode for processing
         decoded_audio = base64.b64decode(audio_data)
+        # Check silence
         silence_duration = session.silence_detector.update(decoded_audio)
         # Stream to STT if available
                     return
             try:
+                # Chunk counter
                 if not hasattr(session, 'chunk_counter'):
                     session.chunk_counter = 0
                 session.chunk_counter += 1
                 # STT'ye gönder ve sonuçları bekle
                 async for result in session.stt_manager.stream_audio(decoded_audio):
+                    # SADECE FINAL RESULT'LARI İŞLE
                     if result.is_final:
                         log_info(f"✅ FINAL TRANSCRIPTION: '{result.text}'", session_id=session.session.session_id)
                             # Process user input
                             await process_user_input(websocket, session)
+                            # Reset for new utterance
                             await session.reset_for_new_utterance()
+                            return
+                    # Interim result'ları artık göndermiyoruz ve loglama yapmıyoruz
             except Exception as e:
                 log_error(f"❌ STT streaming error", error=str(e), traceback=traceback.format_exc(), session_id=session.session.session_id)