Spaces:

UcsTurkey
/

flare

Building

App Files Community

ciyidogan committed 16 days ago

Commit

975aa9d

verified ·

1 Parent(s): 04f1304

Update stt/stt_google.py

Browse files

Files changed (1) hide show

stt/stt_google.py +69 -58

stt/stt_google.py CHANGED Viewed

@@ -27,44 +27,47 @@ from .stt_interface import STTInterface, STTConfig, TranscriptionResult
 class GoogleCloudSTT(STTInterface):
     """Google Cloud Speech-to-Text implementation"""
-    def __init__(self, credentials_path: str):
-        if not GOOGLE_SPEECH_AVAILABLE:
-            raise ImportError("google-cloud-speech library not installed. Run: pip install google-cloud-speech")
-        if credentials_path and os.path.exists(credentials_path):
-            os.environ['GOOGLE_APPLICATION_CREDENTIALS'] = credentials_path
-            log_info(f"✅ Google credentials set from: {credentials_path}")
-            # Test credential'ları
-            try:
-                # Client'ı burada oluşturma, her seferinde yeni instance oluştur
-                test_client = speech.SpeechClient()
-                log_info("🔐 Testing Google credentials...")
-                log_info("✅ Google credentials valid")
-                # Test client'ı kapat
-                if hasattr(test_client, 'transport') and hasattr(test_client.transport, 'close'):
-                    test_client.transport.close()
-            except Exception as e:
-                log_error(f"❌ Google credentials error", error=str(e))
-                raise
-        else:
-            log_error(f"❌ Google credentials path not found: {credentials_path}")
-            raise FileNotFoundError(f"Credentials file not found: {credentials_path}")
-        # Client'ı burada oluşturma, start_streaming'de oluştur
         self.client = None
         self.streaming_config = None
-        self.is_streaming = False
-        self.audio_queue = None  # Queue'ları None olarak başlat
-        self.responses_queue = None
         self.stream_thread = None
-        self.stop_event = threading.Event()
-        self.credentials_path = credentials_path
-        # Session tracking
         self.session_id = 0
-        self.total_audio_bytes = 0
-        self.total_chunks = 0
     def _get_encoding(self, encoding_str: str):
         """Convert encoding string to Google Speech enum"""
@@ -248,31 +251,37 @@ class GoogleCloudSTT(STTInterface):
         """Get provider name"""
         return "google"
-    def _reset_session_data(self):
-        """Reset all session-specific data"""
-        # Queue'ları temizle
-        if self.audio_queue:
-            while not self.audio_queue.empty():
-                try:
-                    self.audio_queue.get_nowait()
-                except:
-                    pass
-        if self.responses_queue:
-            while not self.responses_queue.empty():
-                try:
-                    self.responses_queue.get_nowait()
-                except:
-                    pass
-        # Counters'ı sıfırla
-        self.total_audio_bytes = 0
-        self.total_chunks = 0
-        # Yeni session ID
         self.session_id += 1
         log_info(f"🔄 Google STT session data reset. New session ID: {self.session_id}")
     def _create_fresh_queues(self):
         """Create fresh queue instances"""
@@ -308,6 +317,8 @@ class GoogleCloudSTT(STTInterface):
             # Session verilerini resetle ve ID'yi artır
             self._reset_session_data()
             log_info(f"🎤 Starting Google STT streaming session #{self.session_id} with config: {config}")
@@ -329,7 +340,7 @@ class GoogleCloudSTT(STTInterface):
                     encoding=config.get("encoding", "WEBM_OPUS"),
                     enable_punctuation=config.get("enable_punctuation", True),
                     interim_results=config.get("interim_results", False),
-                    single_utterance=config.get("single_utterance", True)
                 )
             else:
                 stt_config = config

 class GoogleCloudSTT(STTInterface):
     """Google Cloud Speech-to-Text implementation"""
+    def __init__(self):
+        """Initialize Google Cloud STT"""
+        log_info("🎤 Creating STT provider: google")
+        # Initialize all required attributes
         self.client = None
         self.streaming_config = None
         self.stream_thread = None
+        self.audio_queue = queue.Queue()
+        self.responses_queue = queue.Queue()
+        self.is_streaming = False
+        self.should_stop = False
+        self.error_message = None
         self.session_id = 0
+        self.stream_start_time = None
+        # ✅ Eksik attribute'ları ekleyelim
+        self.lock = threading.Lock()  # Thread lock
+        self.single_utterance = False  # Default value
+        self.chunk_count = 0  # Audio chunk counter
+        self.total_bytes = 0  # Total bytes received
+        # Check Google credentials
+        creds_path = os.environ.get("GOOGLE_APPLICATION_CREDENTIALS")
+        if not creds_path:
+            # Try default location
+            creds_path = "./credentials/google-service-account.json"
+            if os.path.exists(creds_path):
+                os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = creds_path
+                log_info(f"✅ Google credentials set from: {creds_path}")
+            else:
+                raise ValueError("Google credentials not found. Please set GOOGLE_APPLICATION_CREDENTIALS")
+        # Test credentials
+        try:
+            log_info("🔐 Testing Google credentials...")
+            test_client = speech.SpeechClient()
+            log_info("✅ Google credentials valid")
+        except Exception as e:
+            log_error(f"❌ Invalid Google credentials: {e}")
+            raise
     def _get_encoding(self, encoding_str: str):
         """Convert encoding string to Google Speech enum"""
         """Get provider name"""
         return "google"
+    def _reset_session(self):
+        """Reset session data"""
+        # Clear queues
+        while not self.audio_queue.empty():
+            try:
+                self.audio_queue.get_nowait()
+            except queue.Empty:
+                break
+        while not self.responses_queue.empty():
+            try:
+                self.responses_queue.get_nowait()
+            except queue.Empty:
+                break
+        # Reset state
+        self.should_stop = False
+        self.error_message = None
         self.session_id += 1
+        self.stream_start_time = time.time()
+        # ✅ Counter'ları sıfırla
+        self.chunk_count = 0
+        self.total_bytes = 0
         log_info(f"🔄 Google STT session data reset. New session ID: {self.session_id}")
+        # Create fresh queues to be extra safe
+        self.audio_queue = queue.Queue()
+        self.responses_queue = queue.Queue()
+        log_debug("✅ Created fresh queues")
     def _create_fresh_queues(self):
         """Create fresh queue instances"""
             # Session verilerini resetle ve ID'yi artır
             self._reset_session_data()
+            self.single_utterance = config.get("single_utterance", True)
             log_info(f"🎤 Starting Google STT streaming session #{self.session_id} with config: {config}")
                     encoding=config.get("encoding", "WEBM_OPUS"),
                     enable_punctuation=config.get("enable_punctuation", True),
                     interim_results=config.get("interim_results", False),
+                    single_utterance=self.single_utterance
                 )
             else:
                 stt_config = config