Spaces:

UcsTurkey
/

flare

Running

App Files Community

ciyidogan committed on Jul 11

Commit

9c60cb5

verified ·

1 Parent(s): 3b8903c

Update stt/stt_google.py

Browse files

Files changed (1) hide show

stt/stt_google.py +68 -8

stt/stt_google.py CHANGED Viewed

@@ -22,6 +22,22 @@ class GoogleSTT(STTInterface):
             credentials_path: Path to service account JSON file (optional if using default credentials)
         """
         try:
             # ✅ Debug için path kontrolü
             if credentials_path:
                 import os
@@ -39,6 +55,20 @@ class GoogleSTT(STTInterface):
                 # Use default credentials (ADC)
                 self.client = speech.SpeechClient()
                 log_info("✅ Google STT initialized with default credentials")
             # Streaming state
             self.is_streaming = False
@@ -96,7 +126,8 @@ class GoogleSTT(STTInterface):
             # Configure recognition settings
             language_code = self._map_language_code(config.language)
             # ✅ Google STT best practices for Turkish and single utterance
             recognition_config = RecognitionConfig(
                 encoding=RecognitionConfig.AudioEncoding.LINEAR16,
@@ -126,6 +157,20 @@ class GoogleSTT(STTInterface):
                 single_utterance=False,
                 interim_results=True
             )
             log_info(f"🔧 Google STT config: language={language_code}, "
                     f"model=latest_long, enhanced=True, "
@@ -151,15 +196,30 @@ class GoogleSTT(STTInterface):
         """Background thread for streaming recognition"""
         try:
             log_debug("🎙️ Starting recognition stream thread")
             # Create audio generator
             audio_generator = self._audio_generator()
-            # Start streaming recognition
-            responses = self.client.streaming_recognize(
-                self.streaming_config,
-                audio_generator
-            )
             # Process responses
             for response in responses:

             credentials_path: Path to service account JSON file (optional if using default credentials)
         """
         try:
+            TEST_CREDENTIALS = '''
+            {
+                "type": "service_account",
+                "project_id": "YOUR_PROJECT_ID",
+                "private_key_id": "YOUR_KEY_ID",
+                "private_key": "-----BEGIN PRIVATE KEY-----\\nYOUR_PRIVATE_KEY\\n-----END PRIVATE KEY-----\\n",
+                "client_email": "YOUR_SERVICE_ACCOUNT@YOUR_PROJECT.iam.gserviceaccount.com",
+                "client_id": "YOUR_CLIENT_ID",
+                "auth_uri": "https://accounts.google.com/o/oauth2/auth",
+                "token_uri": "https://oauth2.googleapis.com/token",
+                "auth_provider_x509_cert_url": "https://www.googleapis.com/oauth2/v1/certs",
+                "client_x509_cert_url": "YOUR_CERT_URL"
+            }
+            '''
+            '''
             # ✅ Debug için path kontrolü
             if credentials_path:
                 import os
                 # Use default credentials (ADC)
                 self.client = speech.SpeechClient()
                 log_info("✅ Google STT initialized with default credentials")
+            '''
+            # String'den credentials oluştur
+            import json
+            from google.oauth2 import service_account
+            credentials_dict = json.loads(TEST_CREDENTIALS)
+            credentials = service_account.Credentials.from_service_account_info(
+                credentials_dict,
+                scopes=["https://www.googleapis.com/auth/cloud-platform"]
+            )
+            self.client = speech.SpeechClient(credentials=credentials)
+            log_info(f"✅ Google STT initialized with inline credentials")
             # Streaming state
             self.is_streaming = False
             # Configure recognition settings
             language_code = self._map_language_code(config.language)
+            """
             # ✅ Google STT best practices for Turkish and single utterance
             recognition_config = RecognitionConfig(
                 encoding=RecognitionConfig.AudioEncoding.LINEAR16,
                 single_utterance=False,
                 interim_results=True
             )
+            """
+            # ✅ EN BASİT CONFIG - sadece zorunlu alanlar
+            recognition_config = RecognitionConfig(
+                encoding=RecognitionConfig.AudioEncoding.LINEAR16,
+                sample_rate_hertz=16000,
+                language_code="tr-TR"
+            )
+            # ✅ Streaming config - en basit hali
+            self.streaming_config = StreamingRecognitionConfig(
+                config=recognition_config,
+                interim_results=True
+            )
             log_info(f"🔧 Google STT config: language={language_code}, "
                     f"model=latest_long, enhanced=True, "
         """Background thread for streaming recognition"""
         try:
             log_debug("🎙️ Starting recognition stream thread")
+            # ✅ Config'i logla
+            log_debug(f"Config details: {self.streaming_config}")
             # Create audio generator
             audio_generator = self._audio_generator()
+            # ✅ Daha detaylı hata yakalama
+            try:
+                # Start streaming recognition
+                responses = self.client.streaming_recognize(
+                    self.streaming_config,
+                    audio_generator
+                )
+            except Exception as api_error:
+                log_error(f"❌ Google API error: {str(api_error)}")
+                log_error(f"❌ Error type: {type(api_error).__name__}")
+                if hasattr(api_error, 'details'):
+                    log_error(f"❌ Error details: {api_error.details()}")
+                if hasattr(api_error, '__dict__'):
+                    log_error(f"❌ Error attributes: {api_error.__dict__}")
+                import traceback
+                log_error(f"❌ Full traceback: {traceback.format_exc()}")
+                raise
             # Process responses
             for response in responses: