Spaces:

UcsTurkey
/

flare

Building

App Files Community

ciyidogan committed on about 1 month ago

Commit

7368651

verified ·

1 Parent(s): fd48230

Update tts_interface.py

Browse files

Files changed (1) hide show

tts_interface.py +20 -1

tts_interface.py CHANGED Viewed

@@ -46,13 +46,29 @@ class ElevenLabsTTS(TTSInterface):
         self.base_url = "https://api.elevenlabs.io/v1"
         self.default_voice_id = "2thYbn2sOGtiTwd9QwWH" # Avencia
-                # Debug log
         masked_key = f"{api_key[:4]}...{api_key[-4:]}" if len(api_key) > 8 else "***"
         log(f"🔑 ElevenLabsTTS initialized with key: {masked_key}")
     async def synthesize(self, text: str, voice_id: Optional[str] = None, **kwargs) -> bytes:
         """Convert text to speech using ElevenLabs API"""
         try:
             voice = voice_id or self.default_voice_id
             url = f"{self.base_url}/text-to-speech/{voice}"
@@ -114,6 +130,9 @@ class ElevenLabsTTS(TTSInterface):
             "yoZ06aMxZJJ28mfd3POQ": "Sam (Male)",
         }
 class BlazeTTS(TTSInterface):
     """Placeholder for future Blaze TTS implementation"""

         self.base_url = "https://api.elevenlabs.io/v1"
         self.default_voice_id = "2thYbn2sOGtiTwd9QwWH" # Avencia
+        # ElevenLabs için preprocessing gereken alanlar
+        self.preprocessing_flags = {
+            TTSPreprocessor.PREPROCESS_NUMBERS,    # Büyük sayılar
+            TTSPreprocessor.PREPROCESS_CURRENCY,   # Para birimleri
+            TTSPreprocessor.PREPROCESS_TIME,       # Saat formatı
+            TTSPreprocessor.PREPROCESS_CODES,      # PNR kodları
+            TTSPreprocessor.PREPROCESS_PERCENTAGE  # Yüzdeler
+        }
+        self.preprocessor = TTSPreprocessor(language="tr")
+        # Debug log
         masked_key = f"{api_key[:4]}...{api_key[-4:]}" if len(api_key) > 8 else "***"
         log(f"🔑 ElevenLabsTTS initialized with key: {masked_key}")
     async def synthesize(self, text: str, voice_id: Optional[str] = None, **kwargs) -> bytes:
         """Convert text to speech using ElevenLabs API"""
         try:
+            # Apply preprocessing if not disabled
+            if kwargs.get("disable_preprocessing", False) != True:
+                text = self.preprocessor.preprocess(text, self.preprocessing_flags)
+                log(f"📝 Preprocessed text: {text[:100]}...")
             voice = voice_id or self.default_voice_id
             url = f"{self.base_url}/text-to-speech/{voice}"
             "yoZ06aMxZJJ28mfd3POQ": "Sam (Male)",
         }
+    def get_preprocessing_flags(self) -> Set[str]:
+        """Get preprocessing flags for ElevenLabs"""
+        return self.preprocessing_flags
 class BlazeTTS(TTSInterface):
     """Placeholder for future Blaze TTS implementation"""