Spaces:

Vinay15
/

Text-to-Speech_Model_for_English_Technical_Speech

Sleeping

Vinay15 committed on Oct 27, 2024

Commit

8fa00e8

verified ·

1 Parent(s): 7b03b11

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -25,10 +25,17 @@ def preprocess_text(text):
         text = text.replace(term.upper(), phonetic)
     return text
 # Step 2: Define the TTS function with sentence segmentation
 def text_to_speech(input_text):
     # Preprocess and segment text
     processed_text = preprocess_text(input_text)
     # Split the processed text by punctuation to form shorter segments
     segments = re.split(r'(?<=[.!?]) +', processed_text)
@@ -62,9 +69,9 @@ iface = gr.Interface(
     title="Fine-tuning TTS for Technical Vocabulary",
     description="Enter text with technical jargon for TTS conversion. The model will handle abbreviations and technical terms for better pronunciation.",
     examples=[
-        ["Please configure the API settings for OAuth and JSON data processing."],
-        ["Ensure that CUDA and TensorFlow are optimized for deep learning models."],
-        ["Update the SQL database to include REST endpoints and support NOSQL features."]
     ]
 )

         text = text.replace(term.upper(), phonetic)
     return text
+# Replace each literal "API" in the text with the phonetic respelling "ay p eei" to improve pronunciation
+def custom_acronym_pronunciation(text):
+    text = text.replace("API", "ay p eei")  # plain case-sensitive substring match, so "APIs" is rewritten too
+    return text
 # Step 2: Define the TTS function with sentence segmentation
 def text_to_speech(input_text):
     # Preprocess and segment text
     processed_text = preprocess_text(input_text)
+    # Apply custom acronym handling
+    processed_text = custom_acronym_pronunciation(processed_text)
     # Split the processed text by punctuation to form shorter segments
     segments = re.split(r'(?<=[.!?]) +', processed_text)
     title="Fine-tuning TTS for Technical Vocabulary",
     description="Enter text with technical jargon for TTS conversion. The model will handle abbreviations and technical terms for better pronunciation.",
     examples=[
+        ["The API allows integration with OAuth and REST for scalable web services."],
+        ["Using CUDA for deep learning optimizes the model training on GPUs."],
+        ["In TTS models, the vocoder is essential for natural-sounding speech."]
     ]
 )