Spaces:

Vinay15
/

Fine-tuning_TTS_for_a_Regional_Language

Runtime error

Vinay15 committed on Oct 24, 2024

Commit

d248bff

verified ·

1 Parent(s): e43ae25

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,8 +3,8 @@ import torch
 from datasets import load_dataset
 from transformers import SpeechT5Processor, SpeechT5HifiGan, SpeechT5ForTextToSpeech
-# Load the fine-tuned model and vocoder for Italian
-model_id = "Sandiago21/speecht5_finetuned_voxpopuli_it"
 model = SpeechT5ForTextToSpeech.from_pretrained(model_id)
 vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
@@ -12,7 +12,7 @@ vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
 embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
 speaker_embeddings = torch.tensor(embeddings_dataset[7440]["xvector"]).unsqueeze(0)
-# Load processor for the Italian model
 processor = SpeechT5Processor.from_pretrained(model_id)
 # Optional: Text cleanup for Italian-specific characters
@@ -27,7 +27,7 @@ replacements = [
 # Text-to-speech synthesis function
 def synthesize_speech(text):
-    # Clean up text
     for src, dst in replacements:
         text = text.replace(src, dst)
@@ -58,4 +58,4 @@ interface = gr.Interface(
 )
 # Launch the interface
-interface.launch()

 from datasets import load_dataset
 from transformers import SpeechT5Processor, SpeechT5HifiGan, SpeechT5ForTextToSpeech
+# Load the fine-tuned model and vocoder for Italian from the new model ID
+model_id = "Vinay15/speecht5_finetuned_voxpopuli_it"
 model = SpeechT5ForTextToSpeech.from_pretrained(model_id)
 vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
 embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
 speaker_embeddings = torch.tensor(embeddings_dataset[7440]["xvector"]).unsqueeze(0)
+# Load processor for the new Italian model
 processor = SpeechT5Processor.from_pretrained(model_id)
 # Optional: Text cleanup for Italian-specific characters
 # Text-to-speech synthesis function
 def synthesize_speech(text):
+    # Clean up text for Italian-specific accents
     for src, dst in replacements:
         text = text.replace(src, dst)
 )
 # Launch the interface
+interface.launch()