Spaces:

Hammad112
/

Voice_clone

Running

Hammad112 committed on Feb 25

Commit

d1ac783

verified ·

1 Parent(s): 084f05a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,21 +1,14 @@
 import streamlit as st
-import outetts
-from scipy.io.wavfile import write
 import tempfile
 import os
 from pydub import AudioSegment
-# Initialize model configuration
-model_config = outetts.HFModelConfig_v1(
-    model_path="OuteAI/OuteTTS-0.2-500M",
-    language="en"  # Supported languages: en, zh, ja, ko
-)
-# Initialize the interface
-interface = outetts.InterfaceHF(model_version="0.2", cfg=model_config)
 # Streamlit UI
-st.title("OuteTTS Speech Synthesis")
 st.write("Enter text below to generate speech.")
 # Sidebar for reference voice
@@ -38,18 +31,17 @@ text_input = st.text_area("Text to convert to speech:", "Hello, this is an AI-ge
 if st.button("Generate Speech"):
     with st.spinner("Generating audio..."):
-        # Generate speech with reference audio
-        output = interface.generate(
             text=text_input,
-            temperature=0.1,
-            repetition_penalty=1.1,
-            max_length=4096
         )
-        # Save the synthesized speech to a file
-        output_path = "output.wav"
-        output.save(output_path)
         # Play the audio in the Streamlit app
         st.audio(output_path, format="audio/wav")
         st.success("Speech generated successfully!")

 import streamlit as st
+from TTS.api import TTS
 import tempfile
 import os
 from pydub import AudioSegment
+# Initialize the TTS model
+tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2", gpu=True)
 # Streamlit UI
+st.title("XTTS v2 Speech Synthesis")
 st.write("Enter text below to generate speech.")
 # Sidebar for reference voice
 if st.button("Generate Speech"):
     with st.spinner("Generating audio..."):
+        # Define output path
+        output_path = "output.wav"
+        # Generate speech using XTTS v2
+        tts.tts_to_file(
             text=text_input,
+            file_path=output_path,
+            speaker_wav=ref_audio_path if ref_audio_path else None,
+            language="en"
         )
         # Play the audio in the Streamlit app
         st.audio(output_path, format="audio/wav")
         st.success("Speech generated successfully!")