Spaces:

tykiww
/

TTS_Demo

Runtime error

App Files Community

tykiww committed on Jul 26, 2024

Commit

3a4510f

verified ·

1 Parent(s): aca53ab

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -15

app.py CHANGED Viewed

@@ -3,6 +3,8 @@ from TTS.api import TTS
 import gradio as gr
 import os
 import spaces
 #inference:
 #  file_path: "output.wav"
@@ -10,42 +12,49 @@ import spaces
 #  language: "en"
 # Agree to Terms of service
 # os.environ["COQUI_TOS_AGREED"] = "1"
-def init_TTS():
     # Get device
     device = "cuda" if torch.cuda.is_available() else "cpu"
     # Initialize the TTS model
-    tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
     return tts
 @spaces.GPU
-def generate_speech(text):
     # Generate speech using the provided text, speaker voice, and language
-    file_path = "output.wav"
-    speaker_wav = "content/speaker.wav"
-    language = "en"
     tts.tts_to_file(text=text,
-                    file_path=file_path,
-                    speaker_wav=speaker_wav,
-                    language=language)
     return file_path
-def main():
-    # call init
-    tts = init_TTS()
     # Create the Gradio interface
     interface = gr.Interface(
         fn=generate_speech,
         inputs=[
-            gr.Textbox(label="Enter your text")
             #gr.Textbox(label="Path to target speaker WAV file", value="/content/speaker.wav")
             #gr.Dropdown(label="Language", choices=["en"], value="en")
         ],
@@ -59,7 +68,11 @@ def main():
     return 0
 if __name__ == "__main__":
-    main()

 import gradio as gr
 import os
 import spaces
+import yaml
 #inference:
 #  file_path: "output.wav"
 #  language: "en"
+def get_config():
+    # get config path
+    config_path = os.environ["CONFIG_PATH"]
+    # Parse the YAML file
+    with open(config_path, 'r') as file:
+        config = yaml.safe_load(file)
+    print(config['inference'])
+    print(config_path)
+    return config
 # Agree to Terms of service
 # os.environ["COQUI_TOS_AGREED"] = "1"
+def init_TTS(config):
     # Get device
     device = "cuda" if torch.cuda.is_available() else "cpu"
     # Initialize the TTS model
+    tts = TTS(config['inference']['model']).to(device)
     return tts
 @spaces.GPU
+def generate_speech(text, config):
     # Generate speech using the provided text, speaker voice, and language
     tts.tts_to_file(text=text,
+                    file_path=config['inference']['file_path'],
+                    speaker_wav=config['inference']['speaker_wav'],
+                    language=config['inference']['language'])
     return file_path
+def main(config):
     # Create the Gradio interface
     interface = gr.Interface(
         fn=generate_speech,
         inputs=[
+            gr.Textbox(label="Enter your text"),
+            config
             #gr.Textbox(label="Path to target speaker WAV file", value="/content/speaker.wav")
             #gr.Dropdown(label="Language", choices=["en"], value="en")
         ],
     return 0
 if __name__ == "__main__":
+    # Get config
+    config = get_config()
+    # initialize TTS
+    tts = init_TTS(config)
+    main(config)