Spaces:

manufy
/

tts-gradio

Sleeping

Manu commited on May 18, 2024

Commit

4d1dde6

1 Parent(s): 810b795

testing tts

Files changed (2) hide show

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ *.wav

app.py CHANGED Viewed

@@ -1,5 +1,32 @@
 import gradio as gr
 def greet(name):
     return "Hello " + name + "!!"

 import gradio as gr
+from transformers import pipeline
+from datasets import load_dataset
+import soundfile as sf
+import torch
+import os
+os.environ['TRANSFORMERS_CACHE'] = '.cache'
+print ("----- setting up pipeline -----")
+synthesiser = pipeline("text-to-speech", "microsoft/speecht5_tts")
+print ("----- setting up dataset -----")
+embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
+speaker_embedding = torch.tensor(embeddings_dataset[7306]["xvector"]).unsqueeze(0)
+# You can replace this embedding with your own as well.
+print ("----- synthetizing audio -----")
+speech = synthesiser("Hello, my dog is cooler than you!", forward_params={"speaker_embeddings": speaker_embedding})
+sf.write("speech.wav", speech["audio"], samplerate=speech["sampling_rate"])
 def greet(name):
     return "Hello " + name + "!!"