Spaces:

miya3333
/

TTSDemo

Running

miya3333 committed on Jan 3

Commit

881ca56

verified ·

1 Parent(s): a152706

Upload 2 files

Files changed (2) hide show

app.py CHANGED Viewed

@@ -1,15 +1,17 @@
 import gradio as gr
 from transformers import pipeline
 import torch
-# モデルのロード (例: Tacotron2 + WaveGlow)
-synthesizer = pipeline("text-to-speech", "tts_model_name", device=0)  # モデル名を指定, GPUを使う場合は device=0
 # 推論関数の定義
 def synthesize_speech(text):
     with torch.no_grad():
-      audio = synthesizer(text)
-    return (synthesizer.sampling_rate, audio["audio"].numpy())
 # Gradioインターフェースの作成
 iface = gr.Interface(

 import gradio as gr
 from transformers import pipeline
+import soundfile as sf
 import torch
+# モデルのロード (例: speechbrain/tts-hifigan-ljspeech)
+synthesizer = pipeline("text-to-speech", "speechbrain/tts-hifigan-ljspeech")
 # 推論関数の定義
 def synthesize_speech(text):
     with torch.no_grad():
+        output = synthesizer(text)
+    sf.write("speech.wav", output["audio"], output["sampling_rate"]) #numpy arrayからwavファイルに変換
+    return "speech.wav"
 # Gradioインターフェースの作成
 iface = gr.Interface(

requirements.txt CHANGED Viewed

@@ -1,4 +1,4 @@
 gradio
 transformers
 torch
-espnet

 gradio
 transformers
 torch
+soundfile