Upload 2 files
app.py (CHANGED)
@@ -2,6 +2,7 @@ import gradio as gr
 import torch
 from speechbrain.inference.TTS import Tacotron2
 from speechbrain.inference.vocoders import HIFIGAN
+from scipy.io.wavfile import write
 
 # Load the models
 hifi_gan = HIFIGAN.from_hparams(source="speechbrain/tts-hifigan-ljspeech", savedir="tmpdir_vocoder")
@@ -17,8 +18,9 @@ def synthesize_speech(text):
     waveforms = hifi_gan.decode_batch(mel_output)
 
     # Save the torch tensor as a wav file
-
-
+    # Set the sampling rate to 22050
+    write("speech.wav", rate=22050, data=waveforms.squeeze().cpu().numpy())
+    return "speech.wav"
 
 # Create the Gradio interface
 iface = gr.Interface(
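For context, a minimal sketch of what the complete app.py could look like after this change. Everything outside the hunks above (the Tacotron2 model loading, the start of synthesize_speech, and the arguments to gr.Interface) is not visible in the diff, so those parts are assumptions based on the standard SpeechBrain Tacotron2 + HiFi-GAN example and a minimal Gradio text-to-audio app.

import gradio as gr
import torch
from speechbrain.inference.TTS import Tacotron2
from speechbrain.inference.vocoders import HIFIGAN
from scipy.io.wavfile import write

# Load the models (the Tacotron2 call is assumed; only the HiFi-GAN line appears in the diff)
hifi_gan = HIFIGAN.from_hparams(source="speechbrain/tts-hifigan-ljspeech", savedir="tmpdir_vocoder")
tacotron2 = Tacotron2.from_hparams(source="speechbrain/tts-tacotron2-ljspeech", savedir="tmpdir_tts")

def synthesize_speech(text):
    # Text -> mel spectrogram (assumed; this part of the function is outside the diff)
    mel_output, mel_length, alignment = tacotron2.encode_text(text)

    # Mel spectrogram -> waveform
    waveforms = hifi_gan.decode_batch(mel_output)

    # Save the torch tensor as a wav file
    # Set the sampling rate to 22050 (the LJSpeech models operate at 22050 Hz)
    write("speech.wav", rate=22050, data=waveforms.squeeze().cpu().numpy())
    return "speech.wav"

# Create the Gradio interface (arguments are assumed; the diff is truncated here)
iface = gr.Interface(
    fn=synthesize_speech,
    inputs="text",
    outputs="audio",
)

iface.launch()

With this setup, scipy.io.wavfile.write stores the float32 waveform as a 32-bit float WAV at 22050 Hz, and synthesize_speech returns the file path so a Gradio audio output component can play the result.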