youngshen committed on
Commit
183bb88
•
1 Parent(s): c335e76

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -38,7 +38,8 @@ def predict(text, preset):
38
  input_ids = inputs["input_ids"]
39
  input_ids = input_ids[..., :model.config.max_text_positions]
40
 
41
- speaker_embedding = np.load('spkemb/cmu_us_awb_arctic-wav-arctic_a0002.npy', allow_pickle=True)
 
42
  speaker_embedding = torch.tensor(speaker_embedding).unsqueeze(0)
43
  speech = model.generate_speech(input_ids, speaker_embedding, vocoder=vocoder)
44
 
@@ -46,11 +47,10 @@ def predict(text, preset):
46
  return (16000, speech)
47
 
48
 
49
- title = "SpeechT5: Speech Synthesis"
50
 
51
  description = """
52
- The <b>SpeechT5</b> model is pre-trained on text as well as speech inputs, with targets that are also a mix of text and speech.
53
- By pre-training on text and speech at the same time, it learns unified representations for both, resulting in improved modeling capabilities.
54
  """
55
 
56
  article = """
 
38
  input_ids = inputs["input_ids"]
39
  input_ids = input_ids[..., :model.config.max_text_positions]
40
 
41
+ # cmu_us_awb_arctic-wav-arctic_a0002.npy
42
+ speaker_embedding = np.load('spkemb/cmu_us_bdl_arctic-wav-arctic_a0009.npy', allow_pickle=True)
43
  speaker_embedding = torch.tensor(speaker_embedding).unsqueeze(0)
44
  speech = model.generate_speech(input_ids, speaker_embedding, vocoder=vocoder)
45
 
 
47
  return (16000, speech)
48
 
49
 
50
+ title = "Create 423: News to Speech"
51
 
52
  description = """
53
+ Create 423: News to Speech
 
54
  """
55
 
56
  article = """