Alidr79 committed on
Commit
663ffb0
·
verified ·
1 Parent(s): 4b467b1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -2
app.py CHANGED
@@ -73,7 +73,7 @@ import librosa
73
  def tts_fn(slider_value, input_text):
74
  audio_embedding = dataset[slider_value]['audio']['array']
75
  sample_rate_embedding = dataset[slider_value]['audio']['sampling_rate']
76
- if original_sr != target_sr:
77
  audio_embedding = librosa.resample(audio_embedding, orig_sr=sample_rate_embedding, target_sr=16_000)
78
 
79
 
@@ -113,6 +113,15 @@ def tts_fn(slider_value, input_text):
113
  return 16000, (audio_out.reshape(-1)).astype(np.int16)
114
 
115
 
 
 
 
 
 
 
 
 
 
116
  import gradio as gr
117
 
118
  slider = gr.Slider(
@@ -131,7 +140,7 @@ text_input = gr.Textbox(
131
 
132
 
133
  demo = gr.Interface(
134
- fn = tts_fn,
135
  inputs=[slider, text_input], # List of inputs
136
  outputs = "audio"
137
  )
 
73
  def tts_fn(slider_value, input_text):
74
  audio_embedding = dataset[slider_value]['audio']['array']
75
  sample_rate_embedding = dataset[slider_value]['audio']['sampling_rate']
76
+ if sample_rate_embedding != 16000:
77
  audio_embedding = librosa.resample(audio_embedding, orig_sr=sample_rate_embedding, target_sr=16_000)
78
 
79
 
 
113
  return 16000, (audio_out.reshape(-1)).astype(np.int16)
114
 
115
 
116
def master_fn(slider_value, input_text):
    """Synthesize ``input_text`` one sentence at a time and join the audio.

    The text is split on "." and each non-blank piece is passed to
    ``tts_fn`` together with ``slider_value``; the returned audio chunks are
    concatenated in order.

    Args:
        slider_value: Forwarded unchanged to ``tts_fn`` (there it indexes the
            reference-audio dataset).
        input_text: Text to synthesize; sentences are delimited by ".".

    Returns:
        A ``(sampling_rate, audio)`` tuple: the sampling rate reported by
        ``tts_fn`` and the concatenation of all per-sentence audio arrays.

    Raises:
        ValueError: If ``input_text`` contains no non-blank sentence.
    """
    # Keep every non-blank piece. Slicing off the last element of the split
    # (the previous approach) silently dropped the final sentence whenever
    # the text did not end with a period, and produced nothing at all for a
    # single sentence without one.
    sentences = [piece for piece in input_text.split(".") if piece.strip()]
    if not sentences:
        # Fail with an explicit message instead of numpy's
        # "need at least one array to concatenate".
        raise ValueError("input_text contains no sentences to synthesize")

    all_speech = []
    for sentence in sentences:
        sampling_rate_response, audio_chunk_response = tts_fn(slider_value, sentence)
        all_speech.append(audio_chunk_response)

    audio_response = np.concatenate(all_speech)
    return sampling_rate_response, audio_response
124
+
125
  import gradio as gr
126
 
127
  slider = gr.Slider(
 
140
 
141
 
142
  demo = gr.Interface(
143
+ fn = master_fn,
144
  inputs=[slider, text_input], # List of inputs
145
  outputs = "audio"
146
  )