Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -3,6 +3,7 @@ import langcodes
|
|
3 |
from transformers import pipeline, VitsModel, AutoTokenizer, set_seed
|
4 |
from huggingface_hub import InferenceClient
|
5 |
from langdetect import detect, DetectorFactory
|
|
|
6 |
import uuid
|
7 |
import scipy.io.wavfile as wav
|
8 |
|
@@ -144,6 +145,15 @@ with playground:
|
|
144 |
# generate_audio_button = gr.Button(value="Generate Audio", variant="primary")
|
145 |
audio_output = gr.Audio(type="filepath", label="Generated Speech")
|
146 |
ITT_Clear_button = gr.ClearButton(components=[img, generated_textbox], value="Clear")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
147 |
|
148 |
ITT_button.click(launch_image_pipe, inputs=[img], outputs=[generated_textbox, audio_output])
|
149 |
# generate_audio_button.click(generate_audio, inputs=[generated_textbox], outputs=[audio_output])
|
|
|
3 |
from transformers import pipeline, VitsModel, AutoTokenizer, set_seed
|
4 |
from huggingface_hub import InferenceClient
|
5 |
from langdetect import detect, DetectorFactory
|
6 |
+ import torch
|
7 |
import uuid
|
8 |
import scipy.io.wavfile as wav
|
9 |
|
|
|
145 |
# generate_audio_button = gr.Button(value="Generate Audio", variant="primary")
|
146 |
audio_output = gr.Audio(type="filepath", label="Generated Speech")
|
147 |
ITT_Clear_button = gr.ClearButton(components=[img, generated_textbox], value="Clear")
|
148 | +
149 | + gr.Examples(
150 | +     examples=[
151 | +         ["lion-dog-costume.jpg"],
152 | +         ["dog-halloween.jpeg"]
153 | +     ],
154 | +     inputs=[img],
155 | +     outputs=[generated_textbox, audio_output],
156 | +     run_on_click=True, cache_examples=True, fn=launch_image_pipe)
|
157 |
|
158 |
ITT_button.click(launch_image_pipe, inputs=[img], outputs=[generated_textbox, audio_output])
|
159 |
# generate_audio_button.click(generate_audio, inputs=[generated_textbox], outputs=[audio_output])
|