# Hugging Face Spaces status shown for this app: Runtime error
import os | |
import gradio as gr | |
from transformers import pipeline | |
from IPython.display import Audio as IPythonAudio | |
# Captioning pipeline: produces text for an image using the checkpoint below.
pipe = pipeline(
    task="image-to-text",
    model="Salesforce/blip-image-captioning-base",
)
# Speech pipeline: synthesizes audio for a text string using the checkpoint
# below.
tts_pipe = pipeline(
    task="text-to-speech",
    model="kakao-enterprise/vits-ljs",
)
def launch(input):
    """Caption an image and synthesize the caption as speech.

    Args:
        input: The image to caption, passed straight to the captioning
            pipeline. ``None`` is treated as "no image provided". The name
            shadows the ``input`` builtin but is kept so existing callers
            that pass it by keyword continue to work.

    Returns:
        A 2-tuple ``(caption, (sampling_rate, audio))`` where ``caption`` is
        the ``'generated_text'`` of the first captioning result and the inner
        tuple is built from the speech pipeline's ``"sampling_rate"`` and the
        first element of its ``"audio"`` entry.

    Raises:
        gr.Error: If ``input`` is ``None``.
    """
    if input is None:
        # Fail early with a readable message instead of forwarding None to
        # the captioning pipeline and surfacing an opaque error.
        raise gr.Error("Please provide an image to caption.")

    caption = pipe(input)[0]['generated_text']
    speech = tts_pipe(caption)
    # NOTE(review): indexing "audio" with [0] presumably drops a leading
    # batch/channel axis to leave a 1-D waveform -- confirm against the
    # installed transformers version.
    waveform = speech["audio"][0]
    return caption, (speech["sampling_rate"], waveform)
# Web UI wiring: a single image input handed to `launch` as a PIL image, and
# two outputs -- a text component and an audio component -- matching the
# two values `launch` returns.
iface = gr.Interface(
    fn=launch,
    inputs=gr.Image(type='pil'),
    outputs=["text", "audio"],
)
# Start serving the interface as soon as this module is executed.
iface.launch()