Anything2Image / app.py
laizeqiang
update
e4a59ce
import os
import gradio as gr
from anything2image.api import Anything2Image
anything2img = Anything2Image(imagebind_download_dir='checkpoints')
with gr.Blocks() as demo:
gr.HTML(
"""
<div align='center'> <h1>Anything To Image </h1> </div>
<p align="center"> Generate image from anything with ImageBind's unified latent space and stable-diffusion-2-1-unclip. </p>
<p align="center"><a href="https://github.com/Zeqiang-Lai/Anything2Image"><b>https://github.com/Zeqiang-Lai/Anything2Image</b></p>
"""
)
with gr.Tab('Audio to Image'):
wav_dir = 'assets/wav'
def audio2image(audio): return anything2img(audio=audio)
gr.Interface(
fn=audio2image,
inputs="audio",
outputs="image",
examples=[os.path.join(wav_dir, name) for name in os.listdir(wav_dir)],
)
with gr.Tab('Audio+Text to Image'):
wav_dir = 'assets/wav'
def audiotext2image(prompt, audio): return anything2img(prompt=prompt, audio=audio)
gr.Interface(
fn=audiotext2image,
inputs=["text","audio"],
outputs="image",
examples=[
['A painting', 'assets/wav/cat.wav'],
['A photo', 'assets/wav/cat.wav'],
['A painting', 'assets/wav/dog_audio.wav'],
['A photo', 'assets/wav/dog_audio.wav'],
],
)
with gr.Tab('Audio+Image to Image'):
wav_dir = 'assets/wav'
def audioimage2image(audio, image): return anything2img(image=image, audio=audio)
gr.Interface(
fn=audioimage2image,
inputs=["audio","image"],
outputs="image",
examples=[
['assets/wav/wave.wav', 'assets/image/bird.png'],
['assets/wav/wave.wav', 'assets/image/dog_image.jpg'],
['assets/wav/wave.wav', 'assets/image/room.png'],
['assets/wav/rain.wav', 'assets/image/room.png'],
],
)
with gr.Tab('Image to Image'):
image_dir = 'assets/image'
def image2image(image): return anything2img(image=image)
gr.Interface(
fn=image2image,
inputs=["image"],
outputs="image",
examples=[os.path.join(image_dir, name) for name in os.listdir(image_dir)],
)
with gr.Tab('Text to Image'):
def text2image(text): return anything2img(text=text)
gr.Interface(
fn=text2image,
inputs=["text"],
outputs="image",
examples=['A sunset over the ocean.',
'A photo of a car',
"A bird's-eye view of a cityscape.",
"A close-up of a flower."],
)
with gr.Tab('Text+Any to Image'):
def textany2image(prompt, image, audio): return anything2img(prompt=prompt, image=image, audio=audio)
gr.Interface(
fn=textany2image,
inputs=["text", "image", "audio"],
outputs="image",
examples=[['A painting.', 'assets/image/bird.png', 'assets/wav/wave.wav']],
)
demo.queue(1).launch()