Spaces:
Runtime error
Runtime error
import gradio as gr | |
import imageio | |
import torch | |
from diffusers import TextToVideoZeroPipeline | |
from video_diffusion.tuneavideo.util import save_videos_grid | |
from video_diffusion.utils.model_list import stable_model_list | |
class ZeroShotText2VideoGenerator: | |
def __init__(self): | |
self.pipe = None | |
def load_model(self, model_id): | |
if self.pipe is None: | |
self.pipe = TextToVideoZeroPipeline.from_pretrained(model_id, torch_dtype=torch.float16).to("cuda") | |
self.pipe.to("cuda") | |
self.pipe.enable_xformers_memory_efficient_attention() | |
self.pipe.enable_attention_slicing() | |
return self.pipe | |
def generate_video( | |
self, | |
prompt, | |
negative_prompt, | |
model_id, | |
height, | |
width, | |
video_length, | |
guidance_scale, | |
fps, | |
t0, | |
t1, | |
motion_field_strength_x, | |
motion_field_strength_y, | |
): | |
pipe = self.load_model(model_id) | |
result = pipe( | |
prompt=prompt, | |
negative_prompt=negative_prompt, | |
height=height, | |
width=width, | |
video_length=video_length, | |
guidance_scale=guidance_scale, | |
t0=t0, | |
t1=t1, | |
motion_field_strength_x=motion_field_strength_x, | |
motion_field_strength_y=motion_field_strength_y, | |
).images | |
result = [(r * 255).astype("uint8") for r in result] | |
imageio.mimsave("video.mp4", result, fps=fps) | |
return "video.mp4" | |
def app(): | |
with gr.Blocks(): | |
with gr.Row(): | |
with gr.Column(): | |
zero_shot_text2video_prompt = gr.Textbox( | |
lines=1, | |
placeholder="Prompt", | |
show_label=False, | |
) | |
zero_shot_text2video_negative_prompt = gr.Textbox( | |
lines=1, | |
placeholder="Negative Prompt", | |
show_label=False, | |
) | |
zero_shot_text2video_model_id = gr.Dropdown( | |
choices=stable_model_list, | |
label="Stable Model List", | |
value=stable_model_list[0], | |
) | |
with gr.Row(): | |
with gr.Column(): | |
zero_shot_text2video_guidance_scale = gr.Slider( | |
label="Guidance Scale", | |
minimum=1, | |
maximum=15, | |
step=1, | |
value=7.5, | |
) | |
zero_shot_text2video_video_length = gr.Slider( | |
label="Video Length", | |
minimum=1, | |
maximum=100, | |
step=1, | |
value=10, | |
) | |
zero_shot_text2video_t0 = gr.Slider( | |
label="Timestep T0", | |
minimum=0, | |
maximum=100, | |
step=1, | |
value=44, | |
) | |
zero_shot_text2video_motion_field_strength_x = gr.Slider( | |
label="Motion Field Strength X", | |
minimum=0, | |
maximum=100, | |
step=1, | |
value=12, | |
) | |
zero_shot_text2video_fps = gr.Slider( | |
label="Fps", | |
minimum=1, | |
maximum=60, | |
step=1, | |
value=10, | |
) | |
with gr.Row(): | |
with gr.Column(): | |
zero_shot_text2video_height = gr.Slider( | |
label="Height", | |
minimum=128, | |
maximum=1280, | |
step=32, | |
value=512, | |
) | |
zero_shot_text2video_width = gr.Slider( | |
label="Width", | |
minimum=128, | |
maximum=1280, | |
step=32, | |
value=512, | |
) | |
zero_shot_text2video_t1 = gr.Slider( | |
label="Timestep T1", | |
minimum=0, | |
maximum=100, | |
step=1, | |
value=47, | |
) | |
zero_shot_text2video_motion_field_strength_y = gr.Slider( | |
label="Motion Field Strength Y", | |
minimum=0, | |
maximum=100, | |
step=1, | |
value=12, | |
) | |
zero_shot_text2video_button = gr.Button(value="Generator") | |
with gr.Column(): | |
zero_shot_text2video_output = gr.Video(label="Output") | |
zero_shot_text2video_button.click( | |
fn=ZeroShotText2VideoGenerator().generate_video, | |
inputs=[ | |
zero_shot_text2video_prompt, | |
zero_shot_text2video_negative_prompt, | |
zero_shot_text2video_model_id, | |
zero_shot_text2video_height, | |
zero_shot_text2video_width, | |
zero_shot_text2video_video_length, | |
zero_shot_text2video_guidance_scale, | |
zero_shot_text2video_fps, | |
zero_shot_text2video_t0, | |
zero_shot_text2video_t1, | |
zero_shot_text2video_motion_field_strength_x, | |
zero_shot_text2video_motion_field_strength_y, | |
], | |
outputs=zero_shot_text2video_output, | |
) | |