morbiwalaq commited on
Commit
f21ef4e
·
verified ·
1 Parent(s): a1e0acd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +49 -42
app.py CHANGED
@@ -1,55 +1,62 @@
 
1
  import gradio as gr
2
- from modelscope.pipelines import pipeline
3
- from modelscope.utils.constant import Tasks
4
 
5
- # Use CogVideo, a publicly available text-to-video model on Hugging Face.
6
- # (Replace 'THUDM/CogVideo-5M' with the correct ID if needed.)
7
- video_model = pipeline(Tasks.text_to_video_synthesis, model='THUDM/CogVideoX-5b')
8
 
9
- def generate_pokemon_anime_video(prompt, style, duration, image):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  """
11
- Generate a Pokémon anime–themed video.
12
- The prompt is enriched with style and context so that the model "imagines"
13
- iconic Pokémon scenes (e.g., Ash, Pikachu, Team Rocket).
 
 
 
14
  """
 
15
  full_prompt = (
16
- f"{prompt}, in {style} style. "
17
  "Include iconic Pokémon elements like Ash, Pikachu, and Team Rocket."
18
  )
19
 
20
- # Prepare inputs for the model.
21
- # (If the model doesn't support image conditioning, the 'image' key may be ignored.)
22
- inputs = {'text': full_prompt, 'duration': duration}
23
- if image:
24
- inputs['image'] = image
25
-
26
- result = video_model(inputs)
27
- return result["output_video"]
28
 
29
- # Build the Gradio UI with dropdown, slider, and file upload.
30
- with gr.Blocks() as iface:
31
  gr.Markdown("# 🎥 PokeVidGen AI")
32
- gr.Markdown(
33
- "Generate Pokémon anime shorts with AI! "
34
- "Enter a scene prompt, select an animation style, set the video duration, and optionally upload an image."
35
- )
36
  with gr.Row():
37
- prompt = gr.Textbox(
38
- label="Enter Pokémon Scene",
39
- placeholder="Ash battles Team Rocket with Pikachu's Thunderbolt"
40
- )
41
- style = gr.Dropdown(
42
- ["Anime Classic", "Modern 3D", "Cartoon"],
43
- label="Animation Style",
44
- value="Anime Classic"
45
- )
46
- duration = gr.Slider(1, 10, step=1, label="Video Duration (Seconds)", value=5)
47
- image = gr.Image(label="Upload an Image (Optional)", type="filepath")
48
- generate_btn = gr.Button("Generate Pokémon Anime Video")
49
- output_video = gr.Video(label="Generated Video")
50
-
51
- generate_btn.click(generate_pokemon_anime_video,
52
- inputs=[prompt, style, duration, image],
53
- outputs=output_video)
54
 
55
- iface.launch()
 
1
+ import torch
2
  import gradio as gr
3
+ from diffusers import CogVideoXPipeline, CogVideoXDPMScheduler, CogVideoXTransformer3DModel
4
+ from huggingface_hub import hf_hub_download, snapshot_download
5
 
6
+ # Set device
7
+ device = "cuda" if torch.cuda.is_available() else "cpu"
 
8
 
9
+ # (Optional) Download additional assets for upscaling or interpolation if needed.
10
+ hf_hub_download(repo_id="ai-forever/Real-ESRGAN", filename="RealESRGAN_x4.pth", local_dir="model_real_esran")
11
+ snapshot_download(repo_id="AlexWortega/RIFE", local_dir="model_rife")
12
+
13
+ # Load the text-to-video model using diffusers' CogVideoXPipeline.
14
+ # (Replace with your model ID if different.)
15
+ pipe = CogVideoXPipeline.from_pretrained("THUDM/CogVideoX-5b", torch_dtype=torch.bfloat16).to(device)
16
+ pipe.scheduler = CogVideoXDPMScheduler.from_config(pipe.scheduler.config, timestep_spacing="trailing")
17
+
18
+ # Optionally load an image-to-video transformer if your pipeline supports image conditioning.
19
+ # (This may be used if you want to condition on an uploaded image.)
20
+ i2v_transformer = CogVideoXTransformer3DModel.from_pretrained(
21
+ "THUDM/CogVideoX-5b-I2V", subfolder="transformer", torch_dtype=torch.bfloat16
22
+ )
23
+
24
+ def generate_video(prompt, style, duration, image):
25
  """
26
+ Generate a Pokémon-themed video.
27
+
28
+ The function "flavors" the text prompt with the chosen style and mentions iconic
29
+ Pokémon elements (e.g. Ash, Pikachu, Team Rocket). The duration (in seconds) is passed
30
+ to the pipeline (if supported). The 'image' input is optional and may be ignored if the
31
+ pipeline does not support image conditioning.
32
  """
33
+ # Build a full prompt by combining user input with style and Pokémon-specific flavor.
34
  full_prompt = (
35
+ f"{prompt}, in {style} style, lasting {duration} seconds. "
36
  "Include iconic Pokémon elements like Ash, Pikachu, and Team Rocket."
37
  )
38
 
39
+ # Generate video (adjust inference parameters as needed)
40
+ result = pipe(full_prompt, num_inference_steps=50, guidance_scale=7.5)
41
+
42
+ # Assuming the pipeline returns a dict with a 'videos' key (a list of generated videos)
43
+ video = result.videos[0]
44
+ return video
 
 
45
 
46
+ # Build the Gradio UI.
47
+ with gr.Blocks() as demo:
48
  gr.Markdown("# 🎥 PokeVidGen AI")
49
+ gr.Markdown("Generate Pokémon anime shorts using CogVideoX-5b! Enter your scene prompt, choose an animation style, set the duration, and optionally upload an image.")
50
+
 
 
51
  with gr.Row():
52
+ prompt_input = gr.Textbox(label="Enter Pokémon Scene", placeholder="Ash battles Team Rocket with Pikachu's Thunderbolt")
53
+ style_input = gr.Dropdown(choices=["Anime Classic", "Modern 3D", "Cartoon"], label="Animation Style", value="Anime Classic")
54
+
55
+ duration_input = gr.Slider(minimum=1, maximum=10, step=1, label="Duration (seconds)", value=5)
56
+ image_input = gr.Image(label="Optional Image", type="filepath")
57
+ generate_button = gr.Button("Generate Video")
58
+ video_output = gr.Video(label="Generated Video")
59
+
60
+ generate_button.click(fn=generate_video, inputs=[prompt_input, style_input, duration_input, image_input], outputs=video_output)
 
 
 
 
 
 
 
 
61
 
62
+ demo.launch()