Spaces:

nalin0503
/

Metamorph

Running

App Files Files Community

nalin0503 committed 23 days ago

Commit

963b1a5

1 Parent(s): 9f0a675

Upload code from latest repo

Browse files

Files changed (7) hide show

FILM.py +102 -0
Image-Morpher +1 -1
Makefile +51 -0
app.py +4 -1
metamorphLogo_nobg.png +0 -0
requirements.txt +4 -1
run_morphing.py +248 -0

FILM.py ADDED Viewed

	@@ -0,0 +1,102 @@

+"""
+FILM-based Video Frame Interpolation
+This script uses the FILM (Frame Interpolation for Large Motion) model to generate
+smooth transitions between keyframes, creating a high-quality interpolated video.
+It takes a series of PNG images as input and produces an MP4 video as output.
+The script performs the following main steps:
+1. Loads keyframes from a specified input folder
+2. Preprocesses the images
+3. Applies recursive frame interpolation using the FILM model
+4. Generates a video from the interpolated frames
+5. Saves the output video with a unique timestamp
+Usage:
+Set the 'input_folder' to the directory containing your PNG keyframes
+Set the 'output_folder' to the desired location for the generated video
+Adjust 'fps' and 'num_recursions' parameters as needed
+"""
+import os
+import tensorflow as tf
+import tensorflow_hub as hub
+import cv2
+import numpy as np
+from glob import glob
+from datetime import datetime
+import time
+# Load the FILM model once, at import time (importing this module triggers hub.load).
+model = hub.load('https://tfhub.dev/google/film/1')
+def preprocess_image(image_path):
+    """Load and preprocess an image for the FILM model."""
+    img = tf.io.read_file(image_path)
+    img = tf.image.decode_png(img, channels=3) # remove alpha transparency
+    img = tf.image.convert_image_dtype(img, tf.float32)
+    return img
+class Interpolator:
+    """Wrapper class for the FILM model to perform frame interpolation."""
+    def __init__(self, align=64):
+        self._model = model
+        self._align = align
+    def __call__(self, x0, x1, dt):
+        """Interpolate between two frames at a given time step."""
+        inputs = {'x0': x0, 'x1': x1, 'time': dt[..., np.newaxis]} # Prepare input- 2 frames and timestamp
+        result = self._model(inputs, training=False) # FILM call for interpolated frame
+        return result['image'].numpy()
+def _recursive_generator(frame1, frame2, num_recursions, interpolator):
+    """Recursively generate interpolated frames between two input frames."""
+    if num_recursions == 0:
+        yield frame1 # exit condition
+    else:
+        time = np.full(shape=(1,), fill_value=0.5, dtype=np.float32)
+        mid_frame = interpolator(
+            np.expand_dims(frame1, axis=0), np.expand_dims(frame2, axis=0), time)[0]
+        yield from _recursive_generator(frame1, mid_frame, num_recursions - 1, interpolator) # 1st half
+        yield from _recursive_generator(mid_frame, frame2, num_recursions - 1, interpolator) # 2nd half
+def interpolate_recursively(frames, num_recursions, interpolator):
+    """Apply recursive interpolation to a list of input frames."""
+    n = len(frames)
+    for i in range(1, n):
+        yield from _recursive_generator(frames[i - 1], frames[i], num_recursions, interpolator)
+    yield frames[-1]
+def process_keyframes(input_folder, output_folder, fps=30, num_recursions=3):
+    """Process keyframes to create an interpolated video, using functions above"""
+    keyframes = sorted(glob(os.path.join(input_folder, '*.png')))
+    frames = [preprocess_image(frame).numpy() for frame in keyframes]
+    interpolator = Interpolator()
+    interpolated_frames = list(interpolate_recursively(frames, num_recursions, interpolator))
+    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S") # For unique output..
+    output_video = os.path.join(output_folder, f'output_video_{timestamp}.mp4')
+    # Set up for fusing into a morphing video
+    first_frame = cv2.imread(keyframes[0])
+    height, width, _ = first_frame.shape
+    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+    out = cv2.VideoWriter(output_video, fourcc, fps, (width, height))
+    for frame in interpolated_frames:
+        frame_bgr = cv2.cvtColor((frame * 255).astype(np.uint8), cv2.COLOR_RGB2BGR)
+        out.write(frame_bgr) # writes
+    out.release()
+    print(f'Video created with {len(interpolated_frames)} frames: {output_video}')
+# Usage
+# input_folder = 'sample_keyframes'
+# output_folder = 'FILM_Results'
+# start_time = time.time()
+# process_keyframes(input_folder, output_folder, fps=30, num_recursions=3)
+# end_time = time.time()
+# total_execution_time = end_time - start_time
+# print(f'Total script execution time: {total_execution_time:.2f} seconds')

Image-Morpher CHANGED Viewed

	@@ -1 +1 @@
1	- Subproject commit ~~609232f9b1ecbdf84deaa02865e9ab3065738670~~


1	+ Subproject commit 678bc8264fd301eb17cd1150ee25d44cd5f3dd6b

Makefile ADDED Viewed

	@@ -0,0 +1,51 @@

+# Variables
+# Python interpreter (override with e.g. `make PYTHON=python3`).
+# The comment is on its own line: an inline comment after the value would
+# leave trailing whitespace in the variable.
+PYTHON = python
+MAIN_SCRIPT = run_morphing.py
+OUTPUT_DIR = ./results
+FILM_OUTPUT = ./FILM_Results
+# None of these targets produce a file named after themselves.
+.PHONY: all submodule init morph help
+# Default target: Run the entire morphing pipeline
+all: submodule morph
+# Ensure Git submodules are initialized and updated
+submodule:
+	@echo "Initializing and updating submodules..."
+	git submodule init
+	git submodule sync
+	git submodule update --remote
+# Initialize environment by installing dependencies and (optionally) submodules
+init: submodule
+	@echo "Installing required Python packages..."
+	$(PYTHON) -m pip install -r requirements.txt
+# Run morphing pipeline with FILM
+# (TODO - configure CLI run command to be able to run make morph FRAMES=30 FILM=true)
+morph:
+	$(PYTHON) $(MAIN_SCRIPT) \
+		--image_path_0 ./assets/Trump.jpg \
+		--prompt_0 "A photo of an American man" \
+		--image_path_1 ./assets/Biden.jpg \
+		--prompt_1 "A photo of an American man" \
+		--output_path $(OUTPUT_DIR) \
+		--use_adain \
+		--use_reschedule \
+		--save_inter \
+		--num_frames 16 \
+		--duration 100 \
+		--use_film \
+		--film_output_folder $(FILM_OUTPUT) \
+		--film_fps 30 \
+		--film_num_recursions 3
+### Add more options here later, make install, make init (install reqs)
+# Help message
+help:
+	@echo "Makefile for Image Morphing Project"
+	@echo "Available commands:"
+	@echo "  make           - Initialize submodules and run the entire morphing pipeline"
+	@echo "  make init      - Install dependencies and set up the environment"
+	@echo "  make submodule - Initialize and update Git submodules"
+	@echo "  make morph     - Run the morphing pipeline with FILM"
+	@echo "  make help      - Show this help message"

app.py CHANGED Viewed

@@ -1,3 +1,6 @@
 import os
 import sys
 import subprocess
@@ -114,7 +117,7 @@ def main():
     )
     # ---------------- HEADER & LOGO ----------------
-    logo_path = os.path.join("lcm-lora", "metamorphLogo_nobg.png")
     if os.path.exists(logo_path):
         try:
             logo = Image.open(logo_path)

+"""
+Cleaned up version, Close-to-Final UI features and functionality logic.
+"""
 import os
 import sys
 import subprocess
     )
     # ---------------- HEADER & LOGO ----------------
+    logo_path = "metamorphLogo_nobg.png"
     if os.path.exists(logo_path):
         try:
             logo = Image.open(logo_path)

metamorphLogo_nobg.png ADDED Viewed

requirements.txt CHANGED Viewed

@@ -13,4 +13,7 @@ transformers==4.34.1
 torch
 torchvision
 lpips
-# peft

 torch
 torchvision
 lpips
+# peft
+tensorflow==2.18.0
+tensorflow_hub==0.16.1

run_morphing.py ADDED Viewed

	@@ -0,0 +1,248 @@

+# T.B.C.
+import os
+import sys
+import time
+import subprocess
+import argparse
+from FILM import process_keyframes
+def parse_arguments():
+    parser = argparse.ArgumentParser(
+        description="Orchestrate DiffMorpher || LCM-LoRa || LCM, and FILM for smooth morphing between two images.")
+    # ------------------- KEYFRAME METHOD SELECTION -------------------
+    # TODO multiple methods not supported yet
+    # parser.add_argument(
+    #     "--keyframe_method", type=str, default="diffmorpher",
+    #     choices=["diffmorpher", "lcm_lora", "diffmorpher_lcm"],
+    #     help="Choose which method to use for keyframe generation."
+    # )
+    # i think this would be to select the models. so theres
+    # stable diffusion 2-1 (without lcm)
+    # stable diffusion 1-5 (has lcm support)
+    # dreamshaper 7, fine-tuned 1-5, more glam, (has lcm support)
+    # ------------------- DIFFMORPHER ARGS -------------------
+    parser.add_argument(
+        "--model_path", type=str, default="stabilityai/stable-diffusion-2-1-base", # yeah this needs to be chnaged TODO
+        help="Pretrained model to use for DiffMorpher (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--image_path_0", type=str, required=True,
+        help="Path of the first image"
+    )
+    parser.add_argument(
+        "--prompt_0", type=str, default="",
+        help="Prompt describing the first image (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--image_path_1", type=str, required=True,
+        help="Path of the second image"
+    )
+    parser.add_argument(
+        "--prompt_1", type=str, default="",
+        help="Prompt describing the second image (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--output_path", type=str, default="./results",
+        help="Output folder for DiffMorpher keyframes/gif (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--save_lora_dir", type=str, default="./lora",
+        help="Directory to save LoRA outputs (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--load_lora_path_0", type=str, default="",
+        help="Path to LoRA checkpoint for image 0 (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--load_lora_path_1", type=str, default="",
+        help="Path to LoRA checkpoint for image 1 (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--use_adain", action="store_true",
+        help="Use AdaIN in DiffMorpher pipeline"
+    )
+    parser.add_argument(
+        "--use_reschedule", action="store_true",
+        help="Use reschedule sampling in DiffMorpher"
+    )
+    parser.add_argument(
+        "--lamb", type=float, default=0.6,
+        help="Lambda for self-attention replacement in DiffMorpher (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--fix_lora_value", type=float, default=None,
+        help="Fix LoRA value in DiffMorpher (default: LoRA interpolation)"
+    )
+    parser.add_argument(
+        "--save_inter", action="store_true",
+        help="Save intermediate frames as individual images (e.g. .png) in DiffMorpher"
+    )
+    parser.add_argument(
+        "--num_frames", type=int, default=16,
+        help="Number of keyframes to generate (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--duration", type=int, default=100,
+        help="Duration of each keyframe in the final .gif (default: %(default)s ms)"
+    )
+    parser.add_argument(
+        "--no_lora", action="store_true",
+        help="Disable LoRA usage in DiffMorpher"
+    )
+    # ------------------- FILM ARGS -------------------
+    parser.add_argument(
+        "--use_film", action="store_true",
+        help="Flag to indicate whether to run FILM after generating keyframes"
+    )
+    parser.add_argument(
+        "--film_input_folder", type=str, default="",
+        help="Folder containing keyframes for FILM. If empty, will use DiffMorpher output folder."
+    )
+    parser.add_argument(
+        "--film_output_folder", type=str, default="./FILM_Results",
+        help="Folder where FILM’s final interpolated video is saved (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--film_fps", type=int, default=40,
+        help="FPS for the final video - 'Pseudo-Playback-Speed', since total frames are same (default: %(default)s)"
+    )
+    parser.add_argument(
+        "--film_num_recursions", type=int, default=3,
+        help="Number of recursive interpolations to perform in FILM (default: %(default)s)"
+    )
+    return parser.parse_args()
+def run_diffmorpher(args):
+    """
+    Calls DiffMorpher's main.py via subprocess using the CLI arguments.
+    Expects `DiffMorpher/` to be a submodule in the current repo.
+    """
+    diffmorpher_script = os.path.join("DiffMorpher", "main.py")
+    cmd = [
+        sys.executable, diffmorpher_script,
+        "--model_path", args.model_path,
+        "--image_path_0", args.image_path_0,
+        "--prompt_0", args.prompt_0,
+        "--image_path_1", args.image_path_1,
+        "--prompt_1", args.prompt_1,
+        "--output_path", args.output_path,
+        "--save_lora_dir", args.save_lora_dir,
+        "--lamb", str(args.lamb),
+        "--num_frames", str(args.num_frames),
+        "--duration", str(args.duration),
+    ]
+    if args.load_lora_path_0:
+        cmd += ["--load_lora_path_0", args.load_lora_path_0]
+    if args.load_lora_path_1:
+        cmd += ["--load_lora_path_1", args.load_lora_path_1]
+    if args.use_adain:
+        cmd.append("--use_adain")
+    if args.use_reschedule:
+        cmd.append("--use_reschedule")
+    if args.fix_lora_value is not None:
+        cmd += ["--fix_lora_value", str(args.fix_lora_value)]
+    if args.save_inter:
+        cmd.append("--save_inter")
+    if args.no_lora:
+        cmd.append("--no_lora")
+    print("[INFO] Running DiffMorpher with command:")
+    print(" ".join(cmd))
+    start = time.time()
+    subprocess.run(cmd, check=True)
+    end = time.time()
+    print(f"[INFO] DiffMorpher completed in {end - start:.2f} seconds.")
+def run_lcm_lora(args):
+    """
+    Run the LCM-LoRA accelerated Keyframe generator
+    """
+    # THIS would be a flag passed to diffmorpher instead.
+    pass
+def create_simple_video_from_keyframes(keyframes_folder, output_folder, fps=40):
+    """
+    If the user does NOT want FILM, we still make a basic video from keyframes.
+    Assumes frames are saved as .png or .jpg in keyframes_folder.
+    """
+    import cv2
+    from glob import glob
+    import os
+    from datetime import datetime
+    os.makedirs(output_folder, exist_ok=True)
+    images = sorted(glob(os.path.join(keyframes_folder, "*.png")))
+    if not images:
+        images = sorted(glob(os.path.join(keyframes_folder, "*.jpg")))
+    if not images:
+        print(f"[WARN] No .png or .jpg frames found in {keyframes_folder}.")
+        return
+    # Prepare video writer
+    first_frame = cv2.imread(images[0])
+    height, width, _ = first_frame.shape
+    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+    out_video_path = os.path.join(output_folder, f"simple_morph_{timestamp}.mp4")
+    out = cv2.VideoWriter(out_video_path, fourcc, fps, (width, height))
+    for img_path in images:
+        frame = cv2.imread(img_path)
+        out.write(frame)
+    out.release()
+    print(f"[INFO] Basic morphing video saved at: {out_video_path}")
+def main():
+    args = parse_arguments()
+    overall_start_time = time.time()
+    # 1) Run DiffMorpher to generate keyframes
+    run_diffmorpher(args)
+    # 2) Determine the folder containing the keyframes
+    # If user didn’t explicitly give `--film_input_folder`, use `args.output_path`
+    keyframes_folder = args.film_input_folder if args.film_input_folder else args.output_path
+    # 3) If user wants to use FILM, perform high-quality interpolation on the keyframes
+    if args.use_film:
+        print("[INFO] Running FILM to enhance the keyframes...")
+        start_film_time = time.time()
+        # from FILM.py:
+        process_keyframes(
+            input_folder=keyframes_folder,
+            output_folder=args.film_output_folder,
+            fps=args.film_fps,
+            num_recursions=args.film_num_recursions
+        )
+        end_film_time = time.time()
+        print(f"[INFO] FILM interpolation completed in {end_film_time - start_film_time:.2f} seconds.")
+    else:
+        # 4) If user does NOT want FILM, create a simple .mp4 from the keyframes
+        print("[INFO] Skipping FILM interpolation. Creating a basic video from DiffMorpher keyframes...")
+        create_simple_video_from_keyframes(
+            keyframes_folder=keyframes_folder,
+            output_folder=args.film_output_folder,
+            fps=args.film_fps
+        )
+    # 5) Print total execution time
+    overall_end_time = time.time()
+    print(f"[INFO] Entire pipeline completed in {overall_end_time - overall_start_time:.2f} seconds.")
+if __name__ == "__main__":
+    main()