Commit 0431fa9 (1 parent: de828f6) committed by jbilcke-hf (HF Staff)

improving the preview_tab

vms/ui/project/services/previewing.py CHANGED
@@ -85,10 +85,17 @@ class PreviewingService:
             # Return updated log string for UI updates
             return "\n".join(log_messages)
 
-        # Find latest LoRA weights
-        lora_path = self.find_latest_lora_weights()
-        if not lora_path:
-            return None, "Error: No LoRA weights found", log("Error: No LoRA weights found in output directory")
+        # Find latest LoRA weights if lora_weight > 0
+        lora_path = None
+        using_lora = lora_weight > 0
+
+        if using_lora:
+            lora_path = self.find_latest_lora_weights()
+            if not lora_path:
+                return None, "Error: No LoRA weights found", log("Error: No LoRA weights found in output directory")
+            log(f"Using LoRA weights with weight {lora_weight}")
+        else:
+            log("Using original model without LoRA weights")
 
         # Add prefix to prompt
         if prompt_prefix and not prompt.startswith(prompt_prefix):
@@ -143,12 +150,13 @@ class PreviewingService:
 
         log(f"Generating video with model type: {internal_model_type}")
         log(f"Using model version: {model_version}")
-        log(f"Using LoRA weights from: {lora_path}")
+        if using_lora and lora_path:
+            log(f"Using LoRA weights from: {lora_path}")
         log(f"Resolution: {width}x{height}, Frames: {num_frames}, FPS: {fps}")
-        log(f"Guidance Scale: {guidance_scale}, Flow Shift: {flow_shift}, LoRA Weight: {lora_weight}")
+        log(f"Guidance Scale: {guidance_scale}, Flow Shift: {flow_shift}, LoRA Weight: {lora_weight if using_lora else 0}")
         log(f"Generation Seed: {seed}")
-        log(f"Prompt: {full_prompt}")
-        log(f"Negative Prompt: {negative_prompt}")
+        #log(f"Prompt: {full_prompt}")
+        #log(f"Negative Prompt: {negative_prompt}")
 
         # Import required components based on model type
         if internal_model_type == "wan":
@@ -246,11 +254,14 @@ class PreviewingService:
             log_fn("Enabling model CPU offload...")
             pipe.enable_model_cpu_offload()
 
-        log_fn(f"Loading LoRA weights from {lora_path} with weight {lora_weight}...")
-        pipe.load_lora_weights(lora_path)
-
-        # TODO: Set the lora scale directly instead of using fuse_lora
-        #pipe._lora_scale = lora_weight
+        # Apply LoRA weights if using them
+        if lora_weight > 0 and lora_path:
+            log_fn(f"Loading LoRA weights from {lora_path} with weight {lora_weight}...")
+            pipe.load_lora_weights(lora_path)
+            # TODO: Set the lora scale directly instead of using fuse_lora
+            #pipe._lora_scale = lora_weight
+        else:
+            log_fn("Using base model without LoRA weights")
 
         # Create temporary file for the output
         with tempfile.NamedTemporaryFile(suffix='.mp4', delete=False) as temp_file:
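Note on the TODO above: with a diffusers build whose LoRA support runs on the PEFT backend, the scale can be applied through the adapter API instead of fusing. A minimal sketch, not part of this commit (the adapter name "preview_lora" is illustrative):

    # Sketch only: apply the LoRA scale via the adapter API instead of
    # fusing; assumes a diffusers version with PEFT-backed LoRA loading.
    pipe.load_lora_weights(lora_path, adapter_name="preview_lora")
    pipe.set_adapters(["preview_lora"], adapter_weights=[lora_weight])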
@@ -371,9 +382,13 @@ class PreviewingService:
             log_fn("Enabling model CPU offload...")
             pipe.enable_model_cpu_offload()
 
-        log_fn(f"Loading LoRA weights from {lora_path} with weight {lora_weight}...")
-        pipe.load_lora_weights(lora_path)
-        pipe.fuse_lora(lora_weight)
+        # Apply LoRA weights if using them
+        if lora_weight > 0 and lora_path:
+            log_fn(f"Loading LoRA weights from {lora_path} with weight {lora_weight}...")
+            pipe.load_lora_weights(lora_path)
+            pipe.fuse_lora(lora_weight)
+        else:
+            log_fn("Using base model without LoRA weights")
 
         # Create temporary file for the output
         with tempfile.NamedTemporaryFile(suffix='.mp4', delete=False) as temp_file:
@@ -488,9 +503,13 @@ class PreviewingService:
             log_fn("Enabling model CPU offload...")
             pipe.enable_model_cpu_offload()
 
-        log_fn(f"Loading LoRA weights from {lora_path} with weight {lora_weight}...")
-        pipe.load_lora_weights(lora_path)
-        pipe.fuse_lora(lora_weight)
+        # Apply LoRA weights if using them
+        if lora_weight > 0 and lora_path:
+            log_fn(f"Loading LoRA weights from {lora_path} with weight {lora_weight}...")
+            pipe.load_lora_weights(lora_path)
+            pipe.fuse_lora(lora_weight)
+        else:
+            log_fn("Using base model without LoRA weights")
 
         # Create temporary file for the output
         with tempfile.NamedTemporaryFile(suffix='.mp4', delete=False) as temp_file:
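One caveat on the two hunks above: in recent diffusers releases the fuse scale is the lora_scale keyword, and fuse_lora's first positional parameter is not the scale, so pipe.fuse_lora(lora_weight) may bind the weight to the wrong argument. A minimal sketch of the explicit form, assuming such a diffusers version:

    # Sketch only: pass the scale by keyword so it cannot bind to another
    # fuse_lora parameter.
    pipe.load_lora_weights(lora_path)
    pipe.fuse_lora(lora_scale=lora_weight)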
 
vms/ui/project/tabs/preview_tab.py CHANGED
@@ -52,13 +52,15 @@ class PreviewTab(BaseTab):
             value=DEFAULT_PROMPT_PREFIX
         )
 
+        # Ensure seed is interactive with a slider
         self.components["seed"] = gr.Slider(
             label="Generation Seed (-1 for random)",
             minimum=-1,
             maximum=2147483647,  # 2^31 - 1
             step=1,
             value=-1,
-            info="Set to -1 for random seed or specific value for reproducible results"
+            info="Set to -1 for random seed or specific value for reproducible results",
+            interactive=True
         )
 
         with gr.Row():
@@ -81,6 +83,24 @@ class PreviewTab(BaseTab):
             value=self.get_default_model_version(default_model)
         )
 
+        # Add dropdown to choose between LoRA and original model
+        has_lora = self.check_lora_model_exists()
+        lora_choices = []
+        default_lora_choice = ""
+
+        if has_lora:
+            lora_choices = ["Use LoRA model", "Use original model"]
+            default_lora_choice = "Use LoRA model"
+        else:
+            lora_choices = ["Cannot find LoRA model", "Use original model"]
+            default_lora_choice = "Use original model"
+
+        self.components["use_lora"] = gr.Dropdown(
+            choices=lora_choices,
+            label="Model Selection",
+            value=default_lora_choice
+        )
+
         # Add image input for image-to-video models
         self.components["conditioning_image"] = gr.Image(
             label="Conditioning Image (for Image-to-Video models)",
@@ -148,7 +168,8 @@ class PreviewTab(BaseTab):
             minimum=0.0,
             maximum=1.0,
             step=0.01,
-            value=0.7
+            value=0.7,
+            visible=has_lora  # Only visible if using LoRA
         )
 
         self.components["inference_steps"] = gr.Slider(
@@ -156,12 +177,12 @@ class PreviewTab(BaseTab):
             minimum=1,
             maximum=100,
             step=1,
-            value=30
+            value=20
         )
 
         self.components["enable_cpu_offload"] = gr.Checkbox(
             label="Enable Model CPU Offload (for low-VRAM GPUs)",
-            value=True
+            value=False  # let's assume user is using a video model training rig with a good GPU
         )
 
         self.components["generate_btn"] = gr.Button(
@@ -184,10 +205,37 @@ class PreviewTab(BaseTab):
         self.components["log"] = gr.TextArea(
             label="Generation Log",
             interactive=False,
-            lines=15
+            lines=20
         )
 
         return tab
+
+    def check_lora_model_exists(self) -> bool:
+        """Check if any LoRA model files exist in the output directory"""
+        # Look for the standard LoRA weights file
+        lora_path = OUTPUT_PATH / "pytorch_lora_weights.safetensors"
+        if lora_path.exists():
+            return True
+
+        # If not found in the expected location, try to find in checkpoints
+        checkpoints = list(OUTPUT_PATH.glob("checkpoint-*"))
+        if not checkpoints:
+            return False
+
+        for checkpoint in checkpoints:
+            lora_path = checkpoint / "pytorch_lora_weights.safetensors"
+            if lora_path.exists():
+                return True
+
+        return False
+
+    def update_lora_ui(self, use_lora_value: str) -> Dict[str, Any]:
+        """Update UI based on LoRA selection"""
+        is_using_lora = "Use LoRA model" in use_lora_value
+
+        return {
+            self.components["lora_weight"]: gr.Slider(visible=is_using_lora)
+        }
 
     def get_model_version_choices(self, model_type: str) -> List[str]:
         """Get model version choices based on model type"""
@@ -325,6 +373,13 @@ class PreviewTab(BaseTab):
             ]
         )
 
+        # Connect LoRA selection dropdown to update LoRA weight visibility
+        self.components["use_lora"].change(
+            fn=self.update_lora_ui,
+            inputs=[self.components["use_lora"]],
+            outputs=[self.components["lora_weight"]]
+        )
+
         # Load preview UI state when the tab is selected
         if hasattr(self.app, 'tabs_component') and self.app.tabs_component is not None:
             self.app.tabs_component.select(
@@ -343,7 +398,9 @@ class PreviewTab(BaseTab):
                     self.components["lora_weight"],
                     self.components["inference_steps"],
                     self.components["enable_cpu_offload"],
-                    self.components["model_version"]
+                    self.components["model_version"],
+                    self.components["seed"],
+                    self.components["use_lora"]
                 ]
             )
 
@@ -351,7 +408,7 @@ class PreviewTab(BaseTab):
         for component_name in [
             "prompt", "negative_prompt", "prompt_prefix", "model_version", "resolution_preset",
             "width", "height", "num_frames", "fps", "guidance_scale", "flow_shift",
-            "lora_weight", "inference_steps", "enable_cpu_offload"
+            "lora_weight", "inference_steps", "enable_cpu_offload", "seed", "use_lora"
         ]:
             if component_name in self.components:
                 self.components[component_name].change(
@@ -378,7 +435,9 @@ class PreviewTab(BaseTab):
                 self.components["inference_steps"],
                 self.components["enable_cpu_offload"],
                 self.components["fps"],
-                self.components["conditioning_image"]
+                self.components["conditioning_image"],
+                self.components["seed"],
+                self.components["use_lora"]
             ],
             outputs=[
                 self.components["preview_video"],
@@ -444,6 +503,26 @@ class PreviewTab(BaseTab):
             if model_version not in model_version_choices and model_version_choices:
                 model_version = model_version_choices[0]
 
+            # Check if LoRA exists and set appropriate dropdown options
+            has_lora = self.check_lora_model_exists()
+            use_lora = preview_state.get("use_lora", "")
+
+            # Validate use_lora value against current state
+            if has_lora:
+                valid_choices = ["Use LoRA model", "Use original model"]
+                if use_lora not in valid_choices:
+                    use_lora = "Use LoRA model"  # Default when LoRA exists
+            else:
+                valid_choices = ["Cannot find LoRA model", "Use original model"]
+                if use_lora not in valid_choices:
+                    use_lora = "Use original model"  # Default when no LoRA
+
+            # Update the dropdown choices in the UI
+            try:
+                self.components["use_lora"].choices = valid_choices
+            except Exception as e:
+                logger.error(f"Failed to update use_lora choices: {e}")
+
             return (
                 preview_state.get("prompt", ""),
                 preview_state.get("negative_prompt", "worst quality, low quality, blurry, jittery, distorted, ugly, deformed, disfigured, messy background"),
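One caveat on the try/except in the hunk above: assigning to a component's .choices after the Blocks app is built does not normally propagate to an already-rendered browser session in Gradio; the documented route is to return an update for the dropdown from a handler that lists it in its outputs. A minimal sketch with a hypothetical helper, not part of this commit:

    import gradio as gr

    def refresh_use_lora_dropdown(has_lora: bool, saved_value: str):
        """Sketch only: rebuild the dropdown options as a Gradio update."""
        choices = (["Use LoRA model", "Use original model"] if has_lora
                   else ["Cannot find LoRA model", "Use original model"])
        default = "Use LoRA model" if has_lora else "Use original model"
        value = saved_value if saved_value in choices else default
        return gr.update(choices=choices, value=value)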
@@ -457,7 +536,9 @@ class PreviewTab(BaseTab):
                 preview_state.get("lora_weight", 0.7),
                 preview_state.get("inference_steps", 30),
                 preview_state.get("enable_cpu_offload", True),
-                model_version
+                model_version,
+                preview_state.get("seed", -1),
+                use_lora
             )
         except Exception as e:
             logger.error(f"Error loading preview state: {e}")
@@ -467,7 +548,9 @@ class PreviewTab(BaseTab):
                 "worst quality, low quality, blurry, jittery, distorted, ugly, deformed, disfigured, messy background",
                 DEFAULT_PROMPT_PREFIX,
                 832, 480, 49, 16, 5.0, 3.0, 0.7, 30, True,
-                self.get_default_model_version(self.get_default_model_type())
+                self.get_default_model_version(self.get_default_model_type()),
+                -1,
+                "Use original model" if not self.check_lora_model_exists() else "Use LoRA model"
             )
 
     def save_preview_state_value(self, value: Any) -> None:
@@ -522,7 +605,9 @@ class PreviewTab(BaseTab):
         inference_steps: int,
         enable_cpu_offload: bool,
         fps: int,
-        conditioning_image: Optional[str] = None
+        conditioning_image: Optional[str] = None,
+        seed: int = -1,
+        use_lora: str = "Use LoRA model"
     ) -> Tuple[Optional[str], str, str]:
         """Handler for generate button click, delegates to preview service"""
         # Save all the parameters to preview state before generating
@@ -550,7 +635,9 @@ class PreviewTab(BaseTab):
             "flow_shift": flow_shift,
             "lora_weight": lora_weight,
             "inference_steps": inference_steps,
-            "enable_cpu_offload": enable_cpu_offload
+            "enable_cpu_offload": enable_cpu_offload,
+            "seed": seed,
+            "use_lora": use_lora
         }
 
         state["preview"] = preview_state
@@ -564,7 +651,13 @@ class PreviewTab(BaseTab):
         # Initial UI update
        video_path, status, log = None, "Initializing generation...", "Starting video generation process..."
 
+        # Set lora_path to None if not using LoRA
+        use_lora_model = use_lora == "Use LoRA model"
+
         # Start actual generation
+        # If not using LoRA, set lora_weight to 0 to disable it
+        effective_lora_weight = lora_weight if use_lora_model else 0.0
+
         result = self.app.previewing.generate_video(
             model_type=model_type,
             model_version=model_version_id,
@@ -576,11 +669,12 @@ class PreviewTab(BaseTab):
             num_frames=num_frames,
             guidance_scale=guidance_scale,
             flow_shift=flow_shift,
-            lora_weight=lora_weight,
+            lora_weight=effective_lora_weight,  # Use 0.0 if not using LoRA
             inference_steps=inference_steps,
             enable_cpu_offload=enable_cpu_offload,
             fps=fps,
-            conditioning_image=conditioning_image
+            conditioning_image=conditioning_image,
+            seed=seed
         )
 
         # Return final result
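The handler now forwards seed to the service; how the service consumes it is not shown in this diff. Presumably -1 (the slider's random sentinel) maps to a fresh random seed while any other value seeds the generator, along these lines:

    import torch

    def make_generator(seed: int, device: str = "cuda") -> torch.Generator:
        """Sketch only: -1 means random, anything else is reproducible."""
        if seed == -1:
            seed = torch.seed() % (2**31)  # draw a fresh seed within the slider range
        generator = torch.Generator(device=device)
        generator.manual_seed(seed)
        return generator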
 