Spaces:

liruiw
/

hma

Runtime error

App Files Files Community

liruiw committed on Dec 12, 2024

Commit

14420e9

1 Parent(s): f64bf43

fix

Browse files

Files changed (1) hide show

app.py +48 -17

app.py CHANGED Viewed

@@ -1,36 +1,52 @@
 import gradio as gr
 import spaces
 import numpy as np
 from PIL import Image
 import cv2
 from sim.simulator import GenieSimulator
 RES = 512
-image = Image.open("sim/assets/langtable_prompt/frame_06.png")
 genie = GenieSimulator(
     image_encoder_type='temporalvae',
     image_encoder_ckpt='stabilityai/stable-video-diffusion-img2vid',
     quantize=False,
     backbone_type='stmar',
-    backbone_ckpt='data/mar_ckpt/langtable',
-    prompt_horizon=3,
     action_stride=1,
     domain='language_table',
 )
-prompt_image = np.tile(
-    np.array(image), (genie.prompt_horizon, 1, 1, 1)
-).astype(np.uint8)
-prompt_action = np.zeros(
-    (genie.prompt_horizon - 1, genie.action_stride, 2)
-).astype(np.float32)
-genie.set_initial_state((prompt_image, prompt_action))
-image = genie.reset()
-image = cv2.resize(image, (RES, RES))
-image = Image.fromarray(image)
 # Example model: takes a direction and returns a random image
-def model(direction: str, genie=genie):
     if direction == 'right':
         action = np.array([0, 0.05])
     elif direction == 'left':
@@ -52,10 +68,22 @@ def handle_input(direction):
     new_image = model(direction)  # Get a new image from the model
     return new_image
 if __name__ == '__main__':
     with gr.Blocks() as demo:
         with gr.Row():
-            image_display = gr.Image(value=image, type="pil", label="Generated Image")
         with gr.Row():
             up = gr.Button("↑ Up")
         with gr.Row():
@@ -63,10 +91,13 @@ if __name__ == '__main__':
             down = gr.Button("↓ Down")
             right = gr.Button("→ Right")
-        # Define button interactions
         up.click(fn=lambda: handle_input("up"), outputs=image_display, show_progress='hidden')
         down.click(fn=lambda: handle_input("down"), outputs=image_display, show_progress='hidden')
         left.click(fn=lambda: handle_input("left"), outputs=image_display, show_progress='hidden')
         right.click(fn=lambda: handle_input("right"), outputs=image_display, show_progress='hidden')
-    demo.launch()

 import gradio as gr
 import spaces
+import gradio as gr
 import numpy as np
 from PIL import Image
 import cv2
 from sim.simulator import GenieSimulator
+import os
+if not os.path.exists("data/mar_ckpt/langtable"):
+    # download from google drive
+    import gdown
+    gdown.download_folder("https://drive.google.com/drive/u/2/folders/1XU87cRqV-IMZA6RLiabIR_uZngynvUFN")
+    os.system("mkdir -p data/mar_ckpt/; mv langtable data/mar_ckpt/")
 RES = 512
+PROMPT_HORIZON = 3
+IMAGE_DIR = "sim/assets/langtable_prompt/"
+# Load available images
+available_images = sorted([img for img in os.listdir(IMAGE_DIR) if img.endswith(".png")])
 genie = GenieSimulator(
     image_encoder_type='temporalvae',
     image_encoder_ckpt='stabilityai/stable-video-diffusion-img2vid',
     quantize=False,
     backbone_type='stmar',
+    backbone_ckpt='data/mar_ckpt_long2/langtable',
+    prompt_horizon=PROMPT_HORIZON,
     action_stride=1,
     domain='language_table',
 )
+# Helper function to reset GenieSimulator with the selected image
+def initialize_simulator(image_name):
+    image_path = os.path.join(IMAGE_DIR, image_name)
+    image = Image.open(image_path)
+    prompt_image = np.tile(np.array(image), (genie.prompt_horizon, 1, 1, 1)).astype(np.uint8)
+    prompt_action = np.zeros((genie.prompt_horizon - 1, genie.action_stride, 2)).astype(np.float32)
+    genie.set_initial_state((prompt_image, prompt_action))
+    reset_image = genie.reset()
+    reset_image = cv2.resize(reset_image, (RES, RES))
+    return Image.fromarray(reset_image)
 # Example model: takes a direction and returns a random image
+def model(direction: str):
     if direction == 'right':
         action = np.array([0, 0.05])
     elif direction == 'left':
     new_image = model(direction)  # Get a new image from the model
     return new_image
+# Gradio function to handle image selection
+def handle_image_selection(image_name):
+    print(f"User selected image: {image_name}")
+    return initialize_simulator(image_name)
 if __name__ == '__main__':
     with gr.Blocks() as demo:
         with gr.Row():
+            image_selector = gr.Dropdown(
+                choices=available_images, value=available_images[0], label="Select an Image"
+            )
+            select_button = gr.Button("Load Image")
+        with gr.Row():
+            image_display = gr.Image(type="pil", label="Generated Image")
         with gr.Row():
             up = gr.Button("↑ Up")
         with gr.Row():
             down = gr.Button("↓ Down")
             right = gr.Button("→ Right")
+        # Define interactions
+        select_button.click(
+            fn=handle_image_selection, inputs=image_selector, outputs=image_display
+        )
         up.click(fn=lambda: handle_input("up"), outputs=image_display, show_progress='hidden')
         down.click(fn=lambda: handle_input("down"), outputs=image_display, show_progress='hidden')
         left.click(fn=lambda: handle_input("left"), outputs=image_display, show_progress='hidden')
         right.click(fn=lambda: handle_input("right"), outputs=image_display, show_progress='hidden')
+    demo.launch(share=True)