DenseAV

Runtime error

mhamilton723 committed on Jun 12, 2024

Commit

bb26736

verified ·

1 Parent(s): 1b98c12

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,21 +11,19 @@ from PIL import Image
 from featup.util import norm
 from torchaudio.functional import resample
 from denseav.plotting import plot_attention_video, plot_2head_attention_video, plot_feature_video
 from denseav.shared import norm, crop_to_divisor, blur_dim
 from os.path import join
 if __name__ == "__main__":
-    mode = "hf2"
     if mode == "local":
         sample_videos_dir = "samples"
     else:
         os.environ['TORCH_HOME'] = '/tmp/.cache'
-        os.environ['HF_HOME'] = '/tmp/.cache'
-        os.environ['HF_DATASETS_CACHE'] = '/tmp/.cache'
-        os.environ['TRANSFORMERS_CACHE'] = '/tmp/.cache'
         os.environ['GRADIO_EXAMPLES_CACHE'] = '/tmp/gradio_cache'
         sample_videos_dir = "/tmp/samples"
@@ -59,7 +57,7 @@ if __name__ == "__main__":
             print(f"{filename} already exists. Skipping download.")
     csv.field_size_limit(100000000)
-    options = ['language', "sound_and_language", "sound"]
     load_size = 224
     plot_size = 224
@@ -71,7 +69,7 @@ if __name__ == "__main__":
                              height=480)
     video_output3 = gr.Video(label="Visual Features", height=480)
-    models = {o: torch.hub.load("mhamilton723/DenseAV", o) for o in options}
     def process_video(video, model_option):

 from featup.util import norm
 from torchaudio.functional import resample
+from denseav.train import LitAVAligner
 from denseav.plotting import plot_attention_video, plot_2head_attention_video, plot_feature_video
 from denseav.shared import norm, crop_to_divisor, blur_dim
 from os.path import join
 if __name__ == "__main__":
+    mode = "hf"
     if mode == "local":
         sample_videos_dir = "samples"
     else:
         os.environ['TORCH_HOME'] = '/tmp/.cache'
         os.environ['GRADIO_EXAMPLES_CACHE'] = '/tmp/gradio_cache'
         sample_videos_dir = "/tmp/samples"
             print(f"{filename} already exists. Skipping download.")
     csv.field_size_limit(100000000)
+    options = ['language', "sound-language", "sound"]
     load_size = 224
     plot_size = 224
                              height=480)
     video_output3 = gr.Video(label="Visual Features", height=480)
+    models = {o: LitAVAligner.from_pretrained(f"mhamilton723/DenseAV-{o}") for o in options}
     def process_video(video, model_option):