Jiaqi-hkust committed on
Commit
d38bd7b
·
verified ·
1 Parent(s): b2ed81d

Update hawk/models/video_llama.py

Browse files
Files changed (1) hide show
  1. hawk/models/video_llama.py +4 -4
hawk/models/video_llama.py CHANGED
@@ -403,11 +403,11 @@ class VideoLLAMA(Blip2Base):
403
 
404
  def encode_videoQformer_visual(self, image, motion=False):
405
  if motion is False:
406
- device = image.device
407
 
408
  # input shape b,c,t,h,w
409
  batch_size,_,time_length,_,_ = image.size()
410
- image = einops.rearrange(image, 'b c t h w -> (b t) c h w')
411
  with self.maybe_autocast():
412
 
413
  # embed image features with blip2, out: (b t) q h
@@ -454,12 +454,12 @@ class VideoLLAMA(Blip2Base):
454
 
455
  else:
456
  # Motion Encoder
457
- device = image.device
458
 
459
  # input shape b,c,t,h,w
460
  batch_size,_,time_length,_,_ = image.size()
461
 
462
- image = einops.rearrange(image, 'b c t h w -> (b t) c h w')
463
 
464
  with self.maybe_autocast():
465
 
 
403
 
404
  def encode_videoQformer_visual(self, image, motion=False):
405
  if motion is False:
406
+ device = "cuda:0"
407
 
408
  # input shape b,c,t,h,w
409
  batch_size,_,time_length,_,_ = image.size()
410
+ image = einops.rearrange(image, 'b c t h w -> (b t) c h w').to(device)
411
  with self.maybe_autocast():
412
 
413
  # embed image features with blip2, out: (b t) q h
 
454
 
455
  else:
456
  # Motion Encoder
457
+ device = "cuda:0"
458
 
459
  # input shape b,c,t,h,w
460
  batch_size,_,time_length,_,_ = image.size()
461
 
462
+ image = einops.rearrange(image, 'b c t h w -> (b t) c h w').to(device)
463
 
464
  with self.maybe_autocast():
465