Spaces: Running on Zero
Update utils/model.py
Browse files - utils/model.py (+2 -1)
utils/model.py
CHANGED
@@ -424,9 +424,10 @@ class OwlViTForClassification(nn.Module):
|
|
424 |
txt_embeds = self.owlvit.text_model.embeddings.token_embedding(text_inputs_parts['input_ids'])
|
425 |
print(f"position_embedding: {self.owlvit.text_model.embeddings.position_embedding(position_ids).shape}")
|
426 |
print(f"text_embeds: {txt_embeds.shape}")
|
427 |
-
|
428 |
text_inputs_parts["position_ids"] = position_ids
|
429 |
position_ids = position_ids.repeat(1, 1, txt_embeds.size(-1) // position_ids.size(-1))
|
|
|
430 |
text_embeds_parts = self.owlvit.text_model.get_text_features(**text_inputs_parts)
|
431 |
|
432 |
# # Embed images and text queries
|
|
|
424 |
txt_embeds = self.owlvit.text_model.embeddings.token_embedding(text_inputs_parts['input_ids'])
|
425 |
print(f"position_embedding: {self.owlvit.text_model.embeddings.position_embedding(position_ids).shape}")
|
426 |
print(f"text_embeds: {txt_embeds.shape}")
|
427 |
+
|
428 |
text_inputs_parts["position_ids"] = position_ids
|
429 |
position_ids = position_ids.repeat(1, 1, txt_embeds.size(-1) // position_ids.size(-1))
|
430 |
+
print(f"pos + emb: {(txt_embeds + position_ids).shape}")
|
431 |
text_embeds_parts = self.owlvit.text_model.get_text_features(**text_inputs_parts)
|
432 |
|
433 |
# # Embed images and text queries
|