Spaces: Running on Zero
Update utils/model.py
Browse files
- utils/model.py +2 -2
utils/model.py
CHANGED
@@ -428,10 +428,10 @@ class OwlViTForClassification(nn.Module):
|
|
428 |
device_ = txt_embeds.device
|
429 |
position_ids = position_ids.to(device_)
|
430 |
txt_embeds_size_0 = text_embeds.size(0)
|
431 |
-
position_embedding = position_ids.repeat(txt_embeds_size_0, 1, 1)
|
432 |
text_inputs_parts["position_ids"] = position_ids
|
433 |
print(f"position_embedding : {position_embedding.shape}")
|
434 |
-
print(f"pos + emb: {(txt_embeds + position_embedding).shape}")
|
435 |
text_embeds_parts = self.owlvit.text_model.get_text_features(**text_inputs_parts)
|
436 |
|
437 |
# # Embed images and text queries
|
|
|
428 |
device_ = txt_embeds.device
|
429 |
position_ids = position_ids.to(device_)
|
430 |
txt_embeds_size_0 = text_embeds.size(0)
|
431 |
+
position_embedding = position_ids.cpu().repeat(txt_embeds_size_0, 1, 1)
|
432 |
text_inputs_parts["position_ids"] = position_ids
|
433 |
print(f"position_embedding : {position_embedding.shape}")
|
434 |
+
print(f"pos + emb: {(txt_embeds.cpu() + position_embedding).shape}")
|
435 |
text_embeds_parts = self.owlvit.text_model.get_text_features(**text_inputs_parts)
|
436 |
|
437 |
# # Embed images and text queries
|