Update modeling_llava_qwen2.py
Browse files - modeling_llava_qwen2.py (+2 -2): comment out the two `assert image_features.shape[-2] == 729` checks in SigLipVisionTower
modeling_llava_qwen2.py
CHANGED
|
@@ -538,13 +538,13 @@ class SigLipVisionTower(nn.Module):
|
|
| 538 |
image_forward_out = self.vision_tower(image.to(device=self.device, dtype=self.dtype).unsqueeze(0),
|
| 539 |
output_hidden_states=True)
|
| 540 |
image_feature = image_forward_out.hidden_states[-1].to(image.dtype)
|
| 541 |
-
assert image_features.shape[-2] == 729
|
| 542 |
image_features.append(image_feature)
|
| 543 |
else:
|
| 544 |
image_forward_outs = self.vision_tower(images.to(device=self.device, dtype=self.dtype),
|
| 545 |
output_hidden_states=True)
|
| 546 |
image_features = image_forward_outs.hidden_states[-1].to(images.dtype)
|
| 547 |
-
assert image_features.shape[-2] == 729
|
| 548 |
|
| 549 |
return image_features
|
| 550 |
|
|
|
|
| 538 |
image_forward_out = self.vision_tower(image.to(device=self.device, dtype=self.dtype).unsqueeze(0),
|
| 539 |
output_hidden_states=True)
|
| 540 |
image_feature = image_forward_out.hidden_states[-1].to(image.dtype)
|
| 541 |
+
# assert image_features.shape[-2] == 729
|
| 542 |
image_features.append(image_feature)
|
| 543 |
else:
|
| 544 |
image_forward_outs = self.vision_tower(images.to(device=self.device, dtype=self.dtype),
|
| 545 |
output_hidden_states=True)
|
| 546 |
image_features = image_forward_outs.hidden_states[-1].to(images.dtype)
|
| 547 |
+
# assert image_features.shape[-2] == 729
|
| 548 |
|
| 549 |
return image_features
|
| 550 |
|