Update modeling_llava_qwen2.py
Browse files
- modeling_llava_qwen2.py +2 -2
modeling_llava_qwen2.py
CHANGED
@@ -538,13 +538,13 @@ class SigLipVisionTower(nn.Module):
|
|
538 |
image_forward_out = self.vision_tower(image.to(device=self.device, dtype=self.dtype).unsqueeze(0),
|
539 |
output_hidden_states=True)
|
540 |
image_feature = image_forward_out.hidden_states[-1].to(image.dtype)
|
541 |
-
assert image_features.shape[-2] == 729
|
542 |
image_features.append(image_feature)
|
543 |
else:
|
544 |
image_forward_outs = self.vision_tower(images.to(device=self.device, dtype=self.dtype),
|
545 |
output_hidden_states=True)
|
546 |
image_features = image_forward_outs.hidden_states[-1].to(images.dtype)
|
547 |
-
assert image_features.shape[-2] == 729
|
548 |
|
549 |
return image_features
|
550 |
|
|
|
538 |
image_forward_out = self.vision_tower(image.to(device=self.device, dtype=self.dtype).unsqueeze(0),
|
539 |
output_hidden_states=True)
|
540 |
image_feature = image_forward_out.hidden_states[-1].to(image.dtype)
|
541 |
+
# assert image_features.shape[-2] == 729
|
542 |
image_features.append(image_feature)
|
543 |
else:
|
544 |
image_forward_outs = self.vision_tower(images.to(device=self.device, dtype=self.dtype),
|
545 |
output_hidden_states=True)
|
546 |
image_features = image_forward_outs.hidden_states[-1].to(images.dtype)
|
547 |
+
# assert image_features.shape[-2] == 729
|
548 |
|
549 |
return image_features
|
550 |
|