[Model] Avoid token selection in SigLIP pooling head (#32389)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
This commit is contained in:
Cyrus Leung
2026-01-15 17:01:59 +08:00
committed by GitHub
parent a52d1396a7
commit cdba4c74b3

View File

@@ -690,9 +690,9 @@ class SiglipMultiheadAttentionPoolingHead(nn.Module):
hidden_state = self.mlp(hidden_state)
hidden_state += residual
-pooled = hidden_state[:, 0]
-return pooled.unsqueeze(1)
+# Handled by resolve_visual_encoder_outputs
+# return hidden_state[:, 0]
+return hidden_state
class SiglipVisionTransformer(nn.Module):