diff --git a/vllm/model_executor/models/qwen3_vl.py b/vllm/model_executor/models/qwen3_vl.py index 42cadb20e..7e36672b7 100644 --- a/vllm/model_executor/models/qwen3_vl.py +++ b/vllm/model_executor/models/qwen3_vl.py @@ -557,7 +557,6 @@ class Qwen3_VisionTransformer(nn.Module): max_seqlen = torch.tensor( MMEncoderAttention.compute_max_seqlen(self.attn_backend, cu_seqlens), dtype=torch.int32, - device=self.device, ) cu_seqlens = MMEncoderAttention.maybe_recompute_cu_seqlens( self.attn_backend,