diff --git a/vllm/model_executor/layers/rotary_embedding.py b/vllm/model_executor/layers/rotary_embedding.py index db5c7080b..71af9b26e 100644 --- a/vllm/model_executor/layers/rotary_embedding.py +++ b/vllm/model_executor/layers/rotary_embedding.py @@ -143,8 +143,8 @@ class RotaryEmbedding(nn.Module): offsets: Optional[torch.Tensor] = None, ) -> Tuple[torch.Tensor, torch.Tensor]: self.cos_sin_cache = self.cos_sin_cache.to(positions.get_device()) - # ops.rotary_embedding()/batched_rotary_embedding() are in-place operations that - # update the query and key tensors. + # ops.rotary_embedding()/batched_rotary_embedding() + # are in-place operations that update the query and key tensors. if offsets is not None: ops.batched_rotary_embedding(positions, query, key, self.head_size, self.cos_sin_cache,