diff --git a/vllm/lora/ops/triton_ops/fused_moe_lora_op.py b/vllm/lora/ops/triton_ops/fused_moe_lora_op.py index 3b90b3f9d..c9c85c194 100644 --- a/vllm/lora/ops/triton_ops/fused_moe_lora_op.py +++ b/vllm/lora/ops/triton_ops/fused_moe_lora_op.py @@ -779,7 +779,6 @@ def _fused_moe_lora_shrink_fake( def _fused_moe_lora_expand_fake( output: torch.Tensor, a_intermediate_cache1: torch.Tensor, - b_intermediate_cache1: torch.Tensor, lora_b_stacked: list[torch.Tensor], topk_weights: torch.Tensor, sorted_token_ids: torch.Tensor | None,