Remove unused logic in models/mistral.py (#33095)
Signed-off-by: Andy Lo <andy@mistral.ai>
@@ -156,16 +156,8 @@ class MistralDecoderLayer(LlamaDecoderLayer):
         )

         self.layer_idx = int(prefix.split(sep=".")[-1])
-        quant_config = self.get_quant_config(vllm_config)
         config = config or vllm_config.model_config.hf_config

-        do_fusion = getattr(
-            quant_config, "enable_quantization_scaling_fusion", False
-        ) and vllm_config.cache_config.cache_dtype.startswith("fp8")
-        if do_fusion:
-            self.input_layernorm.quant_scaling_from = self.self_attn.qkv_proj
-            self.post_attention_layernorm.quant_scaling_from = self.mlp.gate_up_proj
-
         if getattr(config, "ada_rms_norm_t_cond", False):
             self.ada_rms_norm_t_cond = nn.Sequential(
                 ColumnParallelLinear(
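For context, the removed block gated layer-norm quantization-scaling fusion on two conditions: a quant-config flag and an fp8 KV-cache dtype. The following is a minimal, self-contained Python sketch of that gating check; the QuantConfig/CacheConfig stand-ins and the should_fuse helper are hypothetical names for illustration, while the enable_quantization_scaling_fusion flag and the startswith("fp8") cache-dtype test come from the diff itself.

    from dataclasses import dataclass
    from typing import Optional


    @dataclass
    class QuantConfig:
        """Hypothetical stand-in for a vLLM quantization config object."""
        # Flag name taken from the removed code; off by default.
        enable_quantization_scaling_fusion: bool = False


    @dataclass
    class CacheConfig:
        """Hypothetical stand-in for vllm_config.cache_config."""
        cache_dtype: str = "auto"  # e.g. "auto", "fp8", "fp8_e4m3"


    def should_fuse(quant_config: Optional[QuantConfig],
                    cache_config: CacheConfig) -> bool:
        # getattr with a default tolerates configs (or None) that lack the
        # flag, mirroring the removed do_fusion expression.
        return bool(
            getattr(quant_config, "enable_quantization_scaling_fusion", False)
            and cache_config.cache_dtype.startswith("fp8")
        )


    # The layer only rewired its norms when both conditions held:
    assert should_fuse(QuantConfig(True), CacheConfig("fp8_e4m3"))
    assert not should_fuse(QuantConfig(True), CacheConfig("auto"))
    assert not should_fuse(None, CacheConfig("fp8"))

Gating via getattr with a default, rather than a direct attribute access, lets the check degrade gracefully when the quantization backend does not expose the fusion flag.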