From 54ab804e87dd534c0a8cb8ad8eec7ad5d75775ae Mon Sep 17 00:00:00 2001
From: Hojin Yang <57383540+effortprogrammer@users.noreply.github.com>
Date: Mon, 23 Mar 2026 16:36:57 +0900
Subject: [PATCH] [Bugfix] Store Qwen3Next A_log in fp32 (#37810)

Signed-off-by: effortprogrammer
Co-authored-by: Roger Wang
---
 vllm/model_executor/models/qwen3_next.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/vllm/model_executor/models/qwen3_next.py b/vllm/model_executor/models/qwen3_next.py
index c97257053..abba104bf 100644
--- a/vllm/model_executor/models/qwen3_next.py
+++ b/vllm/model_executor/models/qwen3_next.py
@@ -501,6 +501,7 @@ class Qwen3NextGatedDeltaNet(nn.Module, MambaBase):
         self.A_log = nn.Parameter(
             torch.empty(
                 divide(self.num_v_heads, self.tp_size),
+                dtype=torch.float32,
             )
         )
 