[Bugfix] Adopt ChunkGatedDeltaRule for Qwen3.5 (#34198)

Signed-off-by: Roger Wang <hey@rogerw.io>
This commit is contained in:
Roger Wang
2026-02-09 19:47:54 -08:00
committed by GitHub
parent e94ec59733
commit 047a457fa4

View File

@@ -99,6 +99,7 @@ from .interfaces import (
)
from .qwen2_moe import Qwen2MoeMLP as Qwen3NextMLP
from .qwen3_next import (
ChunkGatedDeltaRule,
Qwen3NextAttention,
Qwen3NextDecoderLayer,
Qwen3NextGatedDeltaNet,
@@ -268,6 +269,8 @@ class Qwen3_5GatedDeltaNet(Qwen3NextGatedDeltaNet):
prefix=f"{prefix}.out_proj",
)
self.chunk_gated_delta_rule = ChunkGatedDeltaRule()
compilation_config = get_current_vllm_config().compilation_config
if prefix in compilation_config.static_forward_context:
raise ValueError(f"Duplicate layer name: {prefix}")