[Bugfix] Fix Qwen2.5-VL quantized model weights loading (#23512)

Signed-off-by: Zifei Tong <zifeitong@gmail.com>
This commit is contained in:
zifeitong
2025-08-24 19:40:22 -07:00
committed by GitHub
parent 39971db3aa
commit a71e4765cc

View File

@@ -135,7 +135,7 @@ class Qwen2_5_VLVideoPixelInputs(TypedDict):
second_per_grid_ts: torch.Tensor
"""
-The video time interval (in seconds) for each grid along the temporal
+The video time interval (in seconds) for each grid along the temporal
dimension in the 3D position IDs. Returned when `videos` is not `None`.
"""
@@ -852,6 +852,10 @@ class Qwen2_5_VLForConditionalGeneration(nn.Module, SupportsMultiModal,
SupportsLoRA, SupportsPP,
SupportsQuant):
+packed_modules_mapping = {
+"gate_up_proj": ["gate_proj", "up_proj"],
+}
# To ensure correct weight loading and mapping.
hf_to_vllm_mapper = WeightsMapper(
orig_to_new_prefix={