[Bugfix] Respect num-gpu-blocks-override in v1 (#19503)

Signed-off-by: Jon Swenson <jmswen@gmail.com>
This commit is contained in:
jmswen
2025-06-12 04:00:23 -07:00
committed by GitHub
parent af09b3f0a0
commit c9280e6346
2 changed files with 17 additions and 0 deletions

View File

@@ -660,6 +660,7 @@ def get_num_blocks(vllm_config: VllmConfig, num_layers: int,
logger.info(
"Overriding num_gpu_blocks=%d with "
"num_gpu_blocks_override=%d", num_blocks, num_gpu_blocks_override)
num_blocks = num_gpu_blocks_override
return num_blocks