[MRV2] Avoid recompilation of _gather_block_tables_kernel (#37645)

Signed-off-by: Woosuk Kwon <woosuk@inferact.ai>
This commit is contained in:
Woosuk Kwon
2026-03-20 10:31:45 -07:00
committed by GitHub
parent d0532bf38d
commit e80cfe575d

View File

@@ -169,7 +169,7 @@ class BlockTables:
return self.slot_mappings[:, :num_tokens]
-@triton.jit
+@triton.jit(do_not_specialize=["num_reqs"])
def _gather_block_tables_kernel(
batch_idx_to_req_idx, # [batch_size]
src_block_table_ptrs, # [num_kv_cache_groups]