diff --git a/vllm/config/vllm.py b/vllm/config/vllm.py index 3e5a4b8f5..690597418 100644 --- a/vllm/config/vllm.py +++ b/vllm/config/vllm.py @@ -358,13 +358,6 @@ class VllmConfig: ] return hash_str - def pad_for_cudagraph(self, batch_size: int) -> int: - # if batch_size > self.compilation_config.max_cudagraph_capture_size, - # it should raise an IndexError. - # the caller should make sure the batch_size is within the range, - # i.e., batch_size <= self.compilation_config.max_cudagraph_capture_size - return self.compilation_config.bs_to_padded_graph_size[batch_size] - @property def needs_dp_coordinator(self) -> bool: """