Print warnings/errors for large swap space (#123)
This commit is contained in:
@@ -84,6 +84,7 @@ class LLMServer:
|
||||
|
||||
def _verify_args(self) -> None:
|
||||
self.model_config.verify_with_parallel_config(self.parallel_config)
|
||||
self.cache_config.verify_with_parallel_config(self.parallel_config)
|
||||
|
||||
def _init_cache(self) -> None:
|
||||
# Get the maximum number of blocks that can be allocated on GPU and CPU.
|
||||
|
||||
Reference in New Issue
Block a user