[ci] Use env var to control whether to use S3 bucket in CI (#13634)
This commit is contained in:
@@ -22,6 +22,7 @@ from vllm.executor.executor_base import ExecutorBase
|
||||
from vllm.logger import init_logger
|
||||
from vllm.model_executor.layers.quantization import QUANTIZATION_METHODS
|
||||
from vllm.plugins import load_general_plugins
|
||||
from vllm.test_utils import MODEL_WEIGHTS_S3_BUCKET, MODELS_ON_S3
|
||||
from vllm.transformers_utils.utils import check_gguf_file
|
||||
from vllm.usage.usage_lib import UsageContext
|
||||
from vllm.utils import FlexibleArgumentParser, StoreBoolean
|
||||
@@ -1141,6 +1142,14 @@ class EngineArgs:
|
||||
f", but got {self.cpu_offload_gb}")
|
||||
|
||||
device_config = DeviceConfig(device=self.device)
|
||||
|
||||
# NOTE: This is to allow model loading from S3 in CI
|
||||
if (not isinstance(self, AsyncEngineArgs) and envs.VLLM_CI_USE_S3
|
||||
and self.model in MODELS_ON_S3
|
||||
and self.load_format == LoadFormat.AUTO): # noqa: E501
|
||||
self.model = f"{MODEL_WEIGHTS_S3_BUCKET}/{self.model}"
|
||||
self.load_format = LoadFormat.RUNAI_STREAMER
|
||||
|
||||
model_config = self.create_model_config()
|
||||
|
||||
if (model_config.is_multimodal_model and not envs.VLLM_USE_V1
|
||||
|
||||
Reference in New Issue
Block a user