[Doc] Update docs to refer to pooling models (#11093)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
This commit is contained in:
Cyrus Leung
2024-12-11 21:36:27 +08:00
committed by GitHub
parent 8f10d5e393
commit cad5c0a6ed
14 changed files with 26 additions and 21 deletions

View File

@@ -893,7 +893,7 @@ class EngineArgs:
'--override-pooler-config',
type=PoolerConfig.from_json,
default=None,
-help="Override or set the pooling method in the embedding model. "
+help="Override or set the pooling method for pooling models. "
"e.g. {\"pooling_type\": \"mean\", \"normalize\": false}.'")
parser.add_argument('--compilation-config',
@@ -1085,7 +1085,7 @@ class EngineArgs:
"setting --max-model-len to a smaller value.", max_model_len)
elif (self.enable_chunked_prefill
and model_config.runner_type == "pooling"):
-msg = "Chunked prefill is not supported for embedding models"
+msg = "Chunked prefill is not supported for pooling models"
raise ValueError(msg)