Set torch_dtype in TransformersModel (#13088)
Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
This commit is contained in:
@@ -143,6 +143,7 @@ class TransformersModel(nn.Module):
 self.model: PreTrainedModel = AutoModel.from_config(
     self.config,
     attn_implementation="vllm",
+    torch_dtype=vllm_config.model_config.dtype,
     trust_remote_code=vllm_config.model_config.trust_remote_code,
 )
 prefix = self.model.base_model_prefix
Reference in New Issue
Block a user