[Misc] Improve the readability of BNB error messages (#12320)
Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>
This commit is contained in:
@@ -1076,8 +1076,8 @@ class BitsAndBytesModelLoader(BaseModelLoader):
|
|||||||
# weight tensor. So TP does not work with pre_quantized bnb models.
|
# weight tensor. So TP does not work with pre_quantized bnb models.
|
||||||
if pre_quant and get_tensor_model_parallel_world_size() > 1:
|
if pre_quant and get_tensor_model_parallel_world_size() > 1:
|
||||||
raise ValueError(
|
raise ValueError(
|
||||||
"Prequant BitsAndBytes models with TP is not supported."
|
"Prequant BitsAndBytes models with tensor parallelism is not "
|
||||||
"Please try with PP.")
|
"supported. Please try with pipeline parallelism.")
|
||||||
|
|
||||||
load_8bit = False
|
load_8bit = False
|
||||||
if pre_quant:
|
if pre_quant:
|
||||||
|
|||||||
Reference in New Issue
Block a user