[Misc] Update gptq_marlin to use new vLLMParameters (#7281)
This commit is contained in:
@@ -20,7 +20,9 @@ from vllm.model_executor.utils import set_weight_attrs
|
||||
|
||||
logger = init_logger(__name__)
|
||||
|
||||
WEIGHT_LOADER_V2_SUPPORTED = ["CompressedTensorsLinearMethod"]
|
||||
WEIGHT_LOADER_V2_SUPPORTED = [
|
||||
"CompressedTensorsLinearMethod", "GPTQMarlinLinearMethod"
|
||||
]
|
||||
|
||||
|
||||
def adjust_marlin_shard(param, shard_size, shard_offset):
|
||||
|
||||
Reference in New Issue
Block a user