[CI/Build][Bugfix]Fix Quantized Models Test on AMD (#27712)
Signed-off-by: zhewenli <zhewenli@meta.com>
This commit is contained in:
@@ -413,7 +413,7 @@ class RocmPlatform(Platform):
|
||||
"Using AWQ quantization with ROCm, but VLLM_USE_TRITON_AWQ"
|
||||
" is not set, enabling VLLM_USE_TRITON_AWQ."
|
||||
)
|
||||
envs.VLLM_USE_TRITON_AWQ = True
|
||||
os.environ["VLLM_USE_TRITON_AWQ"] = "1"
|
||||
|
||||
@classmethod
|
||||
def get_punica_wrapper(cls) -> str:
|
||||
|
||||
Reference in New Issue
Block a user