Remove ScaledActivation for AWQ (#10057)

Signed-off-by: mgoin <michael@neuralmagic.com>
2024-11-06 09:27:06 -05:00
parent 406d4cc480
commit 399c798608
34 changed files with 19 additions and 124 deletions
--- a/vllm/model_executor/layers/quantization/gguf.py
+++ b/vllm/model_executor/layers/quantization/gguf.py
@@ -48,9 +48,6 @@ class GGUFConfig(QuantizationConfig):
            return GGUFEmbeddingMethod(self)
        return None

-    def get_scaled_act_names(self) -> List[str]:
-        return []
-

 def _fuse_mul_mat(x: torch.Tensor, qweight: torch.Tensor,
                  qweight_type: int) -> torch.Tensor: