Remove ScaledActivation for AWQ (#10057)

Signed-off-by: mgoin <michael@neuralmagic.com>
This commit is contained in:
Michael Goin
2024-11-06 09:27:06 -05:00
committed by GitHub
parent 406d4cc480
commit 399c798608
34 changed files with 19 additions and 124 deletions

View File

@@ -57,9 +57,6 @@ class NeuronQuantConfig(QuantizationConfig):
"Neuron Quantization is only supported through"
" transformers_neuronx.")
def get_scaled_act_names(self) -> List[str]:
return []
def get_quantization_config(self):
from transformers_neuronx.config import QuantizationConfig
return QuantizationConfig(quant_dtype=self.quant_dtype,