[AMD][FP8][BugFix] Remove V1 check in arg_utils.py for FP8 since it is not necessary (#17215)
Signed-off-by: Randall Smith <Randall.Smith@amd.com>
This commit is contained in:
@@ -307,18 +307,6 @@ class QuarkConfig(QuantizationConfig):
|
||||
# If no matches, return None
|
||||
return None
|
||||
|
||||
def has_fp8_layer_weights(self):
    """Report whether any q/k/v projection layer is configured with FP8 weights.

    Reads ``self.quant_config["layer_quant_config"]`` and, for each of the
    layer-name patterns ``*v_proj``, ``*k_proj`` and ``*q_proj``, looks up
    the nested ``["weight"]["dtype"]`` entry.

    Returns:
        True if at least one of those dtype entries contains the substring
        ``'fp8'``; False otherwise, including when the layer config, a
        layer entry, its weight config, or its dtype is absent.
    """
    # Any level of the nested config may be missing or None; fall back to an
    # empty dict so the lookups below never dereference None.
    layer_quant_config = self.quant_config.get("layer_quant_config") or {}

    for layer_name in ("*v_proj", "*k_proj", "*q_proj"):
        layer_config = layer_quant_config.get(layer_name) or {}
        weight_config = layer_config.get("weight") or {}
        dtype = weight_config.get("dtype")
        # A missing dtype means "not FP8"; testing `'fp8' in None` would
        # raise TypeError instead of answering the question.
        if dtype is not None and 'fp8' in dtype:
            return True

    return False
|
||||
|
||||
|
||||
class QuarkLinearMethod(LinearMethodBase):
|
||||
|
||||
|
||||
Reference in New Issue
Block a user