Remove weight_scale.T special case for SM90 Block FP8 CUTLASS kernel (#28431)
Signed-off-by: mgoin <mgoin64@gmail.com>
This commit is contained in:
@@ -540,7 +540,7 @@ class Fp8LinearMethod(LinearMethodBase):
|
||||
return
|
||||
|
||||
if self.block_quant:
|
||||
- maybe_post_process_fp8_weight_block(layer, self.cutlass_block_fp8_supported)
+ maybe_post_process_fp8_weight_block(layer)
|
||||
|
||||
def apply(
|
||||
self,
|
||||
|
||||
Reference in New Issue
Block a user