diff --git a/deep_gemm/mega/__init__.py b/deep_gemm/mega/__init__.py index e2ff491..bd459d9 100644 --- a/deep_gemm/mega/__init__.py +++ b/deep_gemm/mega/__init__.py @@ -286,6 +286,8 @@ def transform_nvfp4_weights_for_mega_moe( l1_sf_mn, l1_n, l1_k, (1, 16), num_experts) l2_sf_transformed = transform_sf_into_required_layout( l2_sf_mn, l2_n, l2_k, (1, 16), num_experts) + print(f"[debug-pre-interleave] l1_sf_transformed: shape={tuple(l1_sf_transformed.shape)} strides={l1_sf_transformed.stride()}", flush=True) + print(f"[debug-pre-interleave] l2_sf_transformed: shape={tuple(l2_sf_transformed.shape)} strides={l2_sf_transformed.stride()}", flush=True) # L1: interleave gate/up l1_interleaved = _interleave_l1_weights((l1_weights[0], l1_sf_transformed))