fix: derive v_major from the V tensor layout instead of hard-coding it

This commit is contained in:
2026-05-24 01:55:37 +00:00
parent 384de55dfd
commit 394f08601a

View File

@@ -39,12 +39,11 @@ def main():
# Derive major modes exactly as FmhaKernel does
from cutlass.utils import LayoutEnum
from cutlass.cute.nvgpu import OperandMajorMode
a_major = LayoutEnum.from_tensor(mQ).mma_major_mode()
b_major = LayoutEnum.from_tensor(mK).mma_major_mode()
# V FMHA layout: use explicit constants
# pv_n_tile=256, s_k=128
v_major = LayoutEnum.COL_MAJOR # layout (256, 128, 1) stride (1, 256, 32768) = col-major
v_major = LayoutEnum.from_tensor(mV).mma_major_mode()
print(f"a_major: {a_major}, b_major: {b_major}, v_major: {v_major}") # layout (256, 128, 1) stride (1, 256, 32768) = col-major
c_layout = LayoutEnum.from_tensor(mC)