Files
DeepGEMM/deep_gemm/utils/layout.py
Chenggang Zhao 7f2a703ed5 [Public release 26/04] Introducing Mega MoE, FP4 Indexer and other features/fixes (#304)
* Merge with private repo

* Update README

* Update README

* Update README

* Add PyTorch requirements

* Fix sync scopes for MQA logits (#256)

* Update README
2026-04-17 09:45:14 +08:00

22 lines
680 B
Python

# Re-exports of layout helpers from the parent package's `_C` module, plus two
# convenience aliases.

# Optional helpers: an ImportError raised while importing them is tolerated.
try:
    from .._C import (
        get_tma_aligned_size,
        get_mn_major_tma_aligned_tensor,
        get_mn_major_tma_aligned_packed_ue8m0_tensor,
        get_k_grouped_mn_major_tma_aligned_packed_ue8m0_tensor,
    )
except ImportError:
    # Expected for CUDA runtime versions before 12.1. Any name that was not
    # bound before the failure is simply left undefined in this module.
    pass

# Helpers that are valid for all CUDA versions. This import is not guarded,
# so a failure here propagates to whoever imports this module.
from .._C import (
    get_theoretical_mk_alignment_for_contiguous_layout,
    get_mk_alignment_for_contiguous_layout,
    set_mk_alignment_for_contiguous_layout,
)

# Aliases: the M-specific and K-specific names both refer to the very same
# function object as the combined MK getter.
get_k_alignment_for_contiguous_layout = get_mk_alignment_for_contiguous_layout
get_m_alignment_for_contiguous_layout = get_mk_alignment_for_contiguous_layout