Make various updates and fixes: (#164)

- Add BF16 support for SM90 and SM100
- Refactor Python APIs
- Other fixes and code refactoring
This commit is contained in:
Ray Wang
2025-08-15 18:32:35 +08:00
committed by GitHub
parent 3254b758e2
commit f85ec649d7
34 changed files with 2293 additions and 495 deletions

View File

@@ -27,6 +27,10 @@ third_party_include_dirs = [
'third-party/cutlass/include/cutlass',
]
# Opt-in build switch for older CUDA compatibility: when the environment
# variable DG_JIT_USE_DRIVER_API is set to a non-zero integer, pass the
# -DDG_JIT_USE_DRIVER_API define through cxx_flags. Unset is treated as '0'
# (disabled); a value that is not an integer makes int() raise ValueError.
if int(os.getenv('DG_JIT_USE_DRIVER_API', '0')) != 0:
    cxx_flags.append('-DDG_JIT_USE_DRIVER_API')
class CustomBuildPy(build_py):
def run(self):