Files
DeepGEMM/tests/test_lazy_init.py
Chenggang Zhao 7f2a703ed5 [Public release 26/04] Introducing Mega MoE, FP4 Indexer and other features/fixes (#304)
* Merge with private repo

* Update README

* Update README

* Update README

* Add PyTorch requirements

* Fix sync scopes for MQA logits (#256)

* Update README
2026-04-17 09:45:14 +08:00

21 lines
562 B
Python

import argparse
import torch
import torch.multiprocessing as mp
import deep_gemm
def main(local_rank: int):
torch.cuda.set_device(local_rank)
if __name__ == '__main__':
parser = argparse.ArgumentParser(description='Test lazy initialization')
parser.add_argument('--num-processes', type=int, default=8, help='Number of processes to spawn (default: 8)')
args = parser.parse_args()
procs = [mp.Process(target=main, args=(i, ), ) for i in range(args.num_processes)]
for p in procs:
p.start()
for p in procs:
p.join()