Modularize fused experts and integrate PPLX kernels (#15956)
This commit is contained in:
@@ -341,7 +341,8 @@ def init_worker_distributed_environment(
 distributed_init_method, local_rank)
 
 ensure_model_parallel_initialized(parallel_config.tensor_parallel_size,
-parallel_config.pipeline_parallel_size)
+parallel_config.pipeline_parallel_size,
+parallel_config.enable_expert_parallel)
 
 ensure_kv_transfer_initialized(vllm_config)
 
Reference in New Issue
Block a user