[Bugfix] Add custom Triton cache manager to resolve MoE MP issue (#6140)
Signed-off-by: Thomas Parnell <tpa@zurich.ibm.com>
Co-authored-by: Chih-Chieh-Yang <chih.chieh.yang@ibm.com>
This commit is contained in:
6
vllm/triton_utils/__init__.py
Normal file
6
vllm/triton_utils/__init__.py
Normal file
@@ -0,0 +1,6 @@
from vllm.triton_utils.custom_cache_manager import (
    maybe_set_triton_cache_manager)

__all__ = [
    "maybe_set_triton_cache_manager",
]
Reference in New Issue
Block a user