[Model] Pipeline Parallel Support for DeepSeek v2 (#6519)
Signed-off-by: Travis Johnson <tsjohnso@us.ibm.com>
This commit is contained in:
@@ -31,6 +31,7 @@ _EMBEDDING_MODEL_MAX_NUM_BATCHED_TOKENS = 32768
 _PP_SUPPORTED_MODELS = [
     "AquilaModel",
     "AquilaForCausalLM",
+    "DeepseekV2ForCausalLM",
     "InternLMForCausalLM",
     "LlamaForCausalLM",
     "LLaMAForCausalLM",
Reference in New Issue
Block a user