[Model] Pipeline parallel support for Qwen2 (#6924)

This commit is contained in:
xuyi
2024-08-01 09:49:51 +08:00
committed by GitHub
parent 7ecee34321
commit 1d2e7fb73f
3 changed files with 101 additions and 27 deletions

View File

@@ -40,6 +40,8 @@ _PP_SUPPORTED_MODELS = [
"GPT2LMHeadModel",
"MixtralForCausalLM",
"NemotronForCausalLM",
"Qwen2ForCausalLM",
"Qwen2MoeForCausalLM",
]