Add support for Sarvam's MoE models (#33942)

Signed-off-by: rahul-sarvam <140298821+rahul-sarvam@users.noreply.github.com>
This commit is contained in:
rahul-sarvam
2026-03-08 01:16:24 +08:00
committed by GitHub
parent 5261223c2d
commit 85f50eb41f
4 changed files with 802 additions and 0 deletions

View File

@@ -191,6 +191,8 @@ _TEXT_GENERATION_MODELS = {
"Qwen3ForCausalLM": ("qwen3", "Qwen3ForCausalLM"),
"Qwen3MoeForCausalLM": ("qwen3_moe", "Qwen3MoeForCausalLM"),
"RWForCausalLM": ("falcon", "FalconForCausalLM"),
"SarvamMoEForCausalLM": ("sarvam", "SarvamMoEForCausalLM"),
"SarvamMLAForCausalLM": ("sarvam", "SarvamMLAForCausalLM"),
"SeedOssForCausalLM": ("seed_oss", "SeedOssForCausalLM"),
"Step1ForCausalLM": ("step1", "Step1ForCausalLM"),
"Step3TextForCausalLM": ("step3_text", "Step3TextForCausalLM"),