Adding support for Sarvam's MoE models (#33942)

Signed-off-by: rahul-sarvam <140298821+rahul-sarvam@users.noreply.github.com>
This commit is contained in:
rahul-sarvam
2026-03-08 01:16:24 +08:00
committed by GitHub
parent 5261223c2d
commit 85f50eb41f
4 changed files with 802 additions and 0 deletions

View File

@@ -480,6 +480,18 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
min_transformers_version="4.56.3",
),
"RWForCausalLM": _HfExamplesInfo("tiiuae/falcon-40b"),
"SarvamMoEForCausalLM": _HfExamplesInfo(
"sarvamai/sarvam-30b",
trust_remote_code=True,
max_model_len=4096,
is_available_online=True,
),
"SarvamMLAForCausalLM": _HfExamplesInfo(
"sarvamai/sarvam-105b",
trust_remote_code=True,
max_model_len=4096,
is_available_online=True,
),
"SeedOssForCausalLM": _HfExamplesInfo(
"ByteDance-Seed/Seed-OSS-36B-Instruct",
trust_remote_code=True,