[Model] Add support for BERT-like Chinese ERNIE pooling models (#36385)

Signed-off-by: whyiug <whyiug@hotmail.com>
Co-authored-by: wang.yuqi <yuqi.wang@daocloud.io>
This commit is contained in:
whyiug
2026-03-13 11:23:53 +08:00
committed by GitHub
parent 10f08dedfa
commit 1ce13cf992
7 changed files with 317 additions and 3 deletions

View File

@@ -18,6 +18,7 @@ from vllm.platforms import current_platform
pytest.mark.slow_test,
],
),
pytest.param("Forrest20231206/ernie-3.0-base-zh-cls"),
],
)
@pytest.mark.parametrize("dtype", ["half"] if current_platform.is_rocm() else ["float"])
@@ -47,5 +48,6 @@ def test_models(
assert torch.allclose(
hf_output,
vllm_output,
atol=1e-3 if dtype == "float" else 1e-2,
rtol=2e-3 if dtype == "float" else 1e-2,
)