[Bugfix] Fix parameter name in get_tokenizer (#4107)

This commit is contained in:
Cyrus Leung
2024-04-26 10:10:48 +08:00
committed by GitHub
parent cf29b7eda4
commit a74dee9b62
2 changed files with 26 additions and 5 deletions

View File

@@ -0,0 +1,20 @@
import pytest
from transformers import PreTrainedTokenizerBase
from vllm.transformers_utils.tokenizer import get_tokenizer
TOKENIZER_NAMES = [
"facebook/opt-125m",
"gpt2",
]
@pytest.mark.parametrize("tokenizer_name", TOKENIZER_NAMES)
def test_tokenizer_revision(tokenizer_name: str):
# Assume that "main" branch always exists
tokenizer = get_tokenizer(tokenizer_name, revision="main")
assert isinstance(tokenizer, PreTrainedTokenizerBase)
# Assume that "never" branch always does not exist
with pytest.raises(OSError, match='not a valid git identifier'):
get_tokenizer(tokenizer_name, revision="never")