diff --git a/.buildkite/test-amd.yaml b/.buildkite/test-amd.yaml index 791f0f190..b3d20caab 100644 --- a/.buildkite/test-amd.yaml +++ b/.buildkite/test-amd.yaml @@ -55,9 +55,11 @@ steps: grade: Blocking source_file_dependencies: - vllm/ + - tests/detokenizer - tests/multimodal - tests/utils_ commands: + - pytest -v -s detokenizer - pytest -v -s -m 'not cpu_test' multimodal - pytest -v -s utils_ @@ -547,7 +549,7 @@ steps: - tests/samplers - tests/conftest.py commands: - - pytest -v -s -m 'not skip_v1' samplers + - pytest -v -s samplers - label: LoRA Test %N # 20min each timeout_in_minutes: 30 @@ -2213,7 +2215,7 @@ steps: - tests/samplers - tests/conftest.py commands: - - pytest -v -s -m 'not skip_v1' samplers + - pytest -v -s samplers - label: LoRA Test %N # 20min each timeout_in_minutes: 30 diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index 24bd1736a..ecbf1a878 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -51,9 +51,11 @@ steps: mirror_hardwares: [amdexperimental] source_file_dependencies: - vllm/ + - tests/detokenizer - tests/multimodal - tests/utils_ commands: + - pytest -v -s detokenizer - pytest -v -s -m 'not cpu_test' multimodal - pytest -v -s utils_ diff --git a/.buildkite/test_areas/misc.yaml b/.buildkite/test_areas/misc.yaml index c80db1b89..f58aa204b 100644 --- a/.buildkite/test_areas/misc.yaml +++ b/.buildkite/test_areas/misc.yaml @@ -108,9 +108,11 @@ steps: timeout_in_minutes: 50 source_file_dependencies: - vllm/ + - tests/detokenizer - tests/multimodal - tests/utils_ commands: + - pytest -v -s detokenizer - pytest -v -s -m 'not cpu_test' multimodal - pytest -v -s utils_ diff --git a/.buildkite/test_areas/samplers.yaml b/.buildkite/test_areas/samplers.yaml index 7a71fa433..cc84d2a48 100644 --- a/.buildkite/test_areas/samplers.yaml +++ b/.buildkite/test_areas/samplers.yaml @@ -18,4 +18,4 @@ steps: depends_on: - image-build-amd commands: - - pytest -v -s -m 'not skip_v1' samplers + - 
pytest -v -s samplers diff --git a/pyproject.toml b/pyproject.toml index b64254bf5..551c6ba77 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -113,7 +113,6 @@ markers = [ "cpu_test: mark test as CPU-only test", "split: run this test as part of a split", "distributed: run this test only in distributed GPU tests", - "skip_v1: do not run this test with v1", "optional: optional tests that are automatically skipped, include --optional to run them", ] diff --git a/tests/detokenizer/test_disable_detokenization.py b/tests/detokenizer/test_disable_detokenization.py index a77626df5..71ecb5566 100644 --- a/tests/detokenizer/test_disable_detokenization.py +++ b/tests/detokenizer/test_disable_detokenization.py @@ -7,7 +7,6 @@ from vllm.entrypoints.llm import LLM from vllm.sampling_params import SamplingParams -@pytest.mark.skip_v1 @pytest.mark.parametrize("model", ["distilbert/distilgpt2"]) def test_computed_prefix_blocks(model: str): # This test checks if the engine generates completions both with and