diff --git a/.buildkite/test-amd.yaml b/.buildkite/test-amd.yaml index ea117d4ed..d278dc983 100644 --- a/.buildkite/test-amd.yaml +++ b/.buildkite/test-amd.yaml @@ -889,7 +889,7 @@ steps: commands: # Install fast path packages for testing against transformers # Note: also needed to run plamo2 model in vLLM - - uv pip install --system --no-build-isolation 'git+https://github.com/state-spaces/mamba@v2.2.5' + - uv pip install --system --no-build-isolation 'git+https://github.com/AndreasKaratzas/mamba@fix-rocm-7.0-warp-size-constexpr' - uv pip install --system --no-build-isolation 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.2' # Shard hybrid language model tests - pytest -v -s models/language/generation \ @@ -910,7 +910,7 @@ steps: commands: # Install fast path packages for testing against transformers # Note: also needed to run plamo2 model in vLLM - - uv pip install --system --no-build-isolation 'git+https://github.com/state-spaces/mamba@v2.2.5' + - uv pip install --system --no-build-isolation 'git+https://github.com/AndreasKaratzas/mamba@fix-rocm-7.0-warp-size-constexpr' - uv pip install --system --no-build-isolation 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.2' - pytest -v -s models/language/generation -m '(not core_model) and (not hybrid_model)' diff --git a/tests/models/language/generation/test_phimoe.py b/tests/models/language/generation/test_phimoe.py index e64065578..1f03cf9cd 100644 --- a/tests/models/language/generation/test_phimoe.py +++ b/tests/models/language/generation/test_phimoe.py @@ -60,6 +60,19 @@ def test_phimoe_routing_function(): assert torch.equal(topk_ids, ground_truth[test_id]["topk_ids"]) +# There is a known issue that triggers `AttributeError: 'DynamicCache' +# object has no attribute 'seen_tokens'` when running: +# `tests/models/language/generation/test_phimoe.py::test_models +# [5-64-bfloat16-microsoft/Phi-3.5-MoE-instruct]` +# This issue is being investigated and tracked in: +# https://huggingface.co/microsoft/Phi-3.5-MoE-instruct/discussions/58 +# It is platform-agnostic. Therefore, we skip this test on all platforms for now. +@pytest.mark.skip( + reason="Skipping due to known issue: " + "'DynamicCache' object has no attribute 'seen_tokens'. See: " + "https://huggingface.co/microsoft/Phi-3.5-MoE-instruct/discussions/58 " + "for details.", +) @pytest.mark.skipif( condition=current_platform.is_cpu(), reason="This test takes a lot time to run on CPU, "