diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index f5be8dca05f1..c85010ab262d 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -453,6 +453,15 @@ steps: - pip install git+https://github.com/TIGER-AI-Lab/Mantis.git - pytest -v -s models/decoder_only/vision_language/test_models.py -m 'split(group=1) and not core_model and not quant_model' +- label: SSM and Hybrid Models Test # 12min + source_file_dependencies: + - vllm/ + - tests/models/decoder_only/language/test_hybrid.py + - tests/models/decoder_only/language/test_mamba.py + commands: + - pytest -v -s models/decoder_only/language/test_hybrid.py + - pytest -v -s models/decoder_only/language/test_mamba.py + # This test is used only in PR development phase to test individual models and should never run on main - label: Custom Models Test optional: true diff --git a/vllm/model_executor/models/bamba.py b/vllm/model_executor/models/bamba.py index 61b68125e07e..de0209d0b43b 100644 --- a/vllm/model_executor/models/bamba.py +++ b/vllm/model_executor/models/bamba.py @@ -38,8 +38,6 @@ make_empty_intermediate_tensors_factory, make_layers, maybe_prefix) -KVCache = Tuple[torch.Tensor, torch.Tensor] - class BambaMLP(nn.Module):