From 65d4da19c7b8886e9bc0cdf919b844980e327ae5 Mon Sep 17 00:00:00 2001 From: Benjamin Chislett Date: Fri, 10 Apr 2026 12:03:20 -0400 Subject: [PATCH] Revert "Add nightly b200 test for spec decode eagle correctness (#38577)" This reverts commit adaabb8a55b3109babaaee7e2821ceefe05d6db4. Signed-off-by: Benjamin Chislett --- .buildkite/test_areas/spec_decode.yaml | 34 -------------------------- 1 file changed, 34 deletions(-) diff --git a/.buildkite/test_areas/spec_decode.yaml b/.buildkite/test_areas/spec_decode.yaml index e3fcdd0ecdd9..a0b730968675 100644 --- a/.buildkite/test_areas/spec_decode.yaml +++ b/.buildkite/test_areas/spec_decode.yaml @@ -12,17 +12,6 @@ steps: commands: - pytest -v -s v1/e2e/spec_decode -k "eagle_correctness" -- label: Spec Decode Eagle Nightly B200 - timeout_in_minutes: 30 - device: b200 - optional: true - source_file_dependencies: - - vllm/v1/spec_decode/ - - vllm/v1/worker/gpu/spec_decode/ - - tests/v1/e2e/spec_decode/ - commands: - - pytest -v -s v1/e2e/spec_decode -k "eagle_correctness" - - label: Spec Decode Speculators + MTP timeout_in_minutes: 30 device: h200_18gb @@ -34,18 +23,6 @@ steps: commands: - pytest -v -s v1/e2e/spec_decode -k "speculators or mtp_correctness" -- label: Spec Decode Speculators + MTP Nightly B200 - timeout_in_minutes: 30 - device: b200 - optional: true - source_file_dependencies: - - vllm/v1/spec_decode/ - - vllm/v1/worker/gpu/spec_decode/ - - vllm/transformers_utils/configs/speculators/ - - tests/v1/e2e/spec_decode/ - commands: - - pytest -v -s v1/e2e/spec_decode -k "speculators or mtp_correctness" - - label: Spec Decode Ngram + Suffix timeout_in_minutes: 30 device: h200_18gb @@ -65,14 +42,3 @@ steps: - tests/v1/e2e/spec_decode/ commands: - pytest -v -s v1/e2e/spec_decode -k "draft_model or no_sync or batch_inference" - -- label: Spec Decode Draft Model Nightly B200 - timeout_in_minutes: 30 - device: b200 - optional: true - source_file_dependencies: - - vllm/v1/spec_decode/ - - vllm/v1/worker/gpu/spec_decode/ - - tests/v1/e2e/spec_decode/ - commands: - - pytest -v -s v1/e2e/spec_decode -k "draft_model or no_sync or batch_inference"