From 70c376986b19bd6102a69e0ae16d3b61ace010e9 Mon Sep 17 00:00:00 2001
From: Nick Hill
Date: Mon, 1 Jun 2026 09:43:03 -0700
Subject: [PATCH] [Test][BugFix] Fix double-BOS in PD+specdec acceptance test

Signed-off-by: Nick Hill
---
 .../nixl_integration/test_spec_decode_acceptance.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/tests/v1/kv_connector/nixl_integration/test_spec_decode_acceptance.py b/tests/v1/kv_connector/nixl_integration/test_spec_decode_acceptance.py
index c86a407ff8e3..15f386f5f5a8 100644
--- a/tests/v1/kv_connector/nixl_integration/test_spec_decode_acceptance.py
+++ b/tests/v1/kv_connector/nixl_integration/test_spec_decode_acceptance.py
@@ -158,6 +158,10 @@ def test_spec_decode_acceptance_length():
             max_tokens=DEFAULT_OUTPUT_LEN,
             temperature=0.0,
             top_p=1.0,
+            # Prompts are already chat-templated (contain BOS); avoid the
+            # completions API prepending a second BOS, which would lower
+            # acceptance ~5% vs the add_special_tokens=False standalone baselines.
+            extra_body={"add_special_tokens": False},
         )
         if i < 3:
             text = resp.choices[0].text.strip()[:100]