From 95ff7eeeebd5cca911bc50526fe266a794455ba7 Mon Sep 17 00:00:00 2001 From: Matthew Bonanni Date: Tue, 3 Mar 2026 11:42:32 -0500 Subject: [PATCH 1/2] Bump MTP num_speculative_tokens from 1 to 3 in DeepSeek-V3.2 GSM8K eval configs Signed-off-by: Matthew Bonanni --- tests/evals/gsm8k/configs/DeepSeek-V3.2-DP.yaml | 2 +- tests/evals/gsm8k/configs/DeepSeek-V3.2-TP.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/evals/gsm8k/configs/DeepSeek-V3.2-DP.yaml b/tests/evals/gsm8k/configs/DeepSeek-V3.2-DP.yaml index d7d1df974aab..c0e2e8f044be 100644 --- a/tests/evals/gsm8k/configs/DeepSeek-V3.2-DP.yaml +++ b/tests/evals/gsm8k/configs/DeepSeek-V3.2-DP.yaml @@ -8,4 +8,4 @@ server_args: >- --max-model-len 4096 --data-parallel-size 8 --enable-expert-parallel - --speculative-config '{"method":"mtp","num_speculative_tokens":1}' + --speculative-config '{"method":"mtp","num_speculative_tokens":3}' diff --git a/tests/evals/gsm8k/configs/DeepSeek-V3.2-TP.yaml b/tests/evals/gsm8k/configs/DeepSeek-V3.2-TP.yaml index 83687594d415..d31c63b8d764 100644 --- a/tests/evals/gsm8k/configs/DeepSeek-V3.2-TP.yaml +++ b/tests/evals/gsm8k/configs/DeepSeek-V3.2-TP.yaml @@ -8,4 +8,4 @@ server_args: >- --max-model-len 4096 --tensor-parallel-size 8 --enable-expert-parallel - --speculative-config '{"method":"mtp","num_speculative_tokens":1}' + --speculative-config '{"method":"mtp","num_speculative_tokens":3}' From beee1f9b7d8a41256463d37484e770e7b2388862 Mon Sep 17 00:00:00 2001 From: Matthew Bonanni Date: Tue, 3 Mar 2026 11:52:49 -0500 Subject: [PATCH 2/2] Apply the MTP num_speculative_tokens bump (1 to 3) to DeepSeek-R1 GSM8K eval configs Signed-off-by: Matthew Bonanni --- tests/evals/gsm8k/configs/DeepSeek-R1-DP.yaml | 2 +- tests/evals/gsm8k/configs/DeepSeek-R1-TP.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/evals/gsm8k/configs/DeepSeek-R1-DP.yaml b/tests/evals/gsm8k/configs/DeepSeek-R1-DP.yaml index f351a1722064..0c6a598a8a90 100644 --- a/tests/evals/gsm8k/configs/DeepSeek-R1-DP.yaml +++ b/tests/evals/gsm8k/configs/DeepSeek-R1-DP.yaml @@ -8,4 +8,4 @@ server_args: >- 
--max-model-len 4096 --data-parallel-size 8 --enable-expert-parallel - --speculative-config '{"method":"mtp","num_speculative_tokens":1}' + --speculative-config '{"method":"mtp","num_speculative_tokens":3}' diff --git a/tests/evals/gsm8k/configs/DeepSeek-R1-TP.yaml b/tests/evals/gsm8k/configs/DeepSeek-R1-TP.yaml index ba3463463b5e..f6ab81008588 100644 --- a/tests/evals/gsm8k/configs/DeepSeek-R1-TP.yaml +++ b/tests/evals/gsm8k/configs/DeepSeek-R1-TP.yaml @@ -8,4 +8,4 @@ server_args: >- --max-model-len 4096 --tensor-parallel-size 8 --enable-expert-parallel - --speculative-config '{"method":"mtp","num_speculative_tokens":1}' + --speculative-config '{"method":"mtp","num_speculative_tokens":3}'