diff --git a/tests/e2e/nightly/multi_node/config/DeepSeek-R1-W8A8-longseq.yaml b/tests/e2e/nightly/multi_node/config/DeepSeek-R1-W8A8-longseq.yaml index bc88aaaa075..e6bbd7ae1ad 100644 --- a/tests/e2e/nightly/multi_node/config/DeepSeek-R1-W8A8-longseq.yaml +++ b/tests/e2e/nightly/multi_node/config/DeepSeek-R1-W8A8-longseq.yaml @@ -34,7 +34,7 @@ deployment: --seed 1024 --quantization ascend --max-num-seqs 4 - --max-model-len 32768 + --max-model-len 36864 --max-num-batched-tokens 16384 --trust-remote-code --gpu-memory-utilization 0.9 @@ -72,7 +72,7 @@ deployment: --seed 1024 --quantization ascend --max-num-seqs 4 - --max-model-len 32768 + --max-model-len 36864 --max-num-batched-tokens 256 --trust-remote-code --gpu-memory-utilization 0.9