Skip to content

Commit 44d5ccf

Browse files
authored
[None][ci] move qwen3 tests from GB200 to B200 (#7733)
Signed-off-by: junq <[email protected]>
1 parent 536e877 commit 44d5ccf

File tree

3 files changed

+15
-32
lines changed

3 files changed

+15
-32
lines changed

jenkins/L0_Test.groovy

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -2033,8 +2033,9 @@ def launchTestJobs(pipeline, testFilter)
20332033
"H100_PCIe-CPP-2": ["h100-cr", "l0_h100", 2, 2],
20342034
"H100_PCIe-TensorRT-1": ["h100-cr", "l0_h100", 1, 2],
20352035
"H100_PCIe-TensorRT-2": ["h100-cr", "l0_h100", 2, 2],
2036-
"B200_PCIe-PyTorch-1": ["b100-ts2", "l0_b200", 1, 2],
2037-
"B200_PCIe-PyTorch-2": ["b100-ts2", "l0_b200", 2, 2],
2036+
"B200_PCIe-PyTorch-1": ["b100-ts2", "l0_b200", 1, 3],
2037+
"B200_PCIe-PyTorch-2": ["b100-ts2", "l0_b200", 2, 3],
2038+
"B200_PCIe-PyTorch-3": ["b100-ts2", "l0_b200", 3, 3],
20382039
"RTX5090-PyTorch-1": ["rtx-5090", "l0_gb202", 1, 1],
20392040
"RTX5080-TensorRT-1": ["rtx-5080", "l0_gb203", 1, 2],
20402041
"RTX5080-TensorRT-2": ["rtx-5080", "l0_gb203", 2, 2],
@@ -2137,7 +2138,6 @@ def launchTestJobs(pipeline, testFilter)
21372138
fullSet += SBSATestConfigs.keySet()
21382139

21392140
SBSASlurmTestConfigs = [
2140-
"GB200-PyTorch-1": ["gb200-single", "l0_gb200", 1, 1],
21412141
"GB200-4_GPUs-PyTorch-1": ["gb200-x4", "l0_gb200_multi_gpus", 1, 1, 4],
21422142
"GB200-4_GPUs-PyTorch-Post-Merge-1": ["gb200-x4", "l0_gb200_multi_gpus", 1, 1, 4],
21432143
]

tests/integration/test_lists/test-db/l0_b200.yml

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,18 @@ l0_b200:
3939
- accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_1gpu[True-True-trtllm-fp8]
4040
- accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_1gpu[True-True-triton-auto]
4141
- accuracy/test_llm_api_pytorch.py::TestQwen3_8B::test_fp8_block_scales[latency] # Cover nvbugs 5461712 and 5505402
42+
- accuracy/test_llm_api_pytorch.py::TestQwen3_8B::test_w4a8_mxfp4[fp8-latency]
43+
- accuracy/test_llm_api_pytorch.py::TestQwen3_8B::test_w4a8_mxfp4[mxfp8-latency]
44+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_nvfp4[latency_moe_cutlass-torch_compile=False]
45+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_nvfp4[latency_moe_cutlass-torch_compile=True]
46+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_nvfp4[latency_moe_trtllm-torch_compile=False]
47+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_nvfp4[latency_moe_trtllm-torch_compile=True]
48+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_w4a8_mxfp4[fp8-latency-CUTLASS]
49+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_w4a8_mxfp4[fp8-latency-TRITON]
50+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_w4a8_mxfp4[fp8-latency-TRTLLM]
51+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_w4a8_mxfp4[mxfp8-latency-TRTLLM]
52+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_w4a8_mxfp4[mxfp8-latency-CUTLASS]
53+
- accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_w4a16_mxfp4[latency-TRTLLM]
4254
- disaggregated/test_workers.py::test_workers_kv_cache_aware_router_eviction[TinyLlama-1.1B-Chat-v1.0] # nvbugs 5300551
4355
- test_e2e.py::test_ptp_quickstart_advanced[Llama3.1-8B-NVFP4-nvfp4-quantized/Meta-Llama-3.1-8B]
4456
- test_e2e.py::test_ptp_quickstart_advanced[Llama3.1-8B-FP8-llama-3.1-model/Llama-3.1-8B-Instruct-FP8]

tests/integration/test_lists/test-db/l0_gb200.yml

Lines changed: 0 additions & 29 deletions
This file was deleted.

0 commit comments

Comments (0)