diff --git a/tests/integration/test_lists/waives.txt b/tests/integration/test_lists/waives.txt index 8faf53dde9b..4d3c94e452e 100644 --- a/tests/integration/test_lists/waives.txt +++ b/tests/integration/test_lists/waives.txt @@ -357,3 +357,7 @@ accuracy/test_cli_flow.py::TestMinitron4BBase::test_fp8 SKIP (https://nvbugs/560 examples/test_gpt.py::test_llm_minitron_fp8_with_pseudo_loras[4b] SKIP (https://nvbugs/5606233) disaggregated/test_disaggregated_single_gpu.py::test_disaggregated_simple_deepseek[True-False-DeepSeek-V3-Lite-fp8/fp8] SKIP (https://nvbugs/5626197) disaggregated/test_disaggregated_single_gpu.py::test_disaggregated_simple_deepseek[True-True-DeepSeek-V3-Lite-fp8/fp8] SKIP (https://nvbugs/5628952) +cpp/test_e2e.py::test_benchmarks[t5-90] SKIP (https://nvbugs/5630196) +accuracy/test_llm_api_pytorch.py::TestQwen3_235B_A22B::test_nvfp4_4gpus[latency_moe_trtllm_eagle3] SKIP (https://nvbugs/5630700) +accuracy/test_disaggregated_serving.py::TestQwen3_8B::test_nixl_backend SKIP (https://nvbugs/5628952) +accuracy/test_disaggregated_serving.py::TestDeepSeekV3Lite::test_guided_decoding[xgrammar-mtp_nextn=2] SKIP (https://nvbugs/5628952) diff --git a/tests/unittest/_torch/thop/parallel/test_mamba2_chunk_ss_update.py b/tests/unittest/_torch/thop/parallel/test_mamba2_chunk_ss_update.py index e5d9e7e9fde..17c28f75fac 100644 --- a/tests/unittest/_torch/thop/parallel/test_mamba2_chunk_ss_update.py +++ b/tests/unittest/_torch/thop/parallel/test_mamba2_chunk_ss_update.py @@ -363,6 +363,7 @@ def test_mamba2_chunk_scan_selective_state_update(dim, headdim, ngroups, dstate, atol=atol[dtype]) +@pytest.mark.skip(reason="https://nvbugs/5606178") @pytest.mark.parametrize("mamba_chunk_size", [8, 256]) @pytest.mark.parametrize("seqlens", [ (16, 2, 8, 13),