diff --git a/test/registered/amd/test_moriep_small.py b/test/registered/amd/test_moriep_small.py index 42547cf9ecfb..0d073b5f3e30 100644 --- a/test/registered/amd/test_moriep_small.py +++ b/test/registered/amd/test_moriep_small.py @@ -400,6 +400,7 @@ def setUpClass(cls): env["SGLANG_MORI_DISPATCH_DTYPE"] = "bf16" env["SGLANG_MORI_NUM_MAX_DISPATCH_TOKENS_PER_RANK"] = "4096" env["MORI_SHMEM_MODE"] = "ISOLATION" # avoid out of symmetric heap memory + env["SGLANG_ENABLE_SPEC_V2"] = "false" cls.process = popen_launch_server( cls.model, @@ -458,6 +459,7 @@ def setUpClass(cls): env["SGLANG_USE_AITER"] = "1" env["SGLANG_MORI_DISPATCH_DTYPE"] = "bf16" env["SGLANG_MORI_NUM_MAX_DISPATCH_TOKENS_PER_RANK"] = "4096" + env["SGLANG_ENABLE_SPEC_V2"] = "false" env["MORI_SHMEM_MODE"] = "ISOLATION" # avoid out of symmetric heap memory # FIXME(billishyahao): enable p2p due to no rdma devices on CI machine # env["MORI_DISABLE_P2P"] = "1"