diff --git a/scripts/performance/configs/qwen/qwen3_workload_base_configs.py b/scripts/performance/configs/qwen/qwen3_workload_base_configs.py index 0cd9f66c8b..b59a100dcf 100644 --- a/scripts/performance/configs/qwen/qwen3_workload_base_configs.py +++ b/scripts/performance/configs/qwen/qwen3_workload_base_configs.py @@ -31,6 +31,7 @@ BASE_QWEN3_235B_A22B_CONFIG = WorkloadBaseConfig( expert_tensor_parallel_size=1, + moe_flex_dispatcher_backend="deepep", ) @@ -38,6 +39,7 @@ expert_model_parallel_size=8, expert_tensor_parallel_size=1, global_batch_size=512, + moe_flex_dispatcher_backend="deepep", ) BASE_QWEN3_NEXT_80B_A3B_CONFIG = WorkloadBaseConfig(