From e386b2da4fdab6f54c13598b39ab3e1d2e7f055d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?oliver=20k=C3=B6nig?= Date: Sun, 22 Feb 2026 20:29:21 +0000 Subject: [PATCH] fix: all2all for qwen3-next H100 MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: oliver könig --- scripts/performance/configs/qwen/qwen3_llm_pretrain.py | 1 + 1 file changed, 1 insertion(+) diff --git a/scripts/performance/configs/qwen/qwen3_llm_pretrain.py b/scripts/performance/configs/qwen/qwen3_llm_pretrain.py index 2eecd74d59..c7a295dbc3 100644 --- a/scripts/performance/configs/qwen/qwen3_llm_pretrain.py +++ b/scripts/performance/configs/qwen/qwen3_llm_pretrain.py @@ -433,6 +433,7 @@ def qwen3_next_80b_a3b_pretrain_config_h100( cfg = qwen3_next_80b_a3b_pretrain_config() cfg.mixed_precision = precision_config cfg.comm_overlap = CommOverlapConfig(tp_comm_overlap=True) + cfg.model.moe_token_dispatcher_type = "alltoall" set_qwen3_next_common_configs(cfg) set_workload_base_configs(cfg, base_cfg)