From 9b8949074aa4298c203384a853d4bd83c5ad2228 Mon Sep 17 00:00:00 2001 From: Eran Geva <19514940+MrGeva@users.noreply.github.com> Date: Wed, 3 Dec 2025 03:47:51 -0800 Subject: [PATCH 1/2] Switch AutoDeploy's default allreduce strategy to NCCL Signed-off-by: Eran Geva <19514940+MrGeva@users.noreply.github.com> --- tensorrt_llm/_torch/auto_deploy/config/default.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tensorrt_llm/_torch/auto_deploy/config/default.yaml b/tensorrt_llm/_torch/auto_deploy/config/default.yaml index 42d4e763d979..a2f47ace301b 100644 --- a/tensorrt_llm/_torch/auto_deploy/config/default.yaml +++ b/tensorrt_llm/_torch/auto_deploy/config/default.yaml @@ -79,7 +79,7 @@ transforms: sharding_source: ['manual', 'factory', 'heuristic'] support_partial_config: true sharding_dims: ['tp', 'ep', 'bmm'] - allreduce_strategy: 'AUTO' + allreduce_strategy: 'NCCL' dist_backend: auto requires_shape_prop: true sharding_transform_executor: From 00a6c120be97ae951cdcee33812abc309d5606a3 Mon Sep 17 00:00:00 2001 From: Eran Geva <19514940+MrGeva@users.noreply.github.com> Date: Thu, 4 Dec 2025 08:41:12 -0800 Subject: [PATCH 2/2] changed nano v3 to auto Signed-off-by: Eran Geva <19514940+MrGeva@users.noreply.github.com> --- examples/auto_deploy/nano_v3.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/examples/auto_deploy/nano_v3.yaml b/examples/auto_deploy/nano_v3.yaml index 1f2cfd0c6144..9595018ef341 100644 --- a/examples/auto_deploy/nano_v3.yaml +++ b/examples/auto_deploy/nano_v3.yaml @@ -15,6 +15,7 @@ transforms: detect_sharding: sharding_source: ['factory', 'heuristic'] sharding_dims: ['ep', 'bmm'] + allreduce_strategy: 'AUTO' multi_stream_moe: stage: compile enabled: true