From b2663c0a0d7231d3b1203f2624b33a4a54ec1952 Mon Sep 17 00:00:00 2001 From: yewentao256 Date: Wed, 8 Oct 2025 18:06:13 -0400 Subject: [PATCH 1/4] fix pre-commit issue Signed-off-by: yewentao256 --- vllm/distributed/device_communicators/all2all.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/vllm/distributed/device_communicators/all2all.py b/vllm/distributed/device_communicators/all2all.py index a22f43cd88d1..7b583148f3fb 100644 --- a/vllm/distributed/device_communicators/all2all.py +++ b/vllm/distributed/device_communicators/all2all.py @@ -377,6 +377,9 @@ class FlashInferAllToAllManager(All2AllManagerBase): All2All communication based on flashinfer kernels. """ + rank: int + world_size: int + def __init__(self, cpu_group): assert has_flashinfer_all2all(), ( "flashinfer all2all module not found. Please install/check flashinfer" From a4f902e2b8f2bb8323bfa8db554cb9fc1d17fed4 Mon Sep 17 00:00:00 2001 From: yewentao256 Date: Thu, 9 Oct 2025 13:46:24 -0700 Subject: [PATCH 2/4] move distributed out Signed-off-by: yewentao256 --- tools/pre_commit/mypy.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tools/pre_commit/mypy.py b/tools/pre_commit/mypy.py index 22ee08535bdd..f22e07bc7b1d 100755 --- a/tools/pre_commit/mypy.py +++ b/tools/pre_commit/mypy.py @@ -27,6 +27,7 @@ FILES = [ "vllm/*.py", "vllm/assets", + "vllm/distributed", "vllm/entrypoints", "vllm/inputs", "vllm/logging_utils", @@ -43,7 +44,6 @@ "tests", "vllm/attention", "vllm/compilation", - "vllm/distributed", "vllm/engine", "vllm/executor", "vllm/inputs", From 569d95020da30db3260498c9acd6d79d90cad1dd Mon Sep 17 00:00:00 2001 From: yewentao256 Date: Thu, 9 Oct 2025 13:51:51 -0700 Subject: [PATCH 3/4] update Signed-off-by: yewentao256 --- tools/pre_commit/mypy.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tools/pre_commit/mypy.py b/tools/pre_commit/mypy.py index f22e07bc7b1d..22ee08535bdd 100755 --- a/tools/pre_commit/mypy.py +++ b/tools/pre_commit/mypy.py @@ -27,7 
+27,6 @@ FILES = [ "vllm/*.py", "vllm/assets", - "vllm/distributed", "vllm/entrypoints", "vllm/inputs", "vllm/logging_utils", @@ -44,6 +43,7 @@ "tests", "vllm/attention", "vllm/compilation", + "vllm/distributed", "vllm/engine", "vllm/executor", "vllm/inputs", From 2e7660307729152560dc62bb668916b3e96b5a64 Mon Sep 17 00:00:00 2001 From: yewentao256 Date: Thu, 9 Oct 2025 14:07:34 -0700 Subject: [PATCH 4/4] add comment Signed-off-by: yewentao256 --- vllm/distributed/device_communicators/all2all.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/vllm/distributed/device_communicators/all2all.py b/vllm/distributed/device_communicators/all2all.py index 7b583148f3fb..a67405f44206 100644 --- a/vllm/distributed/device_communicators/all2all.py +++ b/vllm/distributed/device_communicators/all2all.py @@ -377,6 +377,8 @@ class FlashInferAllToAllManager(All2AllManagerBase): All2All communication based on flashinfer kernels. """ + # These type annotations could be removed after all of the work in + # https://github.com/vllm-project/vllm/issues/26533 is done. rank: int world_size: int