diff --git a/vllm/model_executor/layers/fused_moe/router/aiter_shared_routed_fused_moe_router.py b/vllm/model_executor/layers/fused_moe/router/aiter_shared_routed_fused_moe_router.py index 9d92f570df5a..48a9596a920e 100644 --- a/vllm/model_executor/layers/fused_moe/router/aiter_shared_routed_fused_moe_router.py +++ b/vllm/model_executor/layers/fused_moe/router/aiter_shared_routed_fused_moe_router.py @@ -73,7 +73,7 @@ def _compute_routing( "Number of tokens mismatch" ) - from vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe import ( + from vllm.model_executor.layers.fused_moe.experts.rocm_aiter_moe import ( aiter_topK_meta_data, ) @@ -127,7 +127,7 @@ def _compute_routing( ) if aiter_topK_meta_data is not None: - from vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe import ( + from vllm.model_executor.layers.fused_moe.experts.rocm_aiter_moe import ( inject_shared_expert_weights, )