diff --git a/vllm/v1/worker/mamba_utils.py b/vllm/v1/worker/mamba_utils.py index a0a1ae224f2a..56fb02380bf0 100644 --- a/vllm/v1/worker/mamba_utils.py +++ b/vllm/v1/worker/mamba_utils.py @@ -4,13 +4,12 @@ from typing import Any import torch -import triton -import triton.language as tl from vllm.config import CacheConfig from vllm.model_executor.layers.mamba.mamba_utils import ( MambaStateCopyFunc, ) +from vllm.triton_utils import tl, triton from vllm.v1.core.sched.output import SchedulerOutput from vllm.v1.kv_cache_interface import KVCacheConfig, MambaSpec from vllm.v1.worker.gpu_input_batch import CachedRequestState