fix for navi

fsx950223 · fsx950223 · commit dd36f7962e25 · 2025-07-02T05:24:57.000Z
Signed-off-by: fsx950223 &lt;fsx950223@outlook.com&gt;
diff --git a/vllm/attention/ops/chunked_prefill_paged_decode.py b/vllm/attention/ops/chunked_prefill_paged_decode.py
@@ -9,6 +9,7 @@
 
 import torch
 
+from vllm import _custom_ops as ops
 from vllm.platforms import current_platform
 from vllm.platforms.rocm import use_rocm_custom_paged_attention
 from vllm.triton_utils import tl, triton
@@ -304,7 +305,7 @@ def chunked_prefill_paged_decode(
         )
         max_logits = torch.empty_like(exp_sums)
 
-        torch.ops.aiter.paged_attention_rocm(
+        ops.paged_attention_rocm(
             output,
             exp_sums,
             max_logits,
@@ -315,9 +316,10 @@ def chunked_prefill_paged_decode(
             num_kv_heads,
             scale=sm_scale,
             block_tables=block_table,
-            context_lens=seq_lens,
+            seq_lens=seq_lens,
+            query_start_loc=query_start_loc,
             block_size=block_size,
-            max_context_len=max_seq_len,
+            max_seq_len=max_seq_len,
             alibi_slopes=alibi_slopes,
             kv_cache_dtype=kv_cache_dtype,
             k_scale=k_scale,