@@ -669,7 +669,12 @@ def _prepare_inputs(
669669 seq_lens = self .seq_lens [:num_reqs ]
670670
671671 common_attn_metadata = CommonAttentionMetadata (
672- query_start_loc = query_start_loc , seq_lens = seq_lens )
672+ query_start_loc = query_start_loc ,
673+ seq_lens = seq_lens ,
674+ num_reqs = num_reqs ,
675+ num_actual_tokens = total_num_scheduled_tokens ,
676+ max_query_len = max_num_scheduled_tokens ,
677+ )
673678
674679 attn_metadata : dict [str , Any ] = {}
675680 # Prepare the attention metadata for each KV cache group and make layers
@@ -690,11 +695,9 @@ def _prepare_inputs(
690695
691696 attn_metadata_i = (
692697 self .attn_metadata_builders [kv_cache_group_id ].build (
693- num_reqs = num_reqs ,
694- num_actual_tokens = total_num_scheduled_tokens ,
695- max_query_len = max_num_scheduled_tokens ,
696698 common_prefix_len = common_prefix_len ,
697- common_attn_metadata = common_attn_metadata ))
699+ common_attn_metadata = common_attn_metadata ,
700+ ))
698701 for layer_name in kv_cache_group_spec .layer_names :
699702 attn_metadata [layer_name ] = attn_metadata_i
700703
@@ -1809,18 +1812,20 @@ def _dummy_run(
18091812 seq_lens = self .seq_lens [:num_reqs ]
18101813
18111814 common_attn_metadata = CommonAttentionMetadata (
1812- query_start_loc = query_start_loc , seq_lens = seq_lens )
1815+ query_start_loc = query_start_loc ,
1816+ seq_lens = seq_lens ,
1817+ num_reqs = num_reqs ,
1818+ num_actual_tokens = num_tokens ,
1819+ max_query_len = num_tokens ,
1820+ )
18131821
18141822 attn_metadata = {}
18151823 for kv_cache_group_id , kv_cache_group_spec in enumerate (
18161824 self .kv_cache_config .kv_cache_groups ):
18171825
18181826 attn_metadata_i = self .attn_metadata_builders [
18191827 kv_cache_group_id ].build_for_cudagraph_capture (
1820- num_reqs = num_reqs ,
1821- num_tokens = num_tokens ,
1822- common_attn_metadata = common_attn_metadata ,
1823- )
1828+ common_attn_metadata )
18241829 for layer_name in kv_cache_group_spec .layer_names :
18251830 attn_metadata [layer_name ] = attn_metadata_i
18261831
0 commit comments