File tree: 1 file changed, +1 −5 lines changed.
cpp/tensorrt_llm/batch_manager: 1 file changed, +1 −5 lines changed.
Columns: original file line number | diff line number | diff line change
@@ -1891,11 +1891,7 @@ void KVCacheManager::addSequence(
18911891
18921892    for  (auto  const  [windowSize, metadata] : mBlockManager .getWindowSizesMetadata ())
18931893    {
1894-         auto  const  maxTokenNum = metadata.maxTokenNum ;
1895-         auto  const  temporaryAttentionWindow = metadata.temporaryAttentionWindow ;
1896- 
1897-         //  Consider the temporaryAttentionWindow when allocating blocks.
1898-         auto  const  effectiveInputLength = std::min (inputLength, maxTokenNum + temporaryAttentionWindow);
1894+         auto  const  effectiveInputLength = std::min (inputLength, windowSize);
18991895        auto  const  numContextBlocks = tc::ceilDiv (effectiveInputLength, getTokensPerBlock ());
19001896        if  (!sequence.isCyclic () && mEnableBlockReuse )
19011897        {
 
 
   
 
     
   
   
          
    
    
     
    
      
     
     
    You can’t perform that action at this time.
  
 
    
  
    
      
        
     
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments