File tree Expand file tree Collapse file tree 1 file changed +1 -5 lines changed
cpp/tensorrt_llm/batch_manager Expand file tree Collapse file tree 1 file changed +1 -5 lines changed
Original file line number Diff line number Diff line change
@@ -1961,11 +1961,7 @@ void KVCacheManager::addSequence(
19611961
19621962 for (auto const [windowSize, metadata] : mBlockManager .getWindowSizesMetadata ())
19631963 {
1964- auto const maxTokenNum = metadata.maxTokenNum ;
1965- auto const temporaryAttentionWindow = metadata.temporaryAttentionWindow ;
1966-
1967- // Consider the temporaryAttentionWindow when allocating blocks.
1968- auto const effectiveInputLength = std::min (inputLength, maxTokenNum + temporaryAttentionWindow);
1964+ auto const effectiveInputLength = std::min (inputLength, windowSize);
19691965 auto const numContextBlocks = tc::ceilDiv (effectiveInputLength, getTokensPerBlock ());
19701966 if (!sequence.isCyclic () && mEnableBlockReuse )
19711967 {
You can’t perform that action at this time.
0 commit comments