File tree (expand / collapse file tree): 1 file changed, +1 -5 lines changed.
cpp/tensorrt_llm/batch_manager (expand / collapse file tree): 1 file changed, +1 -5 lines changed.
Columns: original file line number | diff line number | diff line change
@@ -1891,11 +1891,7 @@ void KVCacheManager::addSequence(
1891 1891
1892 1892      for (auto const [windowSize, metadata] : mBlockManager.getWindowSizesMetadata())
1893 1893      {
1894      -        auto const maxTokenNum = metadata.maxTokenNum;
1895      -        auto const temporaryAttentionWindow = metadata.temporaryAttentionWindow;
1896      -
1897      -        // Consider the temporaryAttentionWindow when allocating blocks.
1898      -        auto const effectiveInputLength = std::min(inputLength, maxTokenNum + temporaryAttentionWindow);
     1894 +        auto const effectiveInputLength = std::min(inputLength, windowSize);
1899 1895          auto const numContextBlocks = tc::ceilDiv(effectiveInputLength, getTokensPerBlock());
1900 1896          if (!sequence.isCyclic() && mEnableBlockReuse)
1901 1897          {
You can’t perform that action at this time.
0 commit comments