File tree (expand / collapse) — 2 files changed: +5 −1 lines changed
include/tensorrt_llm/batch_manager
tensorrt_llm/batch_manager
File tree (expand / collapse) — 2 files changed: +5 −1 lines changed
Original file line number | Diff line number | Diff line change
@@ -183,6 +183,10 @@ class BlockRange
183 183               auto windowSize = cacheManager.getBlockManager().getPoolWindowSize(poolIdx);
184 184               mPoolsPerWindow[windowSize].push_back(cacheManager.getBlockManager().getPrimaryPool(poolIdx));
185 185           }
    186 +         if (cacheManager.isEnableIndexerKCache())
    187 +         {
    188 +             mIndexerKCachePool = cacheManager.getIndexerKCachePool();
    189 +         }
186 190       }
187 191
188 192       BlockRange(BaseKVCacheManager const& cacheManager, LlmRequest::RequestIdType requestId)
Original file line number | Diff line number | Diff line change
@@ -806,7 +806,7 @@ class CacheReceiver::Impl
806 806
807 807       RequestInfo requestInfo(requestId, mSelfState);
808 808
809     -     if (mFormatter->getCacheManager()->getBlockManager().getNumPools() == 1)
    809 +     if (!mFormatter->getCacheManager()->getBlockManager().isVariableWindow())
810 810       {
811 811           auto* cacheManager = mFormatter->getCacheManager();
812 812           auto beam = 0;
You can’t perform that action at this time.
0 commit comments