We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1dd2338 commit dd56058Copy full SHA for dd56058
vllm/v1/engine/mm_input_cache.py
@@ -51,6 +51,13 @@ def get_and_update_p0(
51
full_mm_inputs = list[Optional[MultiModalKwargs]]()
52
for mm_input, mm_hash in zip(mm_inputs, mm_hashes):
53
if mm_hash in self.mm_cache:
54
+ # Client and Server must be exactly the same (see description
55
+ # at the top of this file).
56
+ # The `in` check above doesn't update the access time, by design.
57
+ # But the server side makes a direct access, which updates the access time.
58
+ # So we make a dummy access here to update the access time and keep
59
+ # the LRU order of the caches consistent.
60
+ _ = self.mm_cache[mm_hash]
61
mm_input = None
62
else:
63
self.mm_cache[mm_hash] = mm_input
0 commit comments