@@ -88,6 +88,12 @@ def __init__(self) -> None:
88
88
89
89
self ._processing_cache = ProcessingCache (VLLM_MM_INPUT_CACHE_GIB )
90
90
91
def reset_processor_cache(self) -> bool:
    """Clear the multi-modal processing cache held by this object.

    Calls ``reset()`` on ``self._processing_cache``.

    Returns:
        Always ``True``; the return value signals that the reset call
        completed without raising.
    """
    cache = self._processing_cache
    cache.reset()
    return True  # Success
96
+
91
97
@deprecated ("Legacy input processor/mapper pipeline has been removed. "
92
98
"Please update your model runner to use "
93
99
"`seq_group_metadata.multi_modal_data` directly without "
@@ -106,7 +112,7 @@ def get_max_tokens_per_item_by_modality(
106
112
if not model_config .is_multimodal_model :
107
113
return {}
108
114
109
- processor = self .create_processor (model_config , disable_cache = True )
115
+ processor = self .create_processor (model_config , disable_cache = False )
110
116
profiler = MultiModalProfiler (processor )
111
117
112
118
seq_len = model_config .max_model_len
@@ -190,7 +196,7 @@ def get_mm_limits_per_prompt(
190
196
if not model_config .is_multimodal_model :
191
197
return {}
192
198
193
- processor = self .create_processor (model_config , disable_cache = True )
199
+ processor = self .create_processor (model_config , disable_cache = False )
194
200
profiler = MultiModalProfiler (processor )
195
201
return profiler .get_mm_limits ()
196
202
@@ -286,7 +292,7 @@ def get_decoder_dummy_data(
286
292
287
293
The model is identified by ``model_config``.
288
294
"""
289
- processor = self .create_processor (model_config , disable_cache = True )
295
+ processor = self .create_processor (model_config , disable_cache = False )
290
296
profiler = MultiModalProfiler (processor )
291
297
dummy_data = profiler .get_decoder_dummy_data (seq_len , mm_counts )
292
298
@@ -310,7 +316,7 @@ def get_encoder_dummy_data(
310
316
311
317
The model is identified by ``model_config``.
312
318
"""
313
- processor = self .create_processor (model_config , disable_cache = True )
319
+ processor = self .create_processor (model_config , disable_cache = False )
314
320
profiler = MultiModalProfiler (processor )
315
321
dummy_data = profiler .get_encoder_dummy_data (seq_len , mm_counts )
316
322
0 commit comments