Skip to content

Commit 203d4f8

Browse files
authored
[Core][Bugfix] cache len of tokenizer (#3741)
1 parent 991143c commit 203d4f8

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

vllm/transformers_utils/tokenizer.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -26,6 +26,7 @@ def get_cached_tokenizer(
2626
tokenizer_all_special_tokens_extended = (
2727
tokenizer.all_special_tokens_extended)
2828
tokenizer_all_special_tokens = set(tokenizer.all_special_tokens)
29+
tokenizer_len = len(tokenizer)
2930

3031
class CachedTokenizer(tokenizer.__class__):
3132

@@ -41,6 +42,9 @@ def all_special_tokens(self):
4142
def all_special_tokens_extended(self):
4243
return tokenizer_all_special_tokens_extended
4344

45+
def __len__(self):
46+
return tokenizer_len
47+
4448
CachedTokenizer.__name__ = f"Cached{tokenizer.__class__.__name__}"
4549

4650
tokenizer.__class__ = CachedTokenizer

0 commit comments

Comments
 (0)