@@ -22,9 +22,9 @@ class Record(object):
2222 token_id : int
2323 token_num : int
2424
25-
2625@CacheManagerFactory .register ("naive" )
2726class InMemoryCache (CacheManager ):
27+
2828 def __init__ (self , args ) -> None :
2929 self ._records = dict ()
3030 self ._md5_to_record = dict ()
@@ -36,8 +36,9 @@ def __init__(self, args) -> None:
3636 self .lock = threading .Lock ()
3737
3838 from lightllm .server .tokenizer import get_tokenizer
39-
40- tokenizer = get_tokenizer (args .model_dir , args .tokenizer_mode , trust_remote_code = args .trust_remote_code )
39+ tokenizer = get_tokenizer (
40+ args .model_dir , args .tokenizer_mode , trust_remote_code = args .trust_remote_code
41+ )
4142 self .cur_token_id = tokenizer .vocab_size + 10000
4243
4344 def _clear (self ):
@@ -69,6 +70,7 @@ def alloc(self, md5sum: str, token_num: int) -> dict:
6970 self ._clear ()
7071 if self .occupied >= self .capacity :
7172 return None
73+
7274 id = uuid .uuid1 ()
7375 id = id .int
7476 record = Record (
@@ -93,7 +95,11 @@ def alloc(self, md5sum: str, token_num: int) -> dict:
9395 record .visittime = t
9496 record .ref += 1
9597
96- return {"id" : record .id , "token_id" : record .token_id , "token_num" : record .token_num }
98+ return {
99+ "id" : record .id ,
100+ "token_id" : record .token_id ,
101+ "token_num" : record .token_num
102+ }
97103
98104 def release (self , id : int ) -> None :
99105 with self .lock :
0 commit comments