Skip to content

Commit fcac8e5

Browse files
committed
[0828]temp
1 parent 33923b9 commit fcac8e5

File tree

4 files changed

+14
-7
lines changed

4 files changed

+14
-7
lines changed

lightllm/server/embed_cache/impl/memory_cache_with_redis.py

Lines changed: 9 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -29,16 +29,21 @@ def __init__(self, args) -> None:
2929
# 硬盘里的图片image embed 数量。
3030
self.cache_capacity = args.cache_capacity * 2
3131

32+
# llm 负责release
3233
def release(self, ids: list[int]) -> None:
3334
with self.lock:
3435
for id_ in ids:
3536
self._records[id_].ref -= 1
36-
self.redis_cache.decr(id_)
37-
print(self.redis_cache.stats(), flush=True)
37+
if self.redis_cache.query(str(id_)):
38+
self.redis_cache.decr(str(id_))
39+
print(self.redis_cache.stats(), flush=True)
3840

41+
# vit 负责set
3942
def set_items_embed(self, ids: list[int]) -> None:
40-
for id in ids:
41-
self.redis_cache.insert(str(id))
43+
with self.lock:
44+
for id in ids:
45+
self.redis_cache.insert(str(id))
46+
self._records[id].embed = True
4247

4348
def get_items_embed(self, ids: list[int]) -> list[Optional[bool]]:
4449
ret = []

lightllm/server/visualserver/manager.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -165,7 +165,8 @@ def _recv_reqs(self):
165165
for img in recv_req.multimodal_params.images:
166166
uuids.append(img.uuid)
167167
token_nums.append(img.token_num)
168-
self.cache_client.root.alloc(uuids, token_nums)
168+
record = self.cache_client.root.alloc(uuids, token_nums)
169+
print(f"record is {record}")
169170
return recv_req
170171
else:
171172
return self.vit_receiver.recv_pyobj(zmq.NOBLOCK)
@@ -179,7 +180,7 @@ async def loop_for_netio_req(self):
179180
for _ in range(self.visual_recv_max_count):
180181
recv_req: GroupReqIndexes = self._recv_reqs()
181182
if isinstance(recv_req, GroupReqIndexes):
182-
print(recv_req, flush=True)
183+
# print(recv_req, flush=True)
183184
self.waiting_reqs.append(recv_req)
184185
else:
185186
assert False, f"Error Req Inf {recv_req}"

lightllm/server/visualserver/model_infer/model_rpc.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -114,6 +114,7 @@ def exposed_encode(self, images: List[ImageItem]):
114114

115115
if self.tp_rank_id == 0:
116116
ready_flags = obtain(self.cache_client.root.get_items_embed(uuids))
117+
print(f"ready_flags is {ready_flags}")
117118
ids_to_set = []
118119
for i, ready in enumerate(ready_flags):
119120
if ready:

lightllm/server/visualserver/vit_connect.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -211,7 +211,7 @@ async def _async_get_vit_objs(self) -> Optional[Dict[int, VIT_Obj]]:
211211
logger.exception(f"Error getting VIT instances: {e}")
212212
return None
213213

214-
async def _wait_visual_embed_ready(self, data, timeout_seconds: int = 20):
214+
async def _wait_visual_embed_ready(self, data, timeout_seconds: int = 100):
215215
# 本地模式不需要等待
216216
if not self.remote_vit:
217217
return

0 commit comments

Comments
 (0)