Skip to content

Commit 4f96308

Browse files
author
wangzaijun
committed
fix
1 parent 1cccbb9 commit 4f96308

File tree

3 files changed

+7
-2
lines changed

3 files changed

+7
-2
lines changed

lightllm/models/qwen2_vl/vision_process.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -162,6 +162,8 @@ def rescale_and_normalize(
162162

163163
def preprocess(self, image) -> Tuple[torch.Tensor, torch.Tensor]:
164164
image_arr = np.asarray(image, dtype=np.uint8)
165+
# TODO: investigate why creating the tensor directly on CUDA causes OOM
166+
# image_data = torch.from_numpy(image_arr).permute(2, 0, 1).contiguous().to("cuda", non_blocking=True)
165167
image_data = torch.from_numpy(image_arr).permute(2, 0, 1)
166168

167169
grouped_images, grouped_images_index = group_images_by_shape(

lightllm/server/api_cli.py

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -359,7 +359,10 @@ def make_argument_parser() -> argparse.ArgumentParser:
359359
"--visual_send_batch_size",
360360
type=int,
361361
default=1,
362-
help="number of images embedding to send to llm process in each batch",
362+
help="""
363+
number of images embedding to send to llm process in each batch,
364+
bigger size can improve throughput but increase latency possibly in some cases
365+
""",
363366
)
364367
parser.add_argument(
365368
"--visual_gpu_ids", nargs="+", type=int, default=None, help="List of GPU IDs to use, e.g., 0 1 2"

lightllm/server/visualserver/manager.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -57,7 +57,7 @@ def __init__(
5757
self.trust_remote_code = args.trust_remote_code
5858
self.args = args
5959
self.visual_model_rpc_ports = visual_model_rpc_ports
60-
self.send_batch_size = min(args.visual_send_batch_size, args.cache_capacity, args.visual_infer_batch_size)
60+
self.send_batch_size = args.visual_send_batch_size
6161
self.shm_req_manager = ShmReqManager()
6262

6363
async def wait_to_model_ready(self):

0 commit comments

Comments
 (0)