Skip to content

Commit 58a1bb7

Browse files
authored
Merge pull request #4178 from myhloli/dev
refactor: update comments in compose.yaml for clarity and guidance on engine parameters
2 parents 8aae656 + 5f86767 commit 58a1bb7

File tree

1 file changed

+11
-55
lines changed

1 file changed

+11
-55
lines changed

docker/compose.yaml

Lines changed: 11 additions & 55 deletions
Original file line numberDiff line numberDiff line change
@@ -10,29 +10,11 @@ services:
1010
MINERU_MODEL_SOURCE: local
1111
entrypoint: mineru-openai-server
1212
command:
13-
# ==================== Engine Selection ====================
14-
# WARNING: Only ONE engine can be enabled at a time!
15-
# Choose 'vllm' OR 'lmdeploy' (uncomment one line below)
1613
--engine vllm
17-
# --engine lmdeploy
18-
19-
# ==================== vLLM Engine Parameters ====================
20-
# Uncomment if using --engine vllm
2114
--host 0.0.0.0
2215
--port 30000
23-
# Multi-GPU configuration (increase throughput)
24-
# --data-parallel-size 2
25-
# Single GPU memory optimization (reduce if VRAM insufficient)
26-
# --gpu-memory-utilization 0.5 # Try 0.4 or lower if issues persist
27-
28-
# ==================== LMDeploy Engine Parameters ====================
29-
# Uncomment if using --engine lmdeploy
30-
# --server-name 0.0.0.0
31-
# --server-port 30000
32-
# Multi-GPU configuration (increase throughput)
33-
# --dp 2
34-
# Single GPU memory optimization (reduce if VRAM insufficient)
35-
# --cache-max-entry-count 0.5 # Try 0.4 or lower if issues persist
16+
# --data-parallel-size 2 # If using multiple GPUs, increase throughput using vllm's multi-GPU parallel mode
17+
# --gpu-memory-utilization 0.5 # If running on a single GPU and encountering VRAM shortage, use this parameter to reduce the KV cache size; if VRAM issues persist, try lowering it further to `0.4` or below.
3618
ulimits:
3719
memlock: -1
3820
stack: 67108864
@@ -58,21 +40,11 @@ services:
5840
MINERU_MODEL_SOURCE: local
5941
entrypoint: mineru-api
6042
command:
61-
# ==================== Server Configuration ====================
6243
--host 0.0.0.0
6344
--port 8000
64-
65-
# ==================== vLLM Engine Parameters ====================
66-
# Multi-GPU configuration
67-
# --data-parallel-size 2
68-
# Single GPU memory optimization
69-
# --gpu-memory-utilization 0.5 # Try 0.4 or lower if VRAM insufficient
70-
71-
# ==================== LMDeploy Engine Parameters ====================
72-
# Multi-GPU configuration
73-
# --dp 2
74-
# Single GPU memory optimization
75-
# --cache-max-entry-count 0.5 # Try 0.4 or lower if VRAM insufficient
45+
# parameters for vllm-engine
46+
# --data-parallel-size 2 # If using multiple GPUs, increase throughput using vllm's multi-GPU parallel mode
47+
# --gpu-memory-utilization 0.5 # If running on a single GPU and encountering VRAM shortage, use this parameter to reduce the KV cache size; if VRAM issues persist, try lowering it further to `0.4` or below.
7648
ulimits:
7749
memlock: -1
7850
stack: 67108864
@@ -96,30 +68,14 @@ services:
9668
MINERU_MODEL_SOURCE: local
9769
entrypoint: mineru-gradio
9870
command:
99-
# ==================== Gradio Server Configuration ====================
10071
--server-name 0.0.0.0
10172
--server-port 7860
102-
103-
# ==================== Gradio Feature Settings ====================
104-
# --enable-api false # Disable API endpoint
105-
# --max-convert-pages 20 # Limit conversion page count
106-
107-
# ==================== Engine Selection ====================
108-
# WARNING: Only ONE engine can be enabled at a time!
109-
110-
# Option 1: vLLM Engine (recommended for most users)
111-
--enable-vllm-engine true
112-
# Multi-GPU configuration
113-
# --data-parallel-size 2
114-
# Single GPU memory optimization
115-
# --gpu-memory-utilization 0.5 # Try 0.4 or lower if VRAM insufficient
116-
117-
# Option 2: LMDeploy Engine
118-
# --enable-lmdeploy-engine true
119-
# Multi-GPU configuration
120-
# --dp 2
121-
# Single GPU memory optimization
122-
# --cache-max-entry-count 0.5 # Try 0.4 or lower if VRAM insufficient
73+
--enable-vllm-engine true # Enable the vllm engine for Gradio
74+
# --enable-api false # If you want to disable the API, set this to false
75+
# --max-convert-pages 20 # If you want to limit the number of pages for conversion, set this to a specific number
76+
# parameters for vllm-engine
77+
# --data-parallel-size 2 # If using multiple GPUs, increase throughput using vllm's multi-GPU parallel mode
78+
# --gpu-memory-utilization 0.5 # If running on a single GPU and encountering VRAM shortage, use this parameter to reduce the KV cache size; if VRAM issues persist, try lowering it further to `0.4` or below.
12379
ulimits:
12480
memlock: -1
12581
stack: 67108864

0 commit comments

Comments
 (0)