Skip to content

Commit cda6156

Browse files
authored
Merge pull request #173 from NillionNetwork/fix/vllm_config_url
fix: working URL with both http and https
2 parents 30351e9 + 2fb6bbb commit cda6156

21 files changed

+29 -54 lines changed

docker/compose/docker-compose.deepseek-14b-gpu.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -22,8 +22,7 @@ services:
2222
--tensor-parallel-size 1
2323
--uvicorn-log-level warning
2424
environment:
25-
- SVC_HOST=deepseek_14b_gpu
26-
- SVC_PORT=8000
25+
- SVC_URL=http://deepseek_14b_gpu:8000
2726
- DISCOVERY_URL=redis://redis:6379
2827
- TOOL_SUPPORT=false
2928
volumes:

docker/compose/docker-compose.gemma-27b-gpu.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -27,8 +27,7 @@ services:
2727
--kv-cache-dtype fp8
2828
--uvicorn-log-level warning
2929
environment:
30-
- SVC_HOST=gemma_27b_gpu
31-
- SVC_PORT=8000
30+
- SVC_URL=http://gemma_27b_gpu:8000
3231
- DISCOVERY_URL=redis://redis:6379
3332
- TOOL_SUPPORT=false
3433
- MULTIMODAL_SUPPORT=true

docker/compose/docker-compose.gemma-4b-gpu.ci.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -26,8 +26,7 @@ services:
2626
2727
--uvicorn-log-level warning
2828
environment:
29-
- SVC_HOST=gemma_4b_gpu
30-
- SVC_PORT=8000
29+
- SVC_URL=http://gemma_4b_gpu:8000
3130
- DISCOVERY_URL=redis://redis:6379
3231
- TOOL_SUPPORT=false
3332
- MULTIMODAL_SUPPORT=true

docker/compose/docker-compose.gpt-120b-gpu.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -26,8 +26,7 @@ services:
2626
--tensor-parallel-size 1
2727
--uvicorn-log-level warning
2828
environment:
29-
- SVC_HOST=gpt_120b_gpu
30-
- SVC_PORT=8000
29+
- SVC_URL=http://gpt_120b_gpu:8000
3130
- DISCOVERY_URL=redis://redis:6379
3231
- TOOL_SUPPORT=true
3332
volumes:

docker/compose/docker-compose.gpt-20b-gpu.ci.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -21,8 +21,7 @@ services:
2121
command: >
2222
--model openai/gpt-oss-20b --gpu-memory-utilization 0.95 --max-model-len 10000 --max-num-batched-tokens 10000 --max-num-seqs 2 --tensor-parallel-size 1 --uvicorn-log-level warning --async-scheduling
2323
environment:
24-
- SVC_HOST=gpt_20b_gpu
25-
- SVC_PORT=8000
24+
- SVC_URL=http://gpt_20b_gpu:8000
2625
- DISCOVERY_URL=redis://redis:6379
2726
- TOOL_SUPPORT=true
2827
volumes:

docker/compose/docker-compose.gpt-20b-gpu.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -26,8 +26,7 @@ services:
2626
--tensor-parallel-size 1
2727
--uvicorn-log-level warning
2828
environment:
29-
- SVC_HOST=gpt_20b_gpu
30-
- SVC_PORT=8000
29+
- SVC_URL=http://gpt_20b_gpu:8000
3130
- DISCOVERY_URL=redis://redis:6379
3231
- TOOL_SUPPORT=true
3332
volumes:

docker/compose/docker-compose.llama-1b-cpu.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -17,8 +17,7 @@ services:
1717
--tool-call-parser llama3_json
1818
--uvicorn-log-level warning
1919
environment:
20-
- SVC_HOST=llama_1b_cpu
21-
- SVC_PORT=8000
20+
- SVC_URL=http://llama_1b_cpu:8000
2221
- DISCOVERY_URL=redis://redis:6379
2322
- TOOL_SUPPORT=true
2423
volumes:

docker/compose/docker-compose.llama-1b-gpu.ci.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -30,8 +30,7 @@ services:
3030
--uvicorn-log-level warning
3131
--dtype half
3232
environment:
33-
- SVC_HOST=llama_1b_gpu
34-
- SVC_PORT=8000
33+
- SVC_URL=http://llama_1b_gpu:8000
3534
- DISCOVERY_URL=redis://redis:6379
3635
- TOOL_SUPPORT=true
3736
- CUDA_LAUNCH_BLOCKING=1

docker/compose/docker-compose.llama-1b-gpu.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -28,8 +28,7 @@ services:
2828
--tool-call-parser llama3_json
2929
--uvicorn-log-level warning
3030
environment:
31-
- SVC_HOST=llama_1b_gpu
32-
- SVC_PORT=8000
31+
- SVC_URL=http://llama_1b_gpu:8000
3332
- DISCOVERY_URL=redis://redis:6379
3433
- TOOL_SUPPORT=true
3534
volumes:

docker/compose/docker-compose.llama-3b-gpu.yml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -28,8 +28,7 @@ services:
2828
--tool-call-parser llama3_json
2929
--uvicorn-log-level warning
3030
environment:
31-
- SVC_HOST=llama_3b_gpu
32-
- SVC_PORT=8000
31+
- SVC_URL=http://llama_3b_gpu:8000
3332
- DISCOVERY_URL=redis://redis:6379
3433
- TOOL_SUPPORT=true
3534
volumes:

0 commit comments

Comments (0)