|
1 | 1 | #!/bin/bash
|
2 |
| -if [[ $# -ne 2 ]]; then |
3 |
| - echo "Usage $0 <router port> <backend url>" |
| 2 | +if [[ $# -ne 1 ]]; then |
| 3 | + echo "Usage $0 <router port>" |
4 | 4 | exit 1
|
5 | 5 | fi
|
6 | 6 |
|
|
15 | 15 | # --log-stats
|
16 | 16 |
|
17 | 17 | # Use this command when testing with static service discovery
|
18 |
| -# python3 -m vllm_router.app --port "$1" \ |
19 |
| -# --service-discovery static \ |
20 |
| -# --static-backends "http://localhost:8000" \ |
21 |
| -# --static-models "facebook/opt-125m" \ |
22 |
| -# --static-model-types "chat" \ |
23 |
| -# --log-stats \ |
24 |
| -# --log-stats-interval 10 \ |
25 |
| -# --engine-stats-interval 10 \ |
26 |
| -# --request-stats-window 10 \ |
27 |
| -# --request-stats-window 10 \ |
28 |
| -# --routing-logic roundrobin |
| 18 | +python3 -m vllm_router.app --port "$1" \ |
| 19 | + --service-discovery static \ |
| 20 | + --static-backends "http://localhost:8000" \ |
| 21 | + --static-models "facebook/opt-125m" \ |
| 22 | + --static-model-types "chat" \ |
| 23 | + --log-stats \ |
| 24 | + --log-stats-interval 10 \ |
| 25 | + --engine-stats-interval 10 \ |
| 26 | + --request-stats-window 10 \ |
| 27 | + --request-stats-window 10 \ |
| 28 | + --routing-logic roundrobin |
29 | 29 |
|
30 | 30 | # Use this command when testing with roundrobin routing logic
|
31 | 31 | #python3 router.py --port "$1" \
|
|
35 | 35 | # --engine-stats-interval 10 \
|
36 | 36 | # --log-stats
|
37 | 37 | #
|
38 |
| - |
39 |
| -# Use this command when testing with whisper transcription |
40 |
| -ROUTER_PORT=$1 |
41 |
| -BACKEND_URL=$2 |
42 |
| - |
43 |
| -python3 -m vllm_router.app \ |
44 |
| - --host 0.0.0.0 \ |
45 |
| - --port "${ROUTER_PORT}" \ |
46 |
| - --service-discovery static \ |
47 |
| - --static-backends "${BACKEND_URL}" \ |
48 |
| - --static-models "openai/whisper-small" \ |
49 |
| - --static-model-types "transcription" \ |
50 |
| - --routing-logic roundrobin \ |
51 |
| - --log-stats \ |
52 |
| - --engine-stats-interval 10 \ |
53 |
| - --request-stats-window 10 |
0 commit comments