diff --git a/deploy/docker-compose/addons/vllm_semantic_router_pipe.py b/deploy/docker-compose/addons/vllm_semantic_router_pipe.py index 3ddbf3f8..a1578abf 100644 --- a/deploy/docker-compose/addons/vllm_semantic_router_pipe.py +++ b/deploy/docker-compose/addons/vllm_semantic_router_pipe.py @@ -18,7 +18,7 @@ class Pipeline: class Valves(BaseModel): # vLLM Semantic Router endpoint URL - vsr_base_url: str = "http://envoy-proxy:8801/v1" + vsr_base_url: str = "http://envoy-proxy:8801" # API key for authentication (if required) api_key: str = "" @@ -45,7 +45,7 @@ def __init__(self): # Initialize valves self.valves = self.Valves( **{ - "vsr_base_url": "http://envoy-proxy:8801/v1", + "vsr_base_url": "http://envoy-proxy:8801", "api_key": "", "show_vsr_info": True, "log_vsr_info": True, diff --git a/tools/mock-vllm/Dockerfile b/tools/mock-vllm/Dockerfile index 2af352bb..63292c9d 100644 --- a/tools/mock-vllm/Dockerfile +++ b/tools/mock-vllm/Dockerfile @@ -6,10 +6,10 @@ RUN apt-get update && apt-get install -y --no-install-recommends \ curl \ && rm -rf /var/lib/apt/lists/* -COPY src/training/requirements.txt ./ +COPY requirements.txt ./ RUN pip install --no-cache-dir -r requirements.txt -COPY app.py ./ +COPY app.py ./ EXPOSE 8000