vllm-project
diff --git a/‎dashboard/Dockerfile‎
Lines changed: 25 additions & 0 deletions b/‎dashboard/Dockerfile‎
Lines changed: 25 additions & 0 deletions
diff --git a/‎dashboard/frontend/src/pages/PlaygroundPage.tsx‎
Lines changed: 9 additions & 1 deletion b/‎dashboard/frontend/src/pages/PlaygroundPage.tsx‎
Lines changed: 9 additions & 1 deletion
diff --git a/‎deploy/openshift/README.md‎
Lines changed: 153 additions & 19 deletions b/‎deploy/openshift/README.md‎
Lines changed: 153 additions & 19 deletions
diff --git a/‎deploy/openshift/cleanup-openshift.sh‎
Lines changed: 48 additions & 3 deletions b/‎deploy/openshift/cleanup-openshift.sh‎
Lines changed: 48 additions & 3 deletions
diff --git a/‎deploy/openshift/config-openshift.yaml‎
Lines changed: 3 additions & 3 deletions b/‎deploy/openshift/config-openshift.yaml‎
Lines changed: 3 additions & 3 deletions
@@ -0,0 +1,25 @@
+# Stage 1 (frontend-builder): install dependencies with npm ci and run the frontend build on Node 18
+FROM node:18-alpine AS frontend-builder
+WORKDIR /app/frontend
+COPY frontend/package*.json ./
+RUN npm ci
+COPY frontend/ ./
+RUN npm run build
+
+# Stage 2 (backend-builder): download Go modules and compile the dashboard-server binary for Linux with CGO disabled
+FROM golang:1.21-alpine AS backend-builder
+WORKDIR /app/backend
+COPY backend/go.* ./
+RUN go mod download
+COPY backend/ ./
+RUN CGO_ENABLED=0 GOOS=linux go build -o dashboard-server .
+
+# Stage 3 (runtime): Alpine image holding only the server binary and the built frontend (served from DASHBOARD_STATIC_DIR)
+FROM alpine:3.18
+RUN apk add --no-cache ca-certificates
+WORKDIR /app
+COPY --from=backend-builder /app/backend/dashboard-server .
+COPY --from=frontend-builder /app/frontend/dist ./frontend
+ENV DASHBOARD_STATIC_DIR=./frontend
+EXPOSE 8700
+CMD ["./dashboard-server"]
@@ -2,7 +2,15 @@ import React, { useState, useEffect } from 'react'
 import styles from './PlaygroundPage.module.css'
 
 const PlaygroundPage: React.FC = () => {
-  const [openWebUIUrl] = useState('http://localhost:3001')
+  // Build the OpenWebUI URL from the page's protocol and hostname (the port is not carried over).
+  // Assumes the two hosts differ only by 'dashboard' vs 'openwebui'; replace() swaps the first match and is a no-op if absent.
+  const getOpenWebUIUrl = () => {
+    const hostname = window.location.hostname
+    const openwebuiHost = hostname.replace('dashboard', 'openwebui')
+    return `${window.location.protocol}//${openwebuiHost}`
+  }
+
+  const [openWebUIUrl] = useState(getOpenWebUIUrl())
   const [currentUrl, setCurrentUrl] = useState('')
 
   // Auto-load on mount
 
@@ -9,26 +9,54 @@ This directory contains OpenShift-specific deployment manifests for the vLLM Sem
 - OpenShift cluster access
 - `oc` CLI tool configured and logged in
 - Cluster admin privileges (or permissions to create namespaces and routes)
+- Local checkout of this repository (the dashboard image is built from the local `dashboard/` directory)
 
-### Automated Deployment (Recommended)
+### One-Click Full Deployment (Recommended)
 
-The deployment script automatically handles everything including dynamic IP configuration:
+Deploy the complete stack including semantic-router, vLLM models, and all observability components:
 
 ```bash
 cd deploy/openshift
 ./deploy-to-openshift.sh
 ```
 
-This script will:
+This script sets up the following:
+
+**Core Components:**
 
 - ✅ Build the llm-katan image from Dockerfile
 - ✅ Create namespace and PVCs
-- ✅ Deploy vLLM model services (model-a and model-b)
+- ✅ Deploy vLLM model services (Model-A and Model-B)
 - ✅ Auto-discover Kubernetes service ClusterIPs
 - ✅ Generate configuration with actual IPs (portable across clusters)
-- ✅ Deploy semantic-router with Envoy proxy
+- ✅ Deploy semantic-router with Envoy proxy sidecar
 - ✅ Create OpenShift routes for external access
 
+**Observability Stack:**
+
+- ✅ Dashboard (built from local source with PlaygroundPage fix)
+- ✅ OpenWebUI playground for testing models
+- ✅ Grafana for metrics visualization
+- ✅ Prometheus for metrics collection
+
+### Minimal Deployment (Core Only)
+
+If you only want the core semantic-router and vLLM models without observability:
+
+```bash
+cd deploy/openshift
+./deploy-to-openshift.sh --no-observability
+```
+
+This deploys only the core components, without Dashboard, OpenWebUI, Grafana, or Prometheus.
+
+### Command Line Options
+
+| Flag | Description |
+|------|-------------|
+| `--no-observability` | Skip deploying Dashboard, OpenWebUI, Grafana, and Prometheus |
+| `--help`, `-h` | Show help message |
+
 ### Manual Deployment (Advanced)
 
 If you prefer manual deployment or need to customize:
@@ -53,23 +81,67 @@ If you prefer manual deployment or need to customize:
 
 4. **Note:** You'll need to manually configure ClusterIPs in `config-openshift.yaml`
 
+## How Dashboard Build Works
+
+The deployment script uses OpenShift's **binary build** approach for the dashboard:
+
+1. Creates a BuildConfig with Docker strategy
+2. Uploads the local `dashboard/` directory as build source
+3. Builds the image inside OpenShift (no local Docker required)
+4. Pushes to OpenShift internal registry
+5. Deploys using the built image
+
+### Why Binary Build?
+
+- ✅ No local Docker daemon required
+- ✅ Works on any machine with `oc` CLI
+- ✅ Builds with your local code changes (including PlaygroundPage fix)
+- ✅ Automatically integrated with OpenShift registry
+- ✅ Works across different OpenShift clusters
+
+### Updating Dashboard
+
+If you make changes to the dashboard code, rebuild and redeploy:
+
+```bash
+# Rebuild dashboard image from local source
+cd dashboard
+oc start-build dashboard-custom --from-dir=. --follow -n vllm-semantic-router-system
+
+# Restart deployment to use new image
+oc rollout restart deployment/dashboard -n vllm-semantic-router-system
+```
+
 ## Accessing Services
 
-After deployment, the services will be accessible via OpenShift Routes:
+After deployment, the script will display URLs for all services. Routes are automatically generated with cluster-appropriate hostnames.
 
 ### Get Route URLs
 
 ```bash
-# Classification API (HTTP REST)
+# Core Services
 oc get route semantic-router-api -n vllm-semantic-router-system -o jsonpath='{.spec.host}'
-
-# gRPC API
 oc get route semantic-router-grpc -n vllm-semantic-router-system -o jsonpath='{.spec.host}'
-
-# Metrics
 oc get route semantic-router-metrics -n vllm-semantic-router-system -o jsonpath='{.spec.host}'
+
+# Observability (if deployed)
+oc get route dashboard -n vllm-semantic-router-system -o jsonpath='{.spec.host}'
+oc get route openwebui -n vllm-semantic-router-system -o jsonpath='{.spec.host}'
+oc get route grafana -n vllm-semantic-router-system -o jsonpath='{.spec.host}'
+oc get route prometheus -n vllm-semantic-router-system -o jsonpath='{.spec.host}'
+```
+
+### Dashboard Playground
+
+Access the OpenWebUI playground through the dashboard:
+
+```bash
+DASHBOARD_URL=$(oc get route dashboard -n vllm-semantic-router-system -o jsonpath='{.spec.host}')
+echo "Playground: https://$DASHBOARD_URL/playground"
 ```
 
+The playground derives the OpenWebUI URL by replacing `dashboard` with `openwebui` in the current hostname, so no configuration is needed as long as the dashboard and OpenWebUI routes share the same hostname pattern.
+
 ### Example Usage
 
 ```bash
@@ -133,20 +205,82 @@ curl https://$METRICS_ROUTE/metrics
 
 ## Cleanup
 
-Remove all resources:
+### Quick Cleanup
+
+Remove the entire namespace and all resources (recommended):
 
 ```bash
-oc delete -k deploy/openshift/
+cd deploy/openshift
+./cleanup-openshift.sh
 ```
 
-Or remove individual components:
+If not already logged in to OpenShift:
 
 ```bash
-oc delete -f deploy/openshift/routes.yaml
-oc delete -f deploy/openshift/service.yaml
-oc delete -f deploy/openshift/deployment.yaml
-oc delete -f deploy/openshift/pvc.yaml
-oc delete -f deploy/openshift/namespace.yaml
+oc login <your-cluster-url>
+./cleanup-openshift.sh
+```
+
+### Cleanup Options
+
+The cleanup script supports different cleanup levels:
+
+| Level | What Gets Deleted | What's Preserved |
+|-------|------------------|------------------|
+| `deployment` | Deployments, services, routes, configmaps, buildconfigs | Namespace, PVCs |
+| `namespace` (default) | Entire namespace and all resources | Nothing |
+| `all` | Namespace + cluster-wide resources | Nothing |
+
+**Examples:**
+
+```bash
+# Remove everything (default)
+./cleanup-openshift.sh
+
+# Keep namespace and PVCs, remove only deployments
+./cleanup-openshift.sh --level deployment
+
+# Dry run to see what would be deleted
+./cleanup-openshift.sh --dry-run
+
+# Force cleanup without confirmation
+./cleanup-openshift.sh --force
+```
+
+### What Gets Cleaned Up
+
+The cleanup script removes:
+
+**Core Components:**
+
+- semantic-router deployment
+- vLLM model deployments (Model-A, Model-B)
+- All services and routes
+- ConfigMaps (router config, envoy config)
+- BuildConfigs and ImageStreams (llm-katan, dashboard-custom)
+
+**Observability Stack:**
+
+- Dashboard deployment
+- OpenWebUI deployment
+- Grafana deployment
+- Prometheus deployment
+- All related services, routes, and configmaps
+
+**Storage (`namespace` and `all` levels only):**
+
+- PVCs for models and cache
+
+### Manual Cleanup
+
+If you prefer manual cleanup:
+
+```bash
+# Delete entire namespace (removes everything)
+oc delete namespace vllm-semantic-router-system
+
+# Or delete specific components
+oc delete deployment,service,route,configmap,buildconfig,imagestream --all -n vllm-semantic-router-system
 ```
 
 ## Troubleshooting
 
@@ -61,8 +61,9 @@ OPTIONS:
     -h, --help               Show this help message
 
 CLEANUP LEVELS:
-    deployment    - Remove deployment, services, routes, configmap (keep namespace and PVC)
-    namespace     - Remove entire namespace and all resources (default)
+    deployment    - Remove deployments, services, routes, configmaps, buildconfigs (keep namespace and PVCs)
+                    Includes: semantic-router, vLLM models, dashboard, OpenWebUI, Grafana, Prometheus
+    namespace     - Remove entire namespace and all resources including PVCs (default)
     all           - Remove namespace and any cluster-wide resources
 
 EXAMPLES:
@@ -254,6 +255,18 @@ show_current_resources() {
     echo "=== ConfigMaps ==="
     oc get configmaps -n "$NAMESPACE" 2>/dev/null || echo "No configmaps found"
 
+    echo ""
+    echo "=== BuildConfigs ==="
+    oc get buildconfig -n "$NAMESPACE" 2>/dev/null || echo "No buildconfigs found"
+
+    echo ""
+    echo "=== ImageStreams ==="
+    oc get imagestream -n "$NAMESPACE" 2>/dev/null || echo "No imagestreams found"
+
+    echo ""
+    echo "=== Deployments ==="
+    oc get deployments -n "$NAMESPACE" 2>/dev/null || echo "No deployments found"
+
     echo ""
 }
 
@@ -270,10 +283,12 @@ confirm_cleanup() {
 
     case "$CLEANUP_LEVEL" in
         "deployment")
-            log "WARN" "Will delete: deployment, services, routes, configmaps (keeping namespace and PVCs)"
+            log "WARN" "Will delete: deployments, services, routes, configmaps, buildconfigs (keeping namespace and PVCs)"
+            log "WARN" "Components: semantic-router, vLLM models, dashboard, OpenWebUI, Grafana, Prometheus"
             ;;
         "namespace")
             log "WARN" "Will delete: entire namespace and all resources including PVCs"
+            log "WARN" "This removes ALL components: core + observability stack"
             ;;
         "all")
             log "WARN" "Will delete: namespace and any cluster-wide resources"
@@ -304,13 +319,43 @@ cleanup_deployment() {
 
     # Delete specific resources but keep namespace and PVCs
     local resources=(
+        # Core semantic-router resources
         "deployment/semantic-router"
+        "deployment/vllm-model-a"
+        "deployment/vllm-model-b"
         "service/semantic-router"
         "service/semantic-router-metrics"
+        "service/vllm-model-a"
+        "service/vllm-model-b"
         "route/semantic-router-api"
         "route/semantic-router-grpc"
         "route/semantic-router-metrics"
+        "route/envoy-http"
+        "route/envoy-admin"
         "configmap/semantic-router-config"
+        "configmap/envoy-config"
+        "buildconfig/llm-katan"
+        "imagestream/llm-katan"
+        "imagestream/python"
+
+        # Observability resources
+        "deployment/dashboard"
+        "deployment/openwebui"
+        "deployment/grafana"
+        "deployment/prometheus"
+        "service/dashboard"
+        "service/openwebui"
+        "service/grafana"
+        "service/prometheus"
+        "route/dashboard"
+        "route/openwebui"
+        "route/grafana"
+        "route/prometheus"
+        "configmap/dashboard-config"
+        "configmap/grafana-config"
+        "configmap/prometheus-config"
+        "buildconfig/dashboard-custom"
+        "imagestream/dashboard-custom"
     )
 
     for resource in "${resources[@]}"; do
 
@@ -32,11 +32,11 @@ prompt_guard:
 # This makes deployment portable across different OpenShift clusters
 vllm_endpoints:
   - name: "model-a-endpoint"
-    address: "172.30.64.134"  # PLACEHOLDER - will be replaced with actual ClusterIP
+    address: "DYNAMIC_MODEL_A_IP"  # model-a-ip - will be replaced with actual ClusterIP
     port: 8000
     weight: 1
   - name: "model-b-endpoint"
-    address: "172.30.116.177"  # PLACEHOLDER - will be replaced with actual ClusterIP
+    address: "DYNAMIC_MODEL_B_IP"  # model-b-ip - will be replaced with actual ClusterIP
     port: 8001
     weight: 1
 
@@ -59,7 +59,7 @@ classifier:
   category_model:
     model_id: "models/category_classifier_modernbert-base_model"
     use_modernbert: true
-    threshold: 0.6
+    threshold: 0.35  # Lowered from 0.6 to handle queries like "what is physics?" (confidence 0.3581)
     use_cpu: true
     category_mapping_path: "models/category_classifier_modernbert-base_model/category_mapping.json"
   pii_model: