From 1503c375706843d3d17fb21a032554998c71fc63 Mon Sep 17 00:00:00 2001 From: JaredforReal Date: Wed, 15 Oct 2025 11:06:42 +0800 Subject: [PATCH 1/7] add tracing to docker compose Signed-off-by: JaredforReal --- config/config.tracing.yaml | 104 ++++++++++++++++++ config/config.yaml | 36 +++--- deploy/docker-compose/README.md | 16 ++- .../addons/grafana-datasource-jaeger.yaml | 15 +++ deploy/docker-compose/docker-compose.yml | 16 +++ tools/tracing/README.md | 12 +- .../observability/tracing-quickstart.md | 55 +++++++++ 7 files changed, 230 insertions(+), 24 deletions(-) create mode 100644 config/config.tracing.yaml create mode 100644 deploy/docker-compose/addons/grafana-datasource-jaeger.yaml create mode 100644 website/docs/tutorials/observability/tracing-quickstart.md diff --git a/config/config.tracing.yaml b/config/config.tracing.yaml new file mode 100644 index 00000000..8d9ea682 --- /dev/null +++ b/config/config.tracing.yaml @@ -0,0 +1,104 @@ +# Local Tracing Configuration (Jaeger + Always-On Sampling) +# This config is used by tools/tracing/docker-compose.tracing.yaml via CONFIG_FILE. 
+ +bert_model: + model_id: sentence-transformers/all-MiniLM-L12-v2 + threshold: 0.6 + use_cpu: true + +semantic_cache: + enabled: true + backend_type: "memory" + similarity_threshold: 0.8 + max_entries: 1000 + ttl_seconds: 3600 + eviction_policy: "fifo" + +tools: + enabled: true + top_k: 3 + similarity_threshold: 0.2 + tools_db_path: "config/tools_db.json" + fallback_to_empty: true + +prompt_guard: + enabled: true + use_modernbert: true + model_id: "models/jailbreak_classifier_modernbert-base_model" + threshold: 0.7 + use_cpu: true + jailbreak_mapping_path: "models/jailbreak_classifier_modernbert-base_model/jailbreak_type_mapping.json" + +vllm_endpoints: + - name: "endpoint1" + address: "127.0.0.1" + port: 8000 + weight: 1 + +model_config: + "openai/gpt-oss-20b": + reasoning_family: "gpt-oss" + preferred_endpoints: ["endpoint1"] + pii_policy: + allow_by_default: true + +classifier: + category_model: + model_id: "models/category_classifier_modernbert-base_model" + use_modernbert: true + threshold: 0.6 + use_cpu: true + category_mapping_path: "models/category_classifier_modernbert-base_model/category_mapping.json" + pii_model: + model_id: "models/pii_classifier_modernbert-base_presidio_token_model" + use_modernbert: true + threshold: 0.7 + use_cpu: true + pii_mapping_path: "models/pii_classifier_modernbert-base_presidio_token_model/pii_type_mapping.json" + +categories: + - name: math + system_prompt: "You are a mathematics expert. Provide step-by-step solutions." + model_scores: + - model: openai/gpt-oss-20b + score: 1.0 + use_reasoning: true + - name: other + system_prompt: "You are a helpful assistant." 
+ model_scores: + - model: openai/gpt-oss-20b + score: 0.7 + use_reasoning: false + +default_model: openai/gpt-oss-20b + +reasoning_families: + gpt-oss: + type: "reasoning_effort" + parameter: "reasoning_effort" + +default_reasoning_effort: high + +api: + batch_classification: + max_batch_size: 100 + concurrency_threshold: 5 + max_concurrency: 8 + metrics: + enabled: true + +observability: + tracing: + enabled: true + provider: "opentelemetry" + exporter: + type: "otlp" + endpoint: "jaeger:4317" # Jaeger gRPC OTLP endpoint inside compose network + insecure: true + sampling: + type: "always_on" # Always sample in local/dev for easy debugging + rate: 1.0 + resource: + service_name: "vllm-semantic-router" + service_version: "dev" + deployment_environment: "local" diff --git a/config/config.yaml b/config/config.yaml index 579b9e35..23b6f067 100644 --- a/config/config.yaml +++ b/config/config.yaml @@ -5,11 +5,11 @@ bert_model: semantic_cache: enabled: true - backend_type: "memory" # Options: "memory" or "milvus" + backend_type: "memory" # Options: "memory" or "milvus" similarity_threshold: 0.8 - max_entries: 1000 # Only applies to memory backend + max_entries: 1000 # Only applies to memory backend ttl_seconds: 3600 - eviction_policy: "fifo" + eviction_policy: "fifo" tools: enabled: true @@ -32,13 +32,13 @@ prompt_guard: # NOT supported: domain names (example.com), protocol prefixes (http://), paths (/api), ports in address (use 'port' field) vllm_endpoints: - name: "endpoint1" - address: "127.0.0.1" # IPv4 address - REQUIRED format + address: "127.0.0.1" # IPv4 address - REQUIRED format port: 8000 weight: 1 model_config: "openai/gpt-oss-20b": - reasoning_family: "gpt-oss" # This model uses GPT-OSS reasoning syntax + reasoning_family: "gpt-oss" # This model uses GPT-OSS reasoning syntax preferred_endpoints: ["endpoint1"] pii_policy: allow_by_default: true @@ -65,7 +65,7 @@ categories: model_scores: - model: openai/gpt-oss-20b score: 0.7 - use_reasoning: false # Business 
performs better without reasoning + use_reasoning: false # Business performs better without reasoning - name: law system_prompt: "You are a knowledgeable legal expert with comprehensive understanding of legal principles, case law, statutory interpretation, and legal procedures across multiple jurisdictions. Provide accurate legal information and analysis while clearly stating that your responses are for informational purposes only and do not constitute legal advice. Always recommend consulting with qualified legal professionals for specific legal matters." model_scores: @@ -89,7 +89,7 @@ categories: model_scores: - model: openai/gpt-oss-20b score: 0.6 - use_reasoning: true # Enable reasoning for complex chemistry + use_reasoning: true # Enable reasoning for complex chemistry - name: history system_prompt: "You are a historian with expertise across different time periods and cultures. Provide accurate historical context and analysis." model_scores: @@ -119,13 +119,13 @@ categories: model_scores: - model: openai/gpt-oss-20b score: 1.0 - use_reasoning: true # Enable reasoning for complex math + use_reasoning: true # Enable reasoning for complex math - name: physics system_prompt: "You are a physics expert with deep understanding of physical laws and phenomena. Provide clear explanations with mathematical derivations when appropriate." model_scores: - model: openai/gpt-oss-20b score: 0.7 - use_reasoning: true # Enable reasoning for physics + use_reasoning: true # Enable reasoning for physics - name: computer science system_prompt: "You are a computer science expert with knowledge of algorithms, data structures, programming languages, and software engineering. Provide clear, practical solutions with code examples when helpful." 
model_scores: @@ -178,23 +178,23 @@ api: detailed_goroutine_tracking: true high_resolution_timing: false sample_rate: 1.0 - duration_buckets: [0.001, 0.005, 0.01, 0.025, 0.05, 0.1, 0.25, 0.5, 1, 2.5, 5, 10, 30] + duration_buckets: + [0.001, 0.005, 0.01, 0.025, 0.05, 0.1, 0.25, 0.5, 1, 2.5, 5, 10, 30] size_buckets: [1, 2, 5, 10, 20, 50, 100, 200] # Observability Configuration observability: tracing: - enabled: false # Enable distributed tracing (default: false) - provider: "opentelemetry" # Provider: opentelemetry, openinference, openllmetry + enabled: true # Enable distributed tracing for docker-compose stack + provider: "opentelemetry" # Provider: opentelemetry, openinference, openllmetry exporter: - type: "stdout" # Exporter: otlp, jaeger, zipkin, stdout - endpoint: "localhost:4317" # OTLP endpoint (when type: otlp) - insecure: true # Use insecure connection (no TLS) + type: "otlp" # Export spans to Jaeger (via OTLP gRPC) + endpoint: "jaeger:4317" # Jaeger collector inside compose network + insecure: true # Use insecure connection (no TLS) sampling: - type: "always_on" # Sampling: always_on, always_off, probabilistic - rate: 1.0 # Sampling rate for probabilistic (0.0-1.0) + type: "always_on" # Sampling: always_on, always_off, probabilistic + rate: 1.0 # Sampling rate for probabilistic (0.0-1.0) resource: service_name: "vllm-semantic-router" service_version: "v0.1.0" deployment_environment: "development" - diff --git a/deploy/docker-compose/README.md b/deploy/docker-compose/README.md index 3a200167..692c857f 100644 --- a/deploy/docker-compose/README.md +++ b/deploy/docker-compose/README.md @@ -1,8 +1,9 @@ # Main Runtime Compose Stack -This directory contains the primary `docker-compose.yml` used to run the semantic-router stack (router + envoy + optional mock-vllm + observability). 
+This directory contains the primary `docker-compose.yml` used to run the semantic-router stack (router + envoy + optional mock-vllm + observability: Prometheus/Grafana + Jaeger tracing). ## Path Layout + Because this file lives under `deploy/docker-compose/`, all relative paths to repository resources go two levels up (../../) back to repo root. Example mappings: @@ -30,6 +31,7 @@ docker compose -f deploy/docker-compose/docker-compose.yml down ``` ## Overrides + You can place a `docker-compose.override.yml` at repo root and combine: ```bash @@ -39,4 +41,14 @@ docker compose -f deploy/docker-compose/docker-compose.yml -f docker-compose.ove ## Related Stacks - Local observability only: `tools/observability/docker-compose.obs.yml` -- Tracing stack: `tools/tracing/docker-compose.tracing.yaml` +- Tracing stack (standalone, dev): `tools/tracing/docker-compose.tracing.yaml` + +## Tracing & Grafana + +- Jaeger UI: http://localhost:16686 +- Grafana: http://localhost:3000 (admin/admin) + - Prometheus datasource (default) for metrics + - Jaeger datasource for exploring traces (search service `vllm-semantic-router`) + +By default, the router container uses `config/config.yaml`, which has tracing enabled (exporter to Jaeger). +Override `CONFIG_FILE` to point at a config with tracing disabled if you don’t want tracing. 
diff --git a/deploy/docker-compose/addons/grafana-datasource-jaeger.yaml b/deploy/docker-compose/addons/grafana-datasource-jaeger.yaml new file mode 100644 index 00000000..85f5165e --- /dev/null +++ b/deploy/docker-compose/addons/grafana-datasource-jaeger.yaml @@ -0,0 +1,15 @@ +# Grafana datasource configuration for Jaeger/Tempo tracing +# Provisioned automatically when Grafana starts + +apiVersion: 1 + +datasources: + - name: Jaeger + type: jaeger + access: proxy + url: http://jaeger:16686 + isDefault: false + editable: true + jsonData: + nodeGraph: + enabled: true diff --git a/deploy/docker-compose/docker-compose.yml b/deploy/docker-compose/docker-compose.yml index 98fdb70d..29adf564 100644 --- a/deploy/docker-compose/docker-compose.yml +++ b/deploy/docker-compose/docker-compose.yml @@ -1,4 +1,15 @@ services: + # Jaeger for distributed tracing (OTLP gRPC + UI) + jaeger: + image: jaegertracing/all-in-one:latest + container_name: jaeger + environment: + - COLLECTOR_OTLP_ENABLED=true + ports: + - "4317:4317" # OTLP gRPC + - "16686:16686" # Web UI + networks: + - semantic-network # Semantic Router External Processor Service semantic-router: @@ -11,7 +22,11 @@ services: - ../../models:/app/models:ro environment: - LD_LIBRARY_PATH=/app/lib + # Use main config by default; override via CONFIG_FILE if needed - CONFIG_FILE=${CONFIG_FILE:-/app/config/config.yaml} + # Optional informational envs (router reads YAML for tracing config) + - OTEL_EXPORTER_OTLP_ENDPOINT=http://jaeger:4317 + - OTEL_SERVICE_NAME=vllm-semantic-router networks: - semantic-network healthcheck: @@ -89,6 +104,7 @@ services: volumes: - ./addons/grafana.ini:/etc/grafana/grafana.ini:ro - ./addons/grafana-datasource.yaml:/etc/grafana/provisioning/datasources/datasource.yaml:ro + - ./addons/grafana-datasource-jaeger.yaml:/etc/grafana/provisioning/datasources/datasource_jaeger.yaml:ro - ./addons/grafana-dashboard.yaml:/etc/grafana/provisioning/dashboards/dashboard.yaml:ro - 
./addons/llm-router-dashboard.json:/etc/grafana/provisioning/dashboards/llm-router-dashboard.json:ro - grafana-data:/var/lib/grafana diff --git a/tools/tracing/README.md b/tools/tracing/README.md index 366853b4..b4594b26 100644 --- a/tools/tracing/README.md +++ b/tools/tracing/README.md @@ -3,6 +3,7 @@ This directory provides a local Jaeger + tracing-enabled semantic-router stack for development, debugging, and demonstration. ## Why here? + `tools/tracing` groups this with other local-only utilities (see `tools/observability` for metrics stack). Production deployments should rely on manifests in `deploy/kubernetes` / `openshift` instead of this all-in-one compose. ## Quick Start @@ -31,7 +32,7 @@ curl -X POST http://localhost:8081/v1/chat/completions \ ## View Traces 1. Open Jaeger UI -2. Select service: `vllm-semantic-router` (or `semantic-router` depending on OTEL resource config) +2. Select service: `vllm-semantic-router` (set via resource.service_name in config/config.tracing.yaml) 3. Click "Find Traces" ## Stopping @@ -48,12 +49,15 @@ docker compose -f tools/tracing/docker-compose.tracing.yaml down -v ## Environment Variables -| Variable | Purpose | -|----------|---------| +| Variable | Purpose | +| --------------------------- | ------------------------------- | | OTEL_EXPORTER_OTLP_ENDPOINT | Where spans are exported (gRPC) | -| OTEL_SERVICE_NAME | Logical service name in traces | +| OTEL_SERVICE_NAME | Logical service name in traces | + +Note: the router reads tracing settings from the YAML config (`observability.tracing.*`). The `OTEL_*` env vars here are only informational and do not override the YAML. To change exporter endpoint or service name, edit `config/config.tracing.yaml`. 
## Relationship with Metrics Stack + If you also want Prometheus/Grafana metrics: ```bash diff --git a/website/docs/tutorials/observability/tracing-quickstart.md b/website/docs/tutorials/observability/tracing-quickstart.md new file mode 100644 index 00000000..1ab5cccd --- /dev/null +++ b/website/docs/tutorials/observability/tracing-quickstart.md @@ -0,0 +1,55 @@ +# Tracing Quickstart + +This guide helps you spin up a local tracing stack and see your first traces in a minute. + +## Prerequisites + +- Docker and Docker Compose + +## Start the local tracing stack + +The repo includes a compose file that starts Jaeger and a tracing-enabled Semantic Router instance. + +- The router uses `config/config.tracing.yaml` which has tracing enabled and the exporter pointed at Jaeger. + +Run: + +```bash +# from repo root +docker compose -f tools/tracing/docker-compose.tracing.yaml up -d +``` + +## Send a test request + +```bash +curl -X POST http://localhost:8081/v1/chat/completions \ + -H "Content-Type: application/json" \ + -d '{ + "model": "auto", + "messages": [{"role": "user", "content": "What is 2+2?"}] + }' +``` + +## View traces + +1. Open Jaeger UI: http://localhost:16686 +2. Choose service: `vllm-semantic-router` +3. Find traces → click one to inspect spans + +You should see spans like: + +- `semantic_router.request.received` +- `semantic_router.classification` +- `semantic_router.cache.lookup` +- `semantic_router.routing.decision` +- `semantic_router.backend.selection` + +## Customize + +- Change service name or sampling in `config/config.tracing.yaml` under `observability.tracing`. +- To export to another backend (e.g., Tempo), set `exporter.endpoint` and `insecure` accordingly. + +## Troubleshooting + +- No traces? Confirm tracing is enabled in the YAML and Jaeger is reachable at `jaeger:4317` inside the compose network. +- Empty service list in Jaeger? Make one request to generate spans, then refresh. 
From 3c310c5afb7ee2cd987d52df82cc1fe8ffd32d89 Mon Sep 17 00:00:00 2001 From: JaredforReal Date: Wed, 15 Oct 2025 13:37:52 +0800 Subject: [PATCH 2/7] make: ensure docker-compose-down stops profiled services; add down-core and down-llm-katan targets Signed-off-by: JaredforReal --- tools/make/docker.mk | 22 ++++++++++++++++++++-- 1 file changed, 20 insertions(+), 2 deletions(-) diff --git a/tools/make/docker.mk b/tools/make/docker.mk index 975d91f4..ba2e3503 100644 --- a/tools/make/docker.mk +++ b/tools/make/docker.mk @@ -130,9 +130,25 @@ docker-compose-rebuild-llm-katan: docker-compose-up-llm-katan docker-compose-down: @$(LOG_TARGET) - @echo "Stopping docker-compose services..." + @echo "Stopping all docker-compose services (including profiled) and removing orphans..." + # Stop profiled services explicitly (if they were started) + @docker compose --profile llm-katan down --remove-orphans || true + @docker compose --profile testing down --remove-orphans || true + # Finally stop the base stack + @docker compose down --remove-orphans + +# Stop only core services (leave profiled services like llm-katan/testing running) +docker-compose-down-core: + @$(LOG_TARGET) + @echo "Stopping core services only (no profiles; keeps llm-katan/testing if running)..." @docker compose down +# Stop only llm-katan profiled services +docker-compose-down-llm-katan: + @$(LOG_TARGET) + @echo "Stopping llm-katan profiled services..." 
+ @docker compose --profile llm-katan down + # Help target for Docker commands docker-help: @echo "Docker Make Targets:" @@ -152,7 +168,9 @@ docker-help: @echo " docker-compose-rebuild - Force rebuild then start" @echo " docker-compose-rebuild-testing - Force rebuild (testing profile)" @echo " docker-compose-rebuild-llm-katan - Force rebuild (llm-katan profile)" - @echo " docker-compose-down - Stop docker-compose services" + @echo " docker-compose-down - Stop ALL services (base + profiled) and remove orphans" + @echo " docker-compose-down-core - Stop core services only (keeps profiled running)" + @echo " docker-compose-down-llm-katan - Stop only llm-katan profiled services" @echo "" @echo "Environment Variables:" @echo " DOCKER_REGISTRY - Docker registry (default: ghcr.io/vllm-project/semantic-router)" From 5b7357e99e6759d0e3510db9ab394d762b8b561f Mon Sep 17 00:00:00 2001 From: JaredforReal Date: Wed, 15 Oct 2025 18:43:11 +0800 Subject: [PATCH 3/7] add jaeger UI to dashboard Signed-off-by: JaredforReal --- dashboard/backend/main.go | 47 ++++++++++++ dashboard/frontend/src/App.tsx | 12 ++++ dashboard/frontend/src/components/Layout.tsx | 28 +++++--- dashboard/frontend/src/pages/TracingPage.tsx | 76 ++++++++++++++++++++ deploy/docker-compose/docker-compose.yml | 28 ++++---- tools/make/golang.mk | 34 ++++++++- 6 files changed, 201 insertions(+), 24 deletions(-) create mode 100644 dashboard/frontend/src/pages/TracingPage.tsx diff --git a/dashboard/backend/main.go b/dashboard/backend/main.go index 40abd391..72ded509 100644 --- a/dashboard/backend/main.go +++ b/dashboard/backend/main.go @@ -271,6 +271,7 @@ func main() { routerAPI := flag.String("router_api", env("TARGET_ROUTER_API_URL", "http://localhost:8080"), "Router API base URL") routerMetrics := flag.String("router_metrics", env("TARGET_ROUTER_METRICS_URL", "http://localhost:9190/metrics"), "Router metrics URL") openwebuiURL := flag.String("openwebui", env("TARGET_OPENWEBUI_URL", ""), "Open WebUI base URL") + 
jaegerURL := flag.String("jaeger", env("TARGET_JAEGER_URL", ""), "Jaeger base URL") flag.Parse() @@ -382,6 +383,31 @@ func main() { log.Printf("Warning: Prometheus URL not configured") } + // Jaeger proxy (optional) - expose full UI under /embedded/jaeger and its static assets under /static/ + if *jaegerURL != "" { + jp, err := newReverseProxy(*jaegerURL, "/embedded/jaeger", false) + if err != nil { + log.Fatalf("jaeger proxy error: %v", err) + } + // Jaeger UI (root UI under /embedded/jaeger) + mux.Handle("/embedded/jaeger", jp) + mux.Handle("/embedded/jaeger/", jp) + + // Jaeger static assets are typically served under /static/* from the same origin + // Provide a passthrough proxy without prefix stripping + jStatic, _ := newReverseProxy(*jaegerURL, "", false) + mux.Handle("/static/", jStatic) + + log.Printf("Jaeger proxy configured: %s; static assets proxied at /static/", *jaegerURL) + } else { + mux.HandleFunc("/embedded/jaeger/", func(w http.ResponseWriter, r *http.Request) { + w.Header().Set("Content-Type", "application/json") + w.WriteHeader(http.StatusServiceUnavailable) + w.Write([]byte(`{"error":"Jaeger not configured","message":"TARGET_JAEGER_URL environment variable is not set"}`)) + }) + log.Printf("Info: Jaeger URL not configured (optional)") + } + // Open WebUI proxy (optional) if *openwebuiURL != "" { op, err := newReverseProxy(*openwebuiURL, "/embedded/openwebui", true) @@ -400,6 +426,24 @@ func main() { log.Printf("Info: Open WebUI not configured (optional)") } + // Jaeger proxy (optional) + if *jaegerURL != "" { + jp, err := newReverseProxy(*jaegerURL, "/embedded/jaeger", false) + if err != nil { + log.Fatalf("jaeger proxy error: %v", err) + } + mux.Handle("/embedded/jaeger", jp) + mux.Handle("/embedded/jaeger/", jp) + log.Printf("Jaeger proxy configured: %s", *jaegerURL) + } else { + mux.HandleFunc("/embedded/jaeger/", func(w http.ResponseWriter, r *http.Request) { + w.Header().Set("Content-Type", "application/json") + 
w.WriteHeader(http.StatusServiceUnavailable) + w.Write([]byte(`{"error":"Jaeger not configured","message":"TARGET_JAEGER_URL environment variable is not set"}`)) + }) + log.Printf("Info: Jaeger URL not configured (optional)") + } + addr := ":" + *port log.Printf("Semantic Router Dashboard listening on %s", addr) log.Printf("Static dir: %s", *staticDir) @@ -409,6 +453,9 @@ func main() { if *promURL != "" { log.Printf("Prometheus: %s → /embedded/prometheus/", *promURL) } + if *jaegerURL != "" { + log.Printf("Jaeger: %s → /embedded/jaeger/", *jaegerURL) + } if *openwebuiURL != "" { log.Printf("OpenWebUI: %s → /embedded/openwebui/", *openwebuiURL) } diff --git a/dashboard/frontend/src/App.tsx b/dashboard/frontend/src/App.tsx index fb2a6c65..654b7d45 100644 --- a/dashboard/frontend/src/App.tsx +++ b/dashboard/frontend/src/App.tsx @@ -6,6 +6,7 @@ import MonitoringPage from './pages/MonitoringPage' import ConfigPage from './pages/ConfigPage' import PlaygroundPage from './pages/PlaygroundPage' import TopologyPage from './pages/TopologyPage' +import TracingPage from './pages/TracingPage' import { ConfigSection } from './components/ConfigNav' const App: React.FC = () => { @@ -117,6 +118,17 @@ const App: React.FC = () => { } /> + setConfigSection(section as ConfigSection)} + > + + + } + /> ) diff --git a/dashboard/frontend/src/components/Layout.tsx b/dashboard/frontend/src/components/Layout.tsx index 98cee2aa..9ecca8c0 100644 --- a/dashboard/frontend/src/components/Layout.tsx +++ b/dashboard/frontend/src/components/Layout.tsx @@ -55,14 +55,14 @@ const Layout: React.FC = ({ children, configSection, onConfigSectio {sidebarCollapsed ? ( // 折叠状态:箭头向右 - - + + ) : ( // 展开状态:箭头向左 - - + + )} @@ -98,12 +98,11 @@ const Layout: React.FC = ({ children, configSection, onConfigSectio ].map((section) => (