vllm-project
diff --git a/‎.github/workflows/integration-test-dynamic-config.yml‎
Lines changed: 156 additions & 0 deletions b/‎.github/workflows/integration-test-dynamic-config.yml‎
Lines changed: 156 additions & 0 deletions
diff --git a/‎deploy/helm/semantic-router/templates/clusterrole.yaml‎
Lines changed: 40 additions & 0 deletions b/‎deploy/helm/semantic-router/templates/clusterrole.yaml‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎deploy/helm/semantic-router/templates/clusterrolebinding.yaml‎
Lines changed: 17 additions & 0 deletions b/‎deploy/helm/semantic-router/templates/clusterrolebinding.yaml‎
Lines changed: 17 additions & 0 deletions
diff --git a/‎deploy/helm/semantic-router/values.yaml‎
Lines changed: 5 additions & 0 deletions b/‎deploy/helm/semantic-router/values.yaml‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎e2e/cmd/e2e/main.go‎
Lines changed: 3 additions & 0 deletions b/‎e2e/cmd/e2e/main.go‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎e2e/profiles/dynamic-config/crds/intelligentpool.yaml‎
Lines changed: 26 additions & 0 deletions b/‎e2e/profiles/dynamic-config/crds/intelligentpool.yaml‎
Lines changed: 26 additions & 0 deletions
@@ -0,0 +1,156 @@
+# Runs the "dynamic-config" end-to-end profile for pull requests and pushes
+# that target main, and on manual dispatch.
+name: Integration Test [Dynamic Config]
+
+on:
+  pull_request:
+    branches:
+      - main
+  push:
+    branches:
+      - main
+  workflow_dispatch:  # Allow manual triggering
+
+# Least privilege: the job only checks out the repository, so the workflow
+# token is limited to read access on repository contents.
+permissions:
+  contents: read
+
+jobs:
+  integration-test:
+    runs-on: ubuntu-latest
+    # Upper bound for the whole job (tool installs, build, and test run).
+    timeout-minutes: 60
+
+    steps:
+      # Fetch the repository sources used by the later make targets.
+      - name: Check out the repo
+        uses: actions/checkout@v4
+
+      - name: Set up Go
+        uses: actions/setup-go@v5
+        with:
+          # Quoted so the version stays a string rather than a YAML float.
+          go-version: '1.24'
+
+      - name: Set up Rust
+        uses: actions-rust-lang/setup-rust-toolchain@v1
+        with:
+          # Must be quoted: a bare 1.90 is parsed as the float 1.9, which
+          # would request a different toolchain than intended.
+          toolchain: '1.90'
+
+      - name: Install system dependencies
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y \
+            make \
+            curl \
+            build-essential \
+            pkg-config
+
+      # Every download below uses --fail (-f) so an HTTP error aborts the step
+      # instead of saving an error page that is then installed as a binary.
+      - name: Install Kind
+        run: |
+          curl -fLo ./kind https://kind.sigs.k8s.io/dl/v0.22.0/kind-linux-amd64
+          chmod +x ./kind
+          sudo mv ./kind /usr/local/bin/kind
+
+      - name: Install kubectl
+        run: |
+          # Resolves the current stable release at run time, then downloads it.
+          curl -fLO "https://dl.k8s.io/release/$(curl -fsSL https://dl.k8s.io/release/stable.txt)/bin/linux/amd64/kubectl"
+          chmod +x kubectl
+          sudo mv kubectl /usr/local/bin/kubectl
+
+      - name: Install Helm
+        run: |
+          # pipefail makes a failed download fail the step; without it only
+          # the exit status of bash (the last pipeline stage) is considered.
+          set -o pipefail
+          curl -fsSL https://raw.githubusercontent.com/helm/helm/main/scripts/get-helm-3 | bash
+
+      # Pre-fetch the Go modules of the e2e module.
+      - name: Download E2E test dependencies
+        working-directory: e2e
+        run: go mod download
+
+      - name: Build E2E test binary
+        run: make build-e2e
+
+      # Runs the dynamic-config profile, publishes the make exit status as the
+      # step output `test_exit_code`, then exits with that same status.
+      - name: Run Dynamic Config E2E tests
+        id: e2e-test
+        run: |
+          set +e  # Keep going after a failure so the status can be recorded
+          status=0
+          make e2e-test E2E_PROFILE=dynamic-config E2E_VERBOSE=true E2E_KEEP_CLUSTER=false || status=$?
+          echo "test_exit_code=${status}" >> "$GITHUB_OUTPUT"
+          exit "${status}"
+
+      # Publish the report files and router logs as a workflow artifact.
+      # `always()` keeps this step running even when an earlier step failed.
+      - name: Upload test reports
+        uses: actions/upload-artifact@v4
+        if: always()
+        with:
+          retention-days: 30
+          name: test-reports-dynamic-config
+          path: |
+            test-report.json
+            test-report.md
+            semantic-router-logs.txt
+
+      # Builds the job summary page from test-report.md, optionally followed by
+      # the first 500 lines of the router logs and a static resources section.
+      # `always()` keeps this step running even when an earlier step failed.
+      - name: Create test summary from report
+        if: always()
+        run: |
+          if [ -f "test-report.md" ]; then
+            echo "=== Reading test report from test-report.md ==="
+            cat test-report.md >> "$GITHUB_STEP_SUMMARY"
+
+            # Add semantic-router logs section if available
+            if [ -f "semantic-router-logs.txt" ]; then
+              # Heredoc bodies and their EOF terminators sit at the base
+              # indentation of this script so they start in column 0 once
+              # YAML strips the block scalar's common indent.
+              cat >> "$GITHUB_STEP_SUMMARY" << 'EOF'
+
+          ---
+
+          ### 📝 Semantic Router Logs
+
+          <details>
+          <summary>Click to view semantic-router logs</summary>
+
+          ```
+          EOF
+              # Add first 500 lines of logs to summary (to avoid exceeding GitHub limits)
+              head -n 500 semantic-router-logs.txt >> "$GITHUB_STEP_SUMMARY"
+
+              # Check if there are more lines
+              TOTAL_LINES=$(wc -l < semantic-router-logs.txt)
+              if [ "$TOTAL_LINES" -gt 500 ]; then
+                # Unquoted delimiter: $TOTAL_LINES must be expanded here.
+                cat >> "$GITHUB_STEP_SUMMARY" << EOF
+
+          ... (showing first 500 lines of $TOTAL_LINES total lines)
+
+          📦 Full logs are available in the workflow artifacts: semantic-router-logs.txt
+          EOF
+              fi
+
+              cat >> "$GITHUB_STEP_SUMMARY" << 'EOF'
+          ```
+
+          </details>
+          EOF
+            fi
+
+            # Add additional context
+            # Quoted delimiter: the shell leaves the text (including the
+            # backticks) untouched; the github.* expressions are substituted
+            # by the workflow runner before the script starts.
+            cat >> "$GITHUB_STEP_SUMMARY" << 'EOF'
+
+          ---
+
+          ### 📚 Additional Resources
+
+          - **Trigger:** ${{ github.event_name }}
+          - **Branch:** `${{ github.ref_name }}`
+          - **Commit:** `${{ github.sha }}`
+          - **Workflow Run:** [${{ github.run_id }}](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }})
+          - [E2E Test Framework Documentation](https://github.com/${{ github.repository }}/tree/main/e2e)
+          - [Dynamic Config Profile](https://github.com/${{ github.repository }}/tree/main/e2e/profiles/dynamic-config)
+
+          ### 📦 Artifacts
+
+          - **test-report.json** - Detailed test results in JSON format
+          - **test-report.md** - Human-readable test report
+          - **semantic-router-logs.txt** - Complete semantic-router pod logs
+          - All artifacts are retained for 30 days
+
+          ### 🔧 Dynamic Config Profile
+
+          This test validates the Kubernetes CRD-based dynamic configuration feature:
+          - IntelligentPool CRD for model configuration
+          - IntelligentRoute CRD for routing decisions
+          - Controller-runtime based reconciliation
+          - Automatic configuration updates on CRD changes
+          EOF
+          else
+            echo "⚠️ Test report file not found!" >> "$GITHUB_STEP_SUMMARY"
+          fi
+
@@ -0,0 +1,40 @@
+{{- if .Values.rbac.create -}}
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRole
+metadata:
+  name: {{ include "semantic-router.fullname" . }}
+  labels:
+    {{- include "semantic-router.labels" . | nindent 4 }}
+# All rules are read-only and scoped to the vllm.ai API group.
+rules:
+  # IntelligentPool: read and watch the resources; read their status.
+  - apiGroups: ["vllm.ai"]
+    resources: ["intelligentpools"]
+    verbs: ["get", "list", "watch"]
+  - apiGroups: ["vllm.ai"]
+    resources: ["intelligentpools/status"]
+    verbs: ["get"]
+  # IntelligentRoute: read and watch the resources; read their status.
+  - apiGroups: ["vllm.ai"]
+    resources: ["intelligentroutes"]
+    verbs: ["get", "list", "watch"]
+  - apiGroups: ["vllm.ai"]
+    resources: ["intelligentroutes/status"]
+    verbs: ["get"]
+{{- end }}
+
@@ -0,0 +1,17 @@
+{{- if .Values.rbac.create -}}
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: {{ include "semantic-router.fullname" . }}
+  labels:
+    {{- include "semantic-router.labels" . | nindent 4 }}
+# Who receives the permissions: the service account named by the chart helper.
+subjects:
+  - kind: ServiceAccount
+    name: {{ include "semantic-router.serviceAccountName" . }}
+    namespace: {{ include "semantic-router.namespace" . }}
+# What is granted: the ClusterRole carrying the same fullname as this binding.
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: {{ include "semantic-router.fullname" . }}
+{{- end }}
+
@@ -42,6 +42,11 @@ serviceAccount:
   # -- The name of the service account to use
   name: ""
 
+# RBAC configuration
+# The ClusterRole and ClusterRoleBinding templates are rendered only when
+# rbac.create is true. The ClusterRole grants get/list/watch on the vllm.ai
+# intelligentpools and intelligentroutes resources (plus get on their status),
+# and the binding attaches it to the chart's service account.
+rbac:
+  # -- Create RBAC resources (ClusterRole and ClusterRoleBinding)
+  create: true
+
 # Pod annotations
 podAnnotations: {}
 
 
@@ -10,6 +10,7 @@ import (
 	"github.com/vllm-project/semantic-router/e2e/pkg/banner"
 	"github.com/vllm-project/semantic-router/e2e/pkg/framework"
 	aigateway "github.com/vllm-project/semantic-router/e2e/profiles/ai-gateway"
+	dynamicconfig "github.com/vllm-project/semantic-router/e2e/profiles/dynamic-config"
 
 	// Import profiles to register test cases
 	_ "github.com/vllm-project/semantic-router/e2e/profiles/ai-gateway"
@@ -96,6 +97,8 @@ func getProfile(name string) (framework.Profile, error) {
 	switch name {
 	case "ai-gateway":
 		return aigateway.NewProfile(), nil
+	case "dynamic-config":
+		return dynamicconfig.NewProfile(), nil
 	// Add more profiles here as they are implemented
 	// case "istio":
 	//     return istio.NewProfile(), nil
 
@@ -0,0 +1,26 @@
+# IntelligentPool fixture for the dynamic-config e2e profile: one base model
+# with six named LoRA adapters.
+apiVersion: vllm.ai/v1alpha1
+kind: IntelligentPool
+metadata:
+  name: ai-gateway-pool
+  namespace: default
+spec:
+  # Must match the name of an entry under `models`.
+  defaultModel: 'base-model'
+  models:
+    - name: 'base-model'
+      reasoningFamily: 'qwen3'
+      piiPolicy:
+        allowByDefault: false
+      # Descriptions stay quoted because they contain ": ".
+      loras:
+        - name: 'science-expert'
+          description: 'Specialized for science domains: biology, chemistry, physics, health, engineering'
+        - name: 'social-expert'
+          description: 'Optimized for social sciences: business, economics'
+        - name: 'math-expert'
+          description: 'Fine-tuned for mathematics and quantitative reasoning'
+        - name: 'law-expert'
+          description: 'Specialized for legal questions and law-related topics'
+        - name: 'humanities-expert'
+          description: 'Optimized for humanities: psychology, history, philosophy'
+        - name: 'general-expert'
+          description: 'General-purpose adapter for diverse topics'
+