vllm-project
diff --git a/‎deploy/kubernetes/crds/examples/intelligentroute-example.yaml‎
Lines changed: 1 addition & 12 deletions b/‎deploy/kubernetes/crds/examples/intelligentroute-example.yaml‎
Lines changed: 1 addition & 12 deletions
diff --git a/‎src/semantic-router/pkg/k8s/converter_test.go‎
Lines changed: 33 additions & 6 deletions b/‎src/semantic-router/pkg/k8s/converter_test.go‎
Lines changed: 33 additions & 6 deletions
diff --git a/‎src/semantic-router/pkg/k8s/testdata/README.md‎
Lines changed: 165 additions & 0 deletions b/‎src/semantic-router/pkg/k8s/testdata/README.md‎
Lines changed: 165 additions & 0 deletions
diff --git a/‎src/semantic-router/pkg/k8s/testdata/input/01-basic.yaml‎
Lines changed: 79 additions & 0 deletions b/‎src/semantic-router/pkg/k8s/testdata/input/01-basic.yaml‎
Lines changed: 79 additions & 0 deletions
diff --git a/‎src/semantic-router/pkg/k8s/testdata/input/02-keyword-only.yaml‎
Lines changed: 61 additions & 0 deletions b/‎src/semantic-router/pkg/k8s/testdata/input/02-keyword-only.yaml‎
Lines changed: 61 additions & 0 deletions
@@ -38,20 +38,9 @@ spec:
 
     # Domain-based signals (MMLU domain categories)
     domains:
-      - "business"
-      - "law"
-      - "psychology"
-      - "biology"
-      - "chemistry"
-      - "history"
-      - "other"
-      - "health"
-      - "economics"
       - "math"
-      - "physics"
       - "computer_science"
-      - "philosophy"
-      - "engineering"
+      - "physics"
 
   # Decisions (priority used when multiple decisions match)
   decisions:
 
@@ -202,11 +202,20 @@ func TestConverterWithTestData(t *testing.T) {
 	testdataDir := "testdata"
 	inputDir := filepath.Join(testdataDir, "input")
 	outputDir := filepath.Join(testdataDir, "output")
+	baseConfigPath := filepath.Join(testdataDir, "base-config.yaml")
 
 	// Ensure output directory exists
 	err := os.MkdirAll(outputDir, 0755)
 	require.NoError(t, err, "Failed to create output directory")
 
+	// Load base config (static parts)
+	baseConfigData, err := os.ReadFile(baseConfigPath)
+	require.NoError(t, err, "Failed to read base config file: %s", baseConfigPath)
+
+	var baseConfig config.RouterConfig
+	err = yaml.Unmarshal(baseConfigData, &baseConfig)
+	require.NoError(t, err, "Failed to unmarshal base config")
+
 	// Read all input files
 	inputFiles, err := os.ReadDir(inputDir)
 	require.NoError(t, err, "Failed to read input directory")
@@ -240,12 +249,8 @@ func TestConverterWithTestData(t *testing.T) {
 			intelligentRouting, err := converter.ConvertIntelligentRoute(route)
 			require.NoError(t, err, "Failed to convert IntelligentRoute")
 
-			// Create output config
-			outputConfig := &config.RouterConfig{
-				ConfigSource:       config.ConfigSourceKubernetes,
-				BackendModels:      *backendModels,
-				IntelligentRouting: *intelligentRouting,
-			}
+			// Merge base config with CRD-derived config
+			outputConfig := mergeConfigs(&baseConfig, backendModels, intelligentRouting)
 
 			// Marshal to YAML
 			outputData, err := yaml.Marshal(outputConfig)
@@ -271,6 +276,28 @@ func TestConverterWithTestData(t *testing.T) {
 	}
 }
 
+// mergeConfigs returns a new RouterConfig: a shallow copy of baseConfig (the static
+// parts) with the config source, backend models and CRD-derived routing fields replaced.
+func mergeConfigs(baseConfig *config.RouterConfig, backendModels *config.BackendModels, intelligentRouting *config.IntelligentRouting) *config.RouterConfig {
+	result := new(config.RouterConfig)
+	*result = *baseConfig
+
+	// Values that always come from the Kubernetes side replace the base values outright.
+	result.ConfigSource = config.ConfigSourceKubernetes
+	result.BackendModels = *backendModels
+
+	// Copy routing fields individually rather than replacing the whole struct, so the
+	// base ReasoningConfig (ReasoningFamilies, DefaultReasoningEffort) is preserved.
+	routing := &result.IntelligentRouting
+	routing.Strategy = intelligentRouting.Strategy
+	routing.Decisions = intelligentRouting.Decisions
+	routing.Categories = intelligentRouting.Categories
+	routing.EmbeddingRules = intelligentRouting.EmbeddingRules
+	routing.KeywordRules = intelligentRouting.KeywordRules
+
+	return result
+}
+
 // parseInputYAML parses a multi-document YAML file containing IntelligentPool and IntelligentRoute
 func parseInputYAML(data []byte) (*v1alpha1.IntelligentPool, *v1alpha1.IntelligentRoute, error) {
 	decoder := k8syaml.NewYAMLOrJSONDecoder(strings.NewReader(string(data)), 4096)
 
@@ -0,0 +1,165 @@
+# Test Data for CRD Converter
+
+This directory contains test data for the Kubernetes CRD to RouterConfig converter.
+
+## Directory Structure
+
+```
+testdata/
+├── base-config.yaml          # Static base configuration (shared across all tests)
+├── input/                    # Input CRD YAML files (IntelligentPool + IntelligentRoute)
+│   ├── 01-basic.yaml
+│   ├── 02-keyword-only.yaml
+│   ├── ...
+│   └── 16-keyword-embedding-domain-no-plugin.yaml
+└── output/                   # Generated RouterConfig YAML files
+    ├── 01-basic.yaml
+    ├── 02-keyword-only.yaml
+    ├── ...
+    └── 16-keyword-embedding-domain-no-plugin.yaml
+```
+
+## Base Configuration
+
+`base-config.yaml` contains static configuration that doesn't come from CRDs:
+- Reasoning families (deepseek, qwen3, gpt)
+- Default reasoning effort level
+- BERT model configuration
+- Semantic cache settings
+- Tools configuration
+- Prompt guard settings
+- Classifier configuration
+- Router options
+- Embedding models paths
+- API configuration
+- Observability settings
+
+## Test Scenarios Overview
+
+| # | File | Keyword | Embedding | Domain | Plugin | Use Case |
+|---|------|---------|-----------|--------|--------|----------|
+| 1 | 01-basic.yaml | ✓ | ✓ | ✓ | ✓ | Basic comprehensive example |
+| 2 | 02-keyword-only.yaml | ✓ | ✗ | ✗ | ✗ | FAQ detection, greetings |
+| 3 | 03-embedding-only.yaml | ✗ | ✓ | ✗ | ✗ | Customer support, technical issues |
+| 4 | 04-domain-only.yaml | ✗ | ✗ | ✓ | ✗ | STEM queries, subject routing |
+| 5 | 05-keyword-embedding.yaml | ✓ | ✓ | ✗ | ✗ | Urgent support with semantics |
+| 6 | 06-keyword-domain.yaml | ✓ | ✗ | ✓ | ✗ | Academic homework assistance |
+| 7 | 07-domain-embedding.yaml | ✗ | ✓ | ✓ | ✗ | Research queries by domain |
+| 8 | 08-keyword-embedding-domain.yaml | ✓ | ✓ | ✓ | ✗ | Comprehensive tech support |
+| 9 | 09-keyword-plugin.yaml | ✓ | ✗ | ✗ | ✓ | FAQ with caching |
+| 10 | 10-embedding-plugin.yaml | ✗ | ✓ | ✗ | ✓ | PII-protected queries |
+| 11 | 11-domain-plugin.yaml | ✗ | ✗ | ✓ | ✓ | Legal advice with disclaimers |
+| 12 | 12-keyword-embedding-plugin.yaml | ✓ | ✓ | ✗ | ✓ | Security queries with protection |
+| 13 | 13-keyword-domain-plugin.yaml | ✓ | ✗ | ✓ | ✓ | Medical queries with PII |
+| 14 | 14-domain-embedding-plugin.yaml | ✗ | ✓ | ✓ | ✓ | Financial advice with protection |
+| 15 | 15-keyword-embedding-domain-plugin.yaml | ✓ | ✓ | ✓ | ✓ | Enterprise compliance (full) |
+| 16 | 16-keyword-embedding-domain-no-plugin.yaml | ✓ | ✓ | ✓ | ✗ | Educational tutorials |
+
+## Test Scenarios Details
+
+### Signal Type Combinations (No Plugins)
+
+1. **02-keyword-only.yaml** - Only keyword signals
+   - Use case: FAQ detection, greeting responses
+   - Signals: urgent, greeting keywords
+
+2. **03-embedding-only.yaml** - Only embedding signals
+   - Use case: Customer support, technical issue detection
+   - Signals: customer_support, technical_issue embeddings
+
+3. **04-domain-only.yaml** - Only domain signals
+   - Use case: STEM queries, subject-specific routing
+   - Signals: math, physics, computer_science, chemistry domains
+
+4. **05-keyword-embedding.yaml** - Keyword + Embedding
+   - Use case: Urgent support requests with semantic matching
+   - Signals: urgent keywords + support_request embeddings
+
+5. **06-keyword-domain.yaml** - Keyword + Domain
+   - Use case: Academic homework assistance
+   - Signals: homework keywords + math/physics/chemistry domains
+
+6. **07-domain-embedding.yaml** - Domain + Embedding
+   - Use case: Research queries in specific domains
+   - Signals: research_question embeddings + biology/chemistry/physics domains
+
+7. **08-keyword-embedding-domain.yaml** - All three signal types
+   - Use case: Comprehensive technical support routing
+   - Signals: urgent keywords + technical_help embeddings + CS/engineering/math domains
+
+### Signal Type Combinations (With Plugins)
+
+8. **09-keyword-plugin.yaml** - Keyword + Plugins
+   - Use case: FAQ with aggressive caching
+   - Plugins: semantic-cache, header_mutation
+
+9. **10-embedding-plugin.yaml** - Embedding + Plugins
+   - Use case: PII-protected sensitive data handling
+   - Plugins: pii (redaction), jailbreak protection
+
+10. **11-domain-plugin.yaml** - Domain + Plugins
+    - Use case: Legal advice with disclaimers
+    - Plugins: system_prompt, semantic-cache
+
+11. **12-keyword-embedding-plugin.yaml** - Keyword + Embedding + Plugins
+    - Use case: Security queries with protection
+    - Plugins: jailbreak, system_prompt, header_mutation
+
+12. **13-keyword-domain-plugin.yaml** - Keyword + Domain + Plugins
+    - Use case: Medical queries with PII protection
+    - Plugins: pii (hash mode), system_prompt, semantic-cache
+
+13. **14-domain-embedding-plugin.yaml** - Domain + Embedding + Plugins
+    - Use case: Financial advice with comprehensive protection
+    - Plugins: pii, system_prompt, jailbreak, semantic-cache
+
+14. **15-keyword-embedding-domain-plugin.yaml** - Keyword + Embedding + Domain + Plugins
+    - Use case: Enterprise compliance and legal queries with full protection
+    - Signals: compliance/confidential keywords + business_analysis/legal_review embeddings + business/law/economics domains
+    - Plugins: pii (hash/mask modes), jailbreak, system_prompt, semantic-cache, header_mutation
+    - Multiple decisions with different plugin configurations
+
+15. **16-keyword-embedding-domain-no-plugin.yaml** - All signals, no plugins
+    - Use case: Educational tutorials across multiple domains
+    - Signals: tutorial keywords + learning_intent embeddings + CS/math/engineering domains
+    - Multiple decisions with different priorities
+
+## Plugin Types Used
+
+- **semantic-cache**: Cache responses for similar queries
+- **pii**: Detect and redact/mask/hash PII entities
+- **jailbreak**: Detect and block jailbreak attempts
+- **system_prompt**: Inject custom system prompts
+- **header_mutation**: Add custom headers to requests
+
+## Running Tests
+
+```bash
+cd src/semantic-router
+go test ./pkg/k8s -v -run TestConverterWithTestData
+```
+
+This will:
+1. Load `base-config.yaml` as the static configuration base
+2. Parse each input YAML file (IntelligentPool + IntelligentRoute)
+3. Convert CRDs to RouterConfig format
+4. Merge static base config with dynamic CRD-derived config
+5. Generate output YAML files in `testdata/output/`
+6. Validate that output can be unmarshaled correctly
+
+## Output Structure
+
+Each generated output file contains:
+- **Static parts** (from base-config.yaml):
+  - embedding_models, bert_model, classifier, prompt_guard
+  - semantic_cache, observability, api, tools
+  - reasoning_families, default_reasoning_effort
+  
+- **Dynamic parts** (from CRDs):
+  - keyword_rules (from signals.keywords)
+  - embedding_rules (from signals.embeddings)
+  - categories (from signals.domains)
+  - decisions (from decisions)
+  - model_config (from IntelligentPool.models)
+  - default_model (from IntelligentPool.defaultModel)
+
@@ -0,0 +1,79 @@
+---
+apiVersion: vllm.ai/v1alpha1
+kind: IntelligentPool
+metadata:
+  name: test-pool
+  namespace: default
+spec:
+  defaultModel: "qwen3-8b"
+  models:
+    - name: "qwen3-8b"
+      reasoningFamily: "qwen3"
+      piiPolicy:
+        allowByDefault: true
+      pricing:
+        inputTokenPrice: 0.000001
+        outputTokenPrice: 0.000002
+      loras:
+        - name: "tech-expert"
+          description: "Technical support specialist"
+---
+apiVersion: vllm.ai/v1alpha1
+kind: IntelligentRoute
+metadata:
+  name: test-route
+  namespace: default
+spec:
+  signals:
+    keywords:
+      - name: "urgent"
+        operator: "OR"
+        keywords: ["urgent", "emergency", "asap"]
+        caseSensitive: false
+    embeddings:
+      - name: "tech_support"
+        threshold: 0.75
+        candidates:
+          - "I need help with technical issues"
+          - "Can you help me troubleshoot this problem?"
+          - "Something is not working correctly"
+        aggregationMethod: "max"
+    domains:
+      - "computer_science"
+      - "math"
+  
+  decisions:
+    - name: "urgent_tech"
+      priority: 100
+      description: "Urgent technical support requests"
+      signals:
+        operator: "AND"
+        conditions:
+          - type: "keyword"
+            name: "urgent"
+          - type: "embedding"
+            name: "tech_support"
+      modelRefs:
+        - model: "qwen3-8b"
+          useReasoning: true
+          reasoningEffort: "medium"
+      plugins:
+        - type: "semantic-cache"
+          configuration:
+            enabled: true
+            threshold: 0.9
+    
+    - name: "general_tech"
+      priority: 50
+      description: "General technical queries"
+      signals:
+        operator: "OR"
+        conditions:
+          - type: "embedding"
+            name: "tech_support"
+          - type: "domain"
+            name: "computer_science"
+      modelRefs:
+        - model: "qwen3-8b"
+          useReasoning: false
+
@@ -0,0 +1,61 @@
+---
+apiVersion: vllm.ai/v1alpha1
+kind: IntelligentPool
+metadata:
+  name: keyword-pool
+  namespace: default
+spec:
+  defaultModel: "base-model"
+  models:
+    - name: "base-model"
+      reasoningFamily: "qwen3"
+      piiPolicy:
+        allowByDefault: true
+      pricing:
+        inputTokenPrice: 0.000001
+        outputTokenPrice: 0.000002
+
+---
+apiVersion: vllm.ai/v1alpha1
+kind: IntelligentRoute
+metadata:
+  name: keyword-route
+  namespace: default
+spec:
+  signals:
+    keywords:
+      - name: "urgent"
+        operator: "OR"
+        keywords: ["urgent", "emergency", "critical", "asap"]
+        caseSensitive: false
+      - name: "greeting"
+        operator: "OR"
+        keywords: ["hello", "hi", "hey", "greetings"]
+        caseSensitive: false
+  
+  decisions:
+    - name: "urgent_request"
+      description: "Handle urgent requests"
+      priority: 100
+      signals:
+        operator: "AND"
+        conditions:
+          - type: "keyword"
+            name: "urgent"
+      modelRefs:
+        - model: "base-model"
+          useReasoning: true
+          reasoningEffort: "high"
+    
+    - name: "greeting_response"
+      description: "Handle greetings"
+      priority: 50
+      signals:
+        operator: "AND"
+        conditions:
+          - type: "keyword"
+            name: "greeting"
+      modelRefs:
+        - model: "base-model"
+          useReasoning: false
+