feat: implement decision-based routing with plugin architecture

Xunzhuo · Xunzhuo · commit 7be81a12f210 · 2025-11-18T11:09:30.000+08:00
Signed-off-by: bitliu <bitliu@tencent.com>
diff --git a/deploy/helm/semantic-router/values.yaml b/deploy/helm/semantic-router/values.yaml
@@ -250,21 +250,6 @@ config:
     use_cpu: true
     jailbreak_mapping_path: "models/jailbreak_classifier_modernbert-base_model/jailbreak_type_mapping.json"
 
-  # vLLM endpoints configuration
-  vllm_endpoints:
-    - name: "endpoint1"
-      address: "172.28.0.20"
-      port: 8002
-      weight: 1
-
-  # Model configuration
-  model_config:
-    "qwen3":
-      reasoning_family: "qwen3"
-      preferred_endpoints: ["endpoint1"]
-      pii_policy:
-        allow_by_default: true
-
   # Classifier configuration
   classifier:
     category_model:
@@ -280,102 +265,6 @@ config:
       use_cpu: true
       pii_mapping_path: "models/pii_classifier_modernbert-base_presidio_token_model/pii_type_mapping.json"
 
-  # Categories configuration
-  categories:
-    - name: business
-      system_prompt: "You are a senior business consultant and strategic advisor with expertise in corporate strategy, operations management, financial analysis, marketing, and organizational development. Provide practical, actionable business advice backed by proven methodologies and industry best practices. Consider market dynamics, competitive landscape, and stakeholder interests in your recommendations."
-      model_scores:
-        - model: qwen3
-          score: 0.7
-          use_reasoning: false
-    - name: law
-      system_prompt: "You are a knowledgeable legal expert with comprehensive understanding of legal principles, case law, statutory interpretation, and legal procedures across multiple jurisdictions. Provide accurate legal information and analysis while clearly stating that your responses are for informational purposes only and do not constitute legal advice. Always recommend consulting with qualified legal professionals for specific legal matters."
-      model_scores:
-        - model: qwen3
-          score: 0.4
-          use_reasoning: false
-    - name: psychology
-      system_prompt: "You are a psychology expert with deep knowledge of cognitive processes, behavioral patterns, mental health, developmental psychology, social psychology, and therapeutic approaches. Provide evidence-based insights grounded in psychological research and theory. When discussing mental health topics, emphasize the importance of professional consultation and avoid providing diagnostic or therapeutic advice."
-      semantic_cache_enabled: true
-      semantic_cache_similarity_threshold: 0.92
-      model_scores:
-        - model: qwen3
-          score: 0.6
-          use_reasoning: false
-    - name: biology
-      system_prompt: "You are a biology expert with comprehensive knowledge spanning molecular biology, genetics, cell biology, ecology, evolution, anatomy, physiology, and biotechnology. Explain biological concepts with scientific accuracy, use appropriate terminology, and provide examples from current research. Connect biological principles to real-world applications and emphasize the interconnectedness of biological systems."
-      model_scores:
-        - model: qwen3
-          score: 0.9
-          use_reasoning: false
-    - name: chemistry
-      system_prompt: "You are a chemistry expert specializing in chemical reactions, molecular structures, and laboratory techniques. Provide detailed, step-by-step explanations."
-      model_scores:
-        - model: qwen3
-          score: 0.6
-          use_reasoning: true
-    - name: history
-      system_prompt: "You are a historian with expertise across different time periods and cultures. Provide accurate historical context and analysis."
-      model_scores:
-        - model: qwen3
-          score: 0.7
-          use_reasoning: false
-    - name: other
-      system_prompt: "You are a helpful and knowledgeable assistant. Provide accurate, helpful responses across a wide range of topics."
-      semantic_cache_enabled: true
-      semantic_cache_similarity_threshold: 0.75
-      model_scores:
-        - model: qwen3
-          score: 0.7
-          use_reasoning: false
-    - name: health
-      system_prompt: "You are a health and medical information expert with knowledge of anatomy, physiology, diseases, treatments, preventive care, nutrition, and wellness. Provide accurate, evidence-based health information while emphasizing that your responses are for educational purposes only and should never replace professional medical advice, diagnosis, or treatment. Always encourage users to consult healthcare professionals for medical concerns and emergencies."
-      semantic_cache_enabled: true
-      semantic_cache_similarity_threshold: 0.95
-      model_scores:
-        - model: qwen3
-          score: 0.5
-          use_reasoning: false
-    - name: economics
-      system_prompt: "You are an economics expert with deep understanding of microeconomics, macroeconomics, econometrics, financial markets, monetary policy, fiscal policy, international trade, and economic theory. Analyze economic phenomena using established economic principles, provide data-driven insights, and explain complex economic concepts in accessible terms. Consider both theoretical frameworks and real-world applications in your responses."
-      model_scores:
-        - model: qwen3
-          score: 1.0
-          use_reasoning: false
-    - name: math
-      system_prompt: "You are a mathematics expert. Provide step-by-step solutions, show your work clearly, and explain mathematical concepts in an understandable way."
-      model_scores:
-        - model: qwen3
-          score: 1.0
-          use_reasoning: true
-    - name: physics
-      system_prompt: "You are a physics expert with deep understanding of physical laws and phenomena. Provide clear explanations with mathematical derivations when appropriate."
-      model_scores:
-        - model: qwen3
-          score: 0.7
-          use_reasoning: true
-    - name: computer science
-      system_prompt: "You are a computer science expert with knowledge of algorithms, data structures, programming languages, and software engineering. Provide clear, practical solutions with code examples when helpful."
-      model_scores:
-        - model: qwen3
-          score: 0.6
-          use_reasoning: false
-    - name: philosophy
-      system_prompt: "You are a philosophy expert with comprehensive knowledge of philosophical traditions, ethical theories, logic, metaphysics, epistemology, political philosophy, and the history of philosophical thought. Engage with complex philosophical questions by presenting multiple perspectives, analyzing arguments rigorously, and encouraging critical thinking. Draw connections between philosophical concepts and contemporary issues while maintaining intellectual honesty about the complexity and ongoing nature of philosophical debates."
-      model_scores:
-        - model: qwen3
-          score: 0.5
-          use_reasoning: false
-    - name: engineering
-      system_prompt: "You are an engineering expert with knowledge across multiple engineering disciplines including mechanical, electrical, civil, chemical, software, and systems engineering. Apply engineering principles, design methodologies, and problem-solving approaches to provide practical solutions. Consider safety, efficiency, sustainability, and cost-effectiveness in your recommendations. Use technical precision while explaining concepts clearly, and emphasize the importance of proper engineering practices and standards."
-      model_scores:
-        - model: qwen3
-          score: 0.7
-          use_reasoning: false
-
-  # Default model
-  default_model: "qwen3"
-
   # Reasoning families
   reasoning_families:
     deepseek:
diff --git a/deploy/kubernetes/ai-gateway/semantic-router-values/values.yaml b/deploy/kubernetes/ai-gateway/semantic-router-values/values.yaml
@@ -64,7 +64,7 @@ config:
         conditions:
           - type: "domain"
             category: "business"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: social-expert
           use_reasoning: false
@@ -83,7 +83,7 @@ config:
         conditions:
           - type: "domain"
             category: "law"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: law-expert
           use_reasoning: false
@@ -102,7 +102,7 @@ config:
         conditions:
           - type: "domain"
             category: "psychology"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: humanities-expert
           use_reasoning: false
@@ -125,7 +125,7 @@ config:
         conditions:
           - type: "domain"
             category: "biology"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: science-expert
           use_reasoning: false
@@ -144,7 +144,7 @@ config:
         conditions:
           - type: "domain"
             category: "chemistry"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: science-expert
           use_reasoning: true
@@ -163,7 +163,7 @@ config:
         conditions:
           - type: "domain"
             category: "history"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: humanities-expert
           use_reasoning: false
@@ -182,7 +182,7 @@ config:
         conditions:
           - type: "domain"
             category: "health"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: science-expert
           use_reasoning: false
@@ -205,7 +205,7 @@ config:
         conditions:
           - type: "domain"
             category: "economics"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: social-expert
           use_reasoning: false
@@ -224,7 +224,7 @@ config:
         conditions:
           - type: "domain"
             category: "math"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: math-expert
           use_reasoning: true
@@ -243,7 +243,7 @@ config:
         conditions:
           - type: "domain"
             category: "physics"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: science-expert
           use_reasoning: true
@@ -262,7 +262,7 @@ config:
         conditions:
           - type: "domain"
             category: "computer_science"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: science-expert
           use_reasoning: false
@@ -281,7 +281,7 @@ config:
         conditions:
           - type: "domain"
             category: "philosophy"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: humanities-expert
           use_reasoning: false
@@ -300,7 +300,7 @@ config:
         conditions:
           - type: "domain"
             category: "engineering"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: science-expert
           use_reasoning: false
@@ -319,7 +319,7 @@ config:
         conditions:
           - type: "keyword"
             rule_name: "thinking"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: general-expert
           use_reasoning: true
@@ -338,7 +338,7 @@ config:
         conditions:
           - type: "domain"
             category: "other"
-      model_refs:
+      modelRefs:
         - model: base-model
           lora_name: general-expert
           use_reasoning: false
diff --git a/src/semantic-router/pkg/config/validator.go b/src/semantic-router/pkg/config/validator.go
@@ -85,7 +85,14 @@ func getIPAddressType(address string) string {
 
 // validateConfigStructure performs additional validation on the parsed config
 func validateConfigStructure(cfg *RouterConfig) error {
-	// Validate decisions have at least one model ref
+	// In Kubernetes mode, decisions and model_config will be loaded from CRDs
+	// Skip validation for these fields during initial config parse
+	if cfg.ConfigSource == ConfigSourceKubernetes {
+		// Early return: none of the checks below run in Kubernetes mode.
+		return nil
+	}
+
+	// File mode: validate decisions have at least one model ref
 	for _, decision := range cfg.Decisions {
 		if len(decision.ModelRefs) == 0 {
 			return fmt.Errorf("decision '%s' has no modelRefs defined - each decision must have at least one model", decision.Name)