Skip to content

Commit 82323fb

Browse files
committed
fix
Signed-off-by: yuluo-yx <[email protected]>
1 parent 805a082 commit 82323fb

File tree

2 files changed

+61
-20
lines changed

2 files changed

+61
-20
lines changed
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
1+
{{- if not (lookup "v1" "Namespace" "" (include "semantic-router.namespace" .)) }}
# Renders a Namespace manifest only when the lookup above finds no existing
# Namespace with the name produced by the "semantic-router.namespace" helper.
# NOTE(review): per the Helm docs, lookup returns an empty result when Helm does
# not contact the cluster (helm template, client-side dry-run), so this manifest
# is presumably always rendered in those modes - confirm.
# NOTE(review): after a first install the lookup will find the Namespace this
# chart created, so the manifest would drop out of the next upgrade's output;
# verify Helm does not then delete the Namespace (a "helm.sh/resource-policy: keep"
# annotation may be needed).
12
apiVersion: v1
23
kind: Namespace
34
metadata:
45
name: {{ include "semantic-router.namespace" . }}
56
labels:
67
{{- include "semantic-router.labels" . | nindent 4 }}
8+
{{- end }}

deploy/helm/semantic-router/values.yaml

Lines changed: 59 additions & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -137,6 +137,8 @@ initContainer:
137137
cpu: "250m"
138138
# -- Models to download
139139
models:
140+
- name: all-MiniLM-L12-v2
141+
repo: sentence-transformers/all-MiniLM-L12-v2
140142
- name: category_classifier_modernbert-base_model
141143
repo: LLM-Semantic-Router/category_classifier_modernbert-base_model
142144
- name: pii_classifier_modernbert-base_model
@@ -213,7 +215,7 @@ persistence:
213215
config:
214216
# BERT model configuration
215217
bert_model:
216-
model_id: sentence-transformers/all-MiniLM-L12-v2
218+
model_id: models/all-MiniLM-L12-v2
217219
threshold: 0.6
218220
use_cpu: true
219221

@@ -246,14 +248,14 @@ config:
246248
# vLLM endpoints configuration
247249
vllm_endpoints:
248250
- name: "endpoint1"
249-
address: "127.0.0.1"
250-
port: 8000
251+
address: "172.28.0.20"
252+
port: 8002
251253
weight: 1
252254

253255
# Model configuration
254256
model_config:
255-
"openai/gpt-oss-20b":
256-
reasoning_family: "gpt-oss"
257+
"qwen3":
258+
reasoning_family: "qwen3"
257259
preferred_endpoints: ["endpoint1"]
258260
pii_policy:
259261
allow_by_default: true
@@ -276,78 +278,98 @@ config:
276278
# Categories configuration
277279
categories:
278280
- name: business
281+
system_prompt: "You are a senior business consultant and strategic advisor with expertise in corporate strategy, operations management, financial analysis, marketing, and organizational development. Provide practical, actionable business advice backed by proven methodologies and industry best practices. Consider market dynamics, competitive landscape, and stakeholder interests in your recommendations."
279282
model_scores:
280-
- model: openai/gpt-oss-20b
283+
- model: qwen3
281284
score: 0.7
282285
use_reasoning: false
283286
- name: law
287+
system_prompt: "You are a knowledgeable legal expert with comprehensive understanding of legal principles, case law, statutory interpretation, and legal procedures across multiple jurisdictions. Provide accurate legal information and analysis while clearly stating that your responses are for informational purposes only and do not constitute legal advice. Always recommend consulting with qualified legal professionals for specific legal matters."
284288
model_scores:
285-
- model: openai/gpt-oss-20b
289+
- model: qwen3
286290
score: 0.4
287291
use_reasoning: false
288292
- name: psychology
293+
system_prompt: "You are a psychology expert with deep knowledge of cognitive processes, behavioral patterns, mental health, developmental psychology, social psychology, and therapeutic approaches. Provide evidence-based insights grounded in psychological research and theory. When discussing mental health topics, emphasize the importance of professional consultation and avoid providing diagnostic or therapeutic advice."
294+
semantic_cache_enabled: true
295+
semantic_cache_similarity_threshold: 0.92
289296
model_scores:
290-
- model: openai/gpt-oss-20b
297+
- model: qwen3
291298
score: 0.6
292299
use_reasoning: false
293300
- name: biology
301+
system_prompt: "You are a biology expert with comprehensive knowledge spanning molecular biology, genetics, cell biology, ecology, evolution, anatomy, physiology, and biotechnology. Explain biological concepts with scientific accuracy, use appropriate terminology, and provide examples from current research. Connect biological principles to real-world applications and emphasize the interconnectedness of biological systems."
294302
model_scores:
295-
- model: openai/gpt-oss-20b
303+
- model: qwen3
296304
score: 0.9
297305
use_reasoning: false
298306
- name: chemistry
307+
system_prompt: "You are a chemistry expert specializing in chemical reactions, molecular structures, and laboratory techniques. Provide detailed, step-by-step explanations."
299308
model_scores:
300-
- model: openai/gpt-oss-20b
309+
- model: qwen3
301310
score: 0.6
302311
use_reasoning: true
303312
- name: history
313+
system_prompt: "You are a historian with expertise across different time periods and cultures. Provide accurate historical context and analysis."
304314
model_scores:
305-
- model: openai/gpt-oss-20b
315+
- model: qwen3
306316
score: 0.7
307317
use_reasoning: false
308318
- name: other
319+
system_prompt: "You are a helpful and knowledgeable assistant. Provide accurate, helpful responses across a wide range of topics."
320+
semantic_cache_enabled: true
321+
semantic_cache_similarity_threshold: 0.75
309322
model_scores:
310-
- model: openai/gpt-oss-20b
323+
- model: qwen3
311324
score: 0.7
312325
use_reasoning: false
313326
- name: health
327+
system_prompt: "You are a health and medical information expert with knowledge of anatomy, physiology, diseases, treatments, preventive care, nutrition, and wellness. Provide accurate, evidence-based health information while emphasizing that your responses are for educational purposes only and should never replace professional medical advice, diagnosis, or treatment. Always encourage users to consult healthcare professionals for medical concerns and emergencies."
328+
semantic_cache_enabled: true
329+
semantic_cache_similarity_threshold: 0.95
314330
model_scores:
315-
- model: openai/gpt-oss-20b
331+
- model: qwen3
316332
score: 0.5
317333
use_reasoning: false
318334
- name: economics
335+
system_prompt: "You are an economics expert with deep understanding of microeconomics, macroeconomics, econometrics, financial markets, monetary policy, fiscal policy, international trade, and economic theory. Analyze economic phenomena using established economic principles, provide data-driven insights, and explain complex economic concepts in accessible terms. Consider both theoretical frameworks and real-world applications in your responses."
319336
model_scores:
320-
- model: openai/gpt-oss-20b
337+
- model: qwen3
321338
score: 1.0
322339
use_reasoning: false
323340
- name: math
341+
system_prompt: "You are a mathematics expert. Provide step-by-step solutions, show your work clearly, and explain mathematical concepts in an understandable way."
324342
model_scores:
325-
- model: openai/gpt-oss-20b
343+
- model: qwen3
326344
score: 1.0
327345
use_reasoning: true
328346
- name: physics
347+
system_prompt: "You are a physics expert with deep understanding of physical laws and phenomena. Provide clear explanations with mathematical derivations when appropriate."
329348
model_scores:
330-
- model: openai/gpt-oss-20b
349+
- model: qwen3
331350
score: 0.7
332351
use_reasoning: true
333352
- name: computer science
353+
system_prompt: "You are a computer science expert with knowledge of algorithms, data structures, programming languages, and software engineering. Provide clear, practical solutions with code examples when helpful."
334354
model_scores:
335-
- model: openai/gpt-oss-20b
355+
- model: qwen3
336356
score: 0.6
337357
use_reasoning: false
338358
- name: philosophy
359+
system_prompt: "You are a philosophy expert with comprehensive knowledge of philosophical traditions, ethical theories, logic, metaphysics, epistemology, political philosophy, and the history of philosophical thought. Engage with complex philosophical questions by presenting multiple perspectives, analyzing arguments rigorously, and encouraging critical thinking. Draw connections between philosophical concepts and contemporary issues while maintaining intellectual honesty about the complexity and ongoing nature of philosophical debates."
339360
model_scores:
340-
- model: openai/gpt-oss-20b
361+
- model: qwen3
341362
score: 0.5
342363
use_reasoning: false
343364
- name: engineering
365+
system_prompt: "You are an engineering expert with knowledge across multiple engineering disciplines including mechanical, electrical, civil, chemical, software, and systems engineering. Apply engineering principles, design methodologies, and problem-solving approaches to provide practical solutions. Consider safety, efficiency, sustainability, and cost-effectiveness in your recommendations. Use technical precision while explaining concepts clearly, and emphasize the importance of proper engineering practices and standards."
344366
model_scores:
345-
- model: openai/gpt-oss-20b
367+
- model: qwen3
346368
score: 0.7
347369
use_reasoning: false
348370

349371
# Default model
350-
default_model: "openai/gpt-oss-20b"
372+
default_model: "qwen3"
351373

352374
# Reasoning families
353375
reasoning_families:
@@ -381,6 +403,23 @@ config:
381403
duration_buckets: [0.001, 0.005, 0.01, 0.025, 0.05, 0.1, 0.25, 0.5, 1, 2.5, 5, 10, 30]
382404
size_buckets: [1, 2, 5, 10, 20, 50, 100, 200]
383405

406+
# Observability configuration
# Tracing settings: provider, exporter target, sampling, and the service
# identity fields listed under "resource".
407+
observability:
408+
tracing:
409+
# NOTE(review): tracing is switched on in these values - confirm that is the
# intended chart default.
enabled: true
410+
provider: "opentelemetry"
411+
exporter:
412+
type: "otlp"
413+
# NOTE(review): presumably the host:port of an OTLP collector reachable as
# "jaeger" - verify that name resolves in the target cluster.
endpoint: "jaeger:4317"
414+
# NOTE(review): presumably disables TLS on the exporter connection - confirm.
insecure: true
415+
sampling:
416+
# NOTE(review): "always_on" with rate 1.0 looks like every request is sampled -
# confirm this is acceptable outside development.
type: "always_on"
417+
rate: 1.0
418+
resource:
419+
service_name: "vllm-semantic-router"
420+
service_version: "v0.1.0"
421+
deployment_environment: "development"
422+
384423
# Tools database configuration
385424
toolsDb:
386425
- tool:

0 commit comments

Comments
 (0)