You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard Expand all lines: config/config.yaml
+19 -19 Lines changed: 19 additions & 19 deletions
Original file line number
Diff line number
Diff line change
@@ -1,15 +1,15 @@
1
1
bert_model:
2
-
model_id: sentence-transformers/all-MiniLM-L12-v2
2
+
model_id: models/all-MiniLM-L12-v2
3
3
threshold: 0.6
4
4
use_cpu: true
5
5
6
6
semantic_cache:
7
7
enabled: true
8
-
backend_type: "memory" # Options: "memory" or "milvus"
8
+
backend_type: "memory" # Options: "memory" or "milvus"
9
9
similarity_threshold: 0.8
10
-
max_entries: 1000 # Only applies to memory backend
10
+
max_entries: 1000 # Only applies to memory backend
11
11
ttl_seconds: 3600
12
-
eviction_policy: "fifo"
12
+
eviction_policy: "fifo"
13
13
14
14
tools:
15
15
enabled: true
@@ -32,13 +32,13 @@ prompt_guard:
32
32
# NOT supported: domain names (example.com), protocol prefixes (http://), paths (/api), ports in address (use 'port' field)
33
33
vllm_endpoints:
34
34
- name: "endpoint1"
35
-
address: "172.28.0.20" # Static IPv4 of llm-katan within docker compose network
35
+
address: "172.28.0.20" # Static IPv4 of llm-katan within docker compose network
36
36
port: 8002
37
37
weight: 1
38
38
39
39
model_config:
40
40
"qwen3":
41
-
reasoning_family: "qwen3" # This model uses Qwen-3 reasoning syntax
41
+
reasoning_family: "qwen3" # This model uses Qwen-3 reasoning syntax
42
42
preferred_endpoints: ["endpoint1"]
43
43
pii_policy:
44
44
allow_by_default: true
@@ -65,7 +65,7 @@ categories:
65
65
model_scores:
66
66
- model: qwen3
67
67
score: 0.7
68
-
use_reasoning: false # Business performs better without reasoning
68
+
use_reasoning: false # Business performs better without reasoning
69
69
- name: law
70
70
system_prompt: "You are a knowledgeable legal expert with comprehensive understanding of legal principles, case law, statutory interpretation, and legal procedures across multiple jurisdictions. Provide accurate legal information and analysis while clearly stating that your responses are for informational purposes only and do not constitute legal advice. Always recommend consulting with qualified legal professionals for specific legal matters."
71
71
model_scores:
@@ -89,7 +89,7 @@ categories:
89
89
model_scores:
90
90
- model: qwen3
91
91
score: 0.6
92
-
use_reasoning: true # Enable reasoning for complex chemistry
92
+
use_reasoning: true # Enable reasoning for complex chemistry
93
93
- name: history
94
94
system_prompt: "You are a historian with expertise across different time periods and cultures. Provide accurate historical context and analysis."
95
95
model_scores:
@@ -119,13 +119,13 @@ categories:
119
119
model_scores:
120
120
- model: qwen3
121
121
score: 1.0
122
-
use_reasoning: true # Enable reasoning for complex math
122
+
use_reasoning: true # Enable reasoning for complex math
123
123
- name: physics
124
124
system_prompt: "You are a physics expert with deep understanding of physical laws and phenomena. Provide clear explanations with mathematical derivations when appropriate."
125
125
model_scores:
126
126
- model: qwen3
127
127
score: 0.7
128
-
use_reasoning: true # Enable reasoning for physics
128
+
use_reasoning: true # Enable reasoning for physics
129
129
- name: computer science
130
130
system_prompt: "You are a computer science expert with knowledge of algorithms, data structures, programming languages, and software engineering. Provide clear, practical solutions with code examples when helpful."
0 commit comments