forked from zilliztech/deep-searcher
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconfig.yaml
More file actions
128 lines (105 loc) · 3.62 KB
/
config.yaml
File metadata and controls
128 lines (105 loc) · 3.62 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
# Provider selection for each pluggable component.
# Every section below takes exactly one active `provider` / `config` pair.
# The commented-out pairs are alternatives: to switch, comment out the active
# pair and strip the leading "# " from one alternative (the indentation is
# already correct). Leaving two pairs active creates duplicate keys, which most
# YAML parsers resolve silently by keeping only the last one.
provide_settings:
  llm:
    provider: "OpenAI"
    config:
      model: "gpt-4o-mini"  # "gpt-o1-mini"
      # api_key: "sk-xxxx"  # Uncomment to override the `OPENAI_API_KEY` environment variable
      # base_url: ""

    # provider: "DeepSeek"
    # config:
    #   model: "deepseek-chat"  # "deepseek-reasoner"
    #   # api_key: "sk-xxxx"  # Uncomment to override the `DEEPSEEK_API_KEY` environment variable
    #   # base_url: ""

    # provider: "SiliconFlow"
    # config:
    #   model: "deepseek-ai/DeepSeek-V3"
    #   # api_key: "xxxx"  # Uncomment to override the `SILICONFLOW_API_KEY` environment variable
    #   # base_url: ""

    # provider: "PPIO"
    # config:
    #   model: "deepseek/deepseek-v3/community"
    #   # api_key: "sk_xxxxxx"  # Uncomment to override the `PPIO_API_KEY` environment variable
    #   # base_url: ""

    # provider: "TogetherAI"
    # config:
    #   model: "deepseek-ai/DeepSeek-V3"
    #   # api_key: "xxxx"  # Uncomment to override the `TOGETHER_API_KEY` environment variable

    # provider: "AzureOpenAI"
    # config:
    #   model: ""
    #   api_version: ""
    #   # azure_endpoint: "xxxx"  # Uncomment to override the `AZURE_OPENAI_ENDPOINT` environment variable
    #   # api_key: "xxxx"  # Uncomment to override the `AZURE_OPENAI_KEY` environment variable

    # provider: "Ollama"
    # config:
    #   model: "qwen2.5:3b"
    #   # base_url: ""

  embedding:
    provider: "OpenAIEmbedding"
    config:
      model: "text-embedding-ada-002"
      # api_key: ""  # Uncomment to override the `OPENAI_API_KEY` environment variable
      # base_url: ""  # Uncomment to override the `OPENAI_BASE_URL` environment variable
      # dimension: 1536  # Uncomment to customize the embedding dimension

    # provider: "MilvusEmbedding"
    # config:
    #   model: "default"

    # provider: "VoyageEmbedding"
    # config:
    #   model: "voyage-3"
    #   # api_key: ""  # Uncomment to override the `VOYAGE_API_KEY` environment variable

    # provider: "BedrockEmbedding"
    # config:
    #   model: "amazon.titan-embed-text-v2:0"
    #   # aws_access_key_id: ""  # Uncomment to override the `AWS_ACCESS_KEY_ID` environment variable
    #   # aws_secret_access_key: ""  # Uncomment to override the `AWS_SECRET_ACCESS_KEY` environment variable

    # provider: "SiliconflowEmbedding"
    # config:
    #   model: "BAAI/bge-m3"
    #   # api_key: ""  # Uncomment to override the `SILICONFLOW_API_KEY` environment variable

  file_loader:
    provider: "PDFLoader"
    config: {}

    # provider: "JsonFileLoader"
    # config:
    #   text_key: ""

    # provider: "TextLoader"
    # config: {}

    # provider: "UnstructuredLoader"
    # config: {}

  web_crawler:
    provider: "FireCrawlCrawler"
    config: {}

    # provider: "Crawl4AICrawler"
    # config:  # Uncomment to customize the browser configuration for Crawl4AI
    #   browser_config:
    #     headless: false
    #     proxy: "http://127.0.0.1:7890"
    #     chrome_channel: "chrome"
    #     verbose: true
    #     viewport_width: 800
    #     viewport_height: 600

    # provider: "JinaCrawler"
    # config: {}

  vector_db:
    provider: "Milvus"
    config:
      default_collection: "deepsearcher"
      uri: "./milvus.db"
      token: "root:Milvus"
      db: "default"

  # Alternative vector store. Comment out the `vector_db` section above before
  # enabling this one, otherwise `vector_db` is defined twice.
  # vector_db:
  #   provider: "OracleDB"
  #   config:
  #     default_collection: "deepsearcher"
  #     user: ""
  #     password: ""
  #     dsn: ""
  #     config_dir: ""
  #     wallet_location: ""
  #     wallet_password: ""
# Query-time settings.
# NOTE(review): `max_iter` is presumably the cap on search iterations per
# query; confirm against the code that consumes this file.
query_settings:
  max_iter: 3
# Document-loading settings.
# NOTE(review): the unit of `chunk_size` / `chunk_overlap` (characters vs.
# tokens) is not stated in this file; confirm against the splitter that
# consumes it.
load_settings:
  chunk_size: 1500
  chunk_overlap: 100