Skip to content

Commit 9bdf109

Browse files
committed
Merge commit '652499ed81bf1c8629073b5589dbd6f5ec014b37'
2 parents 4cf9697 + 652499e commit 9bdf109

File tree

39 files changed

+419
-414
lines changed

39 files changed

+419
-414
lines changed

Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
[package]
22
name = "echokit_server"
3-
version = "0.2.5"
3+
version = "0.3.0"
44
edition = "2021"
55

66
[dependencies]

docker/server-vad/config.toml

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,12 +2,14 @@ addr = "0.0.0.0:8080"
22
hello_wav = "hello.wav"
33

44
[tts]
5-
platform = "Groq"
5+
platform = "openai"
6+
url = "https://api.groq.com/openai/v1/audio/speech"
67
model = "playai-tts"
78
api_key = "gsk_ABCD"
89
voice = "Fritz-PlayAI"
910

1011
[asr]
12+
platform = "openai"
1113
url = "https://api.groq.com/openai/v1/audio/transcriptions"
1214
api_key = "gsk_ABCD"
1315
model = "whisper-large-v3"
@@ -19,7 +21,8 @@ vad_url = "http://localhost:8000/v1/audio/vad"
1921
# vad_realtime_url = "ws://localhost:8000/v1/audio/realtime_vad"
2022

2123
[llm]
22-
llm_chat_url = "https://api.groq.com/openai/v1/chat/completions"
24+
platform = "openai_chat"
25+
url = "https://api.groq.com/openai/v1/chat/completions"
2326
api_key = "gsk_ABCD"
2427
model = "openai/gpt-oss-20b"
2528
history = 5

docker/server/config.toml

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,20 +2,23 @@ addr = "0.0.0.0:8080"
22
hello_wav = "hello.wav"
33

44
[tts]
5-
platform = "Groq"
5+
platform = "openai"
6+
url = "https://api.groq.com/openai/v1/audio/speech"
67
model = "playai-tts"
78
api_key = "gsk_ABCD"
89
voice = "Fritz-PlayAI"
910

1011
[asr]
12+
platform = "openai"
1113
url = "https://api.groq.com/openai/v1/audio/transcriptions"
1214
api_key = "gsk_ABCD"
1315
model = "whisper-large-v3"
1416
lang = "en"
1517
prompt = "Hello\n你好\n(noise)\n(bgm)\n(silence)\n"
1618

1719
[llm]
18-
llm_chat_url = "https://api.groq.com/openai/v1/chat/completions"
20+
platform = "openai_chat"
21+
url = "https://api.groq.com/openai/v1/chat/completions"
1922
api_key = "gsk_ABCD"
2023
model = "openai/gpt-oss-20b"
2124
history = 5

examples/alibailian/config.toml

Lines changed: 26 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -1,56 +1,51 @@
1-
addr = "0.0.0.0:8070"
1+
addr = "0.0.0.0:8080"
22
hello_wav = "hello.wav"
33

4+
# Get your API key from https://bailian.console.aliyun.com/
5+
46
[asr]
5-
# platform = "paraformer_v2"
6-
platform = "ParaformerV2"
7-
paraformer_token = "API Key"
7+
platform = "paraformer_v2"
8+
url = "wss://dashscope.aliyuncs.com/api-ws/v1/inference"
9+
paraformer_token = "sk-API-KEY"
810

9-
# Get your API key from https://bailian.console.aliyun.com/
1011

1112
[tts]
12-
# platform = "cosyvoice"
13-
platform = "CosyVoice"
14-
token = "API Key"
13+
platform = "cosyvoice"
14+
url = "wss://dashscope.aliyuncs.com/api-ws/v1/inference"
15+
token = "sk-API-KEY"
1516
speaker = "longhua_v2"
1617

17-
# Get your API key from https://bailian.console.aliyun.com/
1818
# Supported platforms: cosyvoice-v2 (default) and cosyvoice-v1
1919
# Get speaker list from https://help.aliyun.com/zh/model-studio/cosyvoice-java-sdk#722dd7ca66a6x
2020

2121
[llm]
22-
platform = "chat"
22+
platform = "openai_chat"
2323
url = "https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions"
24-
api_key = "API-key"
24+
api_key = "sk-API-KEY"
2525
model = "qwen-plus"
2626
history = 5
2727

28-
# Get your API key from https://bailian.console.aliyun.com/
29-
# Any text generation models is supported.
30-
28+
[llm.extra]
29+
enable_search = true
3130

3231
[[llm.sys_prompts]]
3332
role = "system"
3433
content = """
35-
你叫胡桃,是一个优秀的翻译官。你现在的任务是,把我给你的中文翻译成英文,并且用英文回答我。
34+
You are a helpful assistant. Answer truthfully and concisely.
3635
37-
你说话时必须满足以下格式
38-
第一行是你当前的状态或者要执行的动作,第二行开始是你的对话内容
36+
- NEVER use bullet points
37+
- NEVER use tables
38+
- Answer in complete sentences as if you are in a conversation.
39+
- Use the web_search tool if you need information about current events such as news, political figures, stock prices, and crypto prices.
3940
40-
比如:
41-
[翻译]
42-
这句话的翻译是 "I am a translator"。
43-
"""
41+
------
4442
45-
[[llm.sys_prompts]]
46-
role = "user"
47-
content = """
48-
我是一个翻译官
49-
"""
43+
您是一位乐于助人的助手。请如实简洁地回答问题。
44+
45+
- 切勿使用列表
46+
- 切勿使用表格
47+
- 请使用完整的句子回答,就像在对话一样。
48+
- 如果您需要了解时事信息,例如新闻、政治人物、股票价格和加密货币价格,请使用 web_search tool。
5049
51-
[[llm.sys_prompts]]
52-
role = "assistant"
53-
content = """
54-
[翻译]
55-
这句话的翻译是 "I am a translator"。
5650
"""
51+

examples/background_gaia.gif

-44.5 KB
Binary file not shown.

examples/background_gosim.gif

-2.68 KB
Binary file not shown.

examples/background_wasmedge.gif

-5.74 KB
Binary file not shown.

examples/gaia/config.toml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,13 +3,13 @@ hello_wav = "hello.wav"
33

44
# Requires a local gsv_tts server at port 9094: https://github.com/second-state/gsv_tts
55
[tts]
6-
platform = "StreamGSV"
6+
platform = "stream_gsv"
77
url = "http://localhost:9094/v1/audio/stream_speech"
88
speaker = "cooper"
99

1010
# Requires a local Whisper API server at port 9092: https://llamaedge.com/docs/ai-models/speech-to-text/quick-start-whisper
1111
[asr]
12-
platform = "whisper"
12+
platform = "openai"
1313
url = "http://localhost:9092/v1/audio/transcriptions"
1414
lang = "auto"
1515
# Requires a local Silero VAD server at port 9093: https://github.com/second-state/silero_vad_server
@@ -18,7 +18,7 @@ vad_url = "http://localhost:9093/v1/audio/vad"
1818

1919
# Requires a local LlamaEdge API server at port 9091: https://llamaedge.com/docs/ai-models/llm/quick-start-llm
2020
[llm]
21-
platform = "chat"
21+
platform = "openai_chat"
2222
url = "http://localhost:9091/v1/chat/completions"
2323
api_key = "Bearer gaia-1234"
2424
model = "default"

examples/gaia/english_teacher/config.toml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -2,21 +2,21 @@ addr = "0.0.0.0:9090"
22
hello_wav = "hello.wav"
33

44
[tts]
5-
platform = "StreamGSV"
5+
platform = "stream_gsv"
66
url = "http://localhost:9094/v1/audio/stream_speech"
77
speaker = "cooper"
88

99
[asr]
10-
platform = "whisper"
10+
platform = "openai"
1111
url = "http://localhost:9092/v1/audio/transcriptions"
1212
lang = "auto"
1313
# vad_url = "http://localhost:9093/v1/audio/vad"
1414
vad_realtime_url = "ws://localhost:9093/v1/audio/realtime_vad"
1515

1616
[llm]
17-
platform = "chat"
17+
platform = "openai_chat"
1818
url = "http://localhost:9091/v1/chat/completions"
19-
api_key = "Bearer gaia-1234"
19+
api_key = "gaia-1234"
2020
history = 5
2121

2222
[[llm.sys_prompts]]

examples/gaia/oppenheimer/config.toml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -2,21 +2,21 @@ addr = "0.0.0.0:9090"
22
hello_wav = "hello.wav"
33

44
[tts]
5-
platform = "StreamGSV"
5+
platform = "stream_gsv"
66
url = "http://localhost:9094/v1/audio/stream_speech"
77
speaker = "cooper"
88

99
[asr]
10-
platform = "whisper"
10+
platform = "openai"
1111
url = "http://localhost:9092/v1/audio/transcriptions"
1212
lang = "auto"
1313
# vad_url = "http://localhost:9093/v1/audio/vad"
1414
vad_realtime_url = "ws://localhost:9093/v1/audio/realtime_vad"
1515

1616
[llm]
17-
platform = "chat"
17+
platform = "openai_chat"
1818
url = "http://localhost:9091/v1/chat/completions"
19-
api_key = "Bearer gaia-1234"
19+
api_key = "gaia-1234"
2020
history = 5
2121

2222
[[llm.sys_prompts]]

0 commit comments

Comments
 (0)