Skip to content
This repository was archived by the owner on Oct 15, 2025. It is now read-only.

Commit 6842d8f

Browse files
committed
add tool-calling quickstart
Signed-off-by: sallyom <somalley@redhat.com>
1 parent 83a237c commit 6842d8f

File tree

1 file changed

+50
-0
lines changed

1 file changed

+50
-0
lines changed
Lines changed: 50 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,50 @@
# NOTE(review): this is a diff rendering of a values file. Each "N+" line is
# the diff's added-line marker, and the YAML indentation is not visible here,
# so the key nesting described below must be confirmed against the real file.
1+
# To run this example:
2+
# ./llmd-installer.sh --values-file examples/tool-calling/llama3-2-tool-calling.yaml
3+
# Sample application settings. Presumably baseConfigMapRefName and model are
# nested under this key -- TODO confirm.
sampleApplication:
4+
baseConfigMapRefName: basic-gpu-preset
5+
model:
6+
# hf:// URI for the model artifact; modelName below repeats the same
# "meta-llama/Llama-3.2-3B-Instruct" identifier as a quoted string.
modelArtifactURI: hf://meta-llama/Llama-3.2-3B-Instruct
7+
modelName: "meta-llama/Llama-3.2-3B-Instruct"
8+
redis:
9+
# Presumably redis.enabled: this example sets it to false -- confirm nesting.
enabled: false
# prefill and decode below each set replicas to 1 and carry an identical
# extraArgs list. NOTE(review): indentation is not visible in this diff view,
# so whether prefill/decode sit under modelservice (or another parent) must be
# confirmed against the real file.
10+
modelservice:
11+
prefill:
12+
replicas: 1
13+
# Flags and their values are separate list items: --tool-call-parser is
# followed by llama3_json, and --chat-template by the template path.
# Presumably these are appended to the vLLM server command line -- TODO confirm.
extraArgs:
14+
- --enable-auto-tool-choice
15+
- --tool-call-parser
16+
- llama3_json
17+
- --chat-template
18+
# See https://github.com/neuralmagic/vllm/tree/main/examples for other templates
19+
- /workspace/vllm/examples/tool_chat_template_llama3.2_json.jinja
20+
decode:
21+
replicas: 1
22+
# Same five-item argument list as the prefill extraArgs above; keep the two
# lists in sync when changing the parser or template.
extraArgs:
23+
- --enable-auto-tool-choice
24+
- --tool-call-parser
25+
- llama3_json
26+
- --chat-template
27+
# See https://github.com/neuralmagic/vllm/tree/main/examples for other templates
28+
- /workspace/vllm/examples/tool_chat_template_llama3.2_json.jinja
# Environment-variable overrides for epp, given as name/value pairs. Every
# value is a quoted string, so "true"/"false"/"10" stay strings rather than
# being typed as booleans or integers by the YAML parser.
# NOTE(review): indentation is not visible in this diff view; the parent of
# epp must be confirmed against the real file.
29+
epp:
30+
defaultEnvVarsOverride:
31+
# Scorer toggles: only the prefix-aware and load-aware scorers are "true";
# the KV-cache-aware and session-aware scorers are "false".
- name: ENABLE_KVCACHE_AWARE_SCORER
32+
value: "false"
33+
- name: ENABLE_PREFIX_AWARE_SCORER
34+
value: "true"
35+
- name: ENABLE_LOAD_AWARE_SCORER
36+
value: "true"
37+
- name: ENABLE_SESSION_AWARE_SCORER
38+
value: "false"
39+
# PD_ENABLED is "false" here. NOTE(review): "PD" presumably refers to
# prefill/decode disaggregation, with PD_PROMPT_LEN_THRESHOLD as its
# prompt-length cutoff -- confirm against the consumer of these variables.
- name: PD_ENABLED
40+
value: "false"
41+
- name: PD_PROMPT_LEN_THRESHOLD
42+
value: "10"
43+
# All four PREFILL_* scorer toggles are "false" in this example.
- name: PREFILL_ENABLE_KVCACHE_AWARE_SCORER
44+
value: "false"
45+
- name: PREFILL_ENABLE_LOAD_AWARE_SCORER
46+
value: "false"
47+
- name: PREFILL_ENABLE_PREFIX_AWARE_SCORER
48+
value: "false"
49+
- name: PREFILL_ENABLE_SESSION_AWARE_SCORER
50+
value: "false"

0 commit comments

Comments
 (0)