This repository was archived by the owner on Oct 15, 2025. It is now read-only.
File tree Expand file tree Collapse file tree 1 file changed +50
-0
lines changed
quickstart/examples/tool-calling Expand file tree Collapse file tree 1 file changed +50
-0
lines changed Original file line number Diff line number Diff line change
# To run this example:
#   ./llmd-installer.sh --values-file examples/tool-calling/llama3-2-tool-calling.yaml
# Values override for the tool-calling example using Llama-3.2-3B-Instruct.
#
# NOTE(review): this block was recovered from a diff view that had lost all
# indentation. The nesting below is reconstructed from key order (prefill,
# decode and epp placed as siblings under `modelservice`) -- confirm against
# the chart's values schema before relying on it.
sampleApplication:
  baseConfigMapRefName: basic-gpu-preset
  model:
    modelArtifactURI: hf://meta-llama/Llama-3.2-3B-Instruct
    modelName: "meta-llama/Llama-3.2-3B-Instruct"

redis:
  enabled: false

modelservice:
  # prefill and decode carry the same tool-calling arguments; keep the two
  # lists in sync when changing the parser or the chat template.
  prefill:
    replicas: 1
    extraArgs:
      - --enable-auto-tool-choice
      - --tool-call-parser
      - llama3_json
      - --chat-template
      # See https://github.com/neuralmagic/vllm/tree/main/examples for other templates
      - /workspace/vllm/examples/tool_chat_template_llama3.2_json.jinja
  decode:
    replicas: 1
    extraArgs:
      - --enable-auto-tool-choice
      - --tool-call-parser
      - llama3_json
      - --chat-template
      # See https://github.com/neuralmagic/vllm/tree/main/examples for other templates
      - /workspace/vllm/examples/tool_chat_template_llama3.2_json.jinja
  epp:
    # Environment variable values are quoted so they stay strings rather
    # than being parsed as YAML booleans or integers.
    defaultEnvVarsOverride:
      - name: ENABLE_KVCACHE_AWARE_SCORER
        value: "false"
      - name: ENABLE_PREFIX_AWARE_SCORER
        value: "true"
      - name: ENABLE_LOAD_AWARE_SCORER
        value: "true"
      - name: ENABLE_SESSION_AWARE_SCORER
        value: "false"
      - name: PD_ENABLED
        value: "false"
      - name: PD_PROMPT_LEN_THRESHOLD
        value: "10"
      - name: PREFILL_ENABLE_KVCACHE_AWARE_SCORER
        value: "false"
      - name: PREFILL_ENABLE_LOAD_AWARE_SCORER
        value: "false"
      - name: PREFILL_ENABLE_PREFIX_AWARE_SCORER
        value: "false"
      - name: PREFILL_ENABLE_SESSION_AWARE_SCORER
        value: "false"
You can’t perform that action at this time.
0 commit comments