Skip to content

Commit e882c8b

Browse files
committed
swap to distilled model
1 parent baddb41 commit e882c8b

File tree

1 file changed

+10
-4
lines changed

1 file changed

+10
-4
lines changed

kubernetes/apps/base/llm/openclaw/llama-35b/helmrelease.yaml

Lines changed: 10 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -26,13 +26,19 @@ spec:
26 26    - |
27 27    set -euo pipefail
28 28
29    -  if [ ! -s /models/qwen35b/Qwen3.5-35B-A3B-UD-Q4_K_XL.gguf ] || [ ! -s /models/qwen35b/mmproj-F16.gguf ]; then
   29 +  if [ ! -s /models/qwen35b/Qwen3.5-35B-A3B-Claude-4.6-Opus-Reasoning-Distilled.i1-Q4_K_M.gguf ] || [ ! -s /models/qwen35b/mmproj-F16.gguf ]; then
30 30    pip install --no-cache-dir huggingface_hub
31 31    mkdir -p /models/qwen35b
32    -  rm -rf /models/qwen35b/.cache/huggingface/download/Qwen3.5-35B-A3B-UD-Q4_K_XL.gguf.lock
   32 +  rm -rf /models/qwen35b/.cache/huggingface/download/Qwen3.5-35B-A3B-Claude-4.6-Opus-Reasoning-Distilled.i1-Q4_K_M.gguf.lock
   33 +  rm -rf /models/qwen35b/.cache/huggingface/download/mmproj-F16.gguf.lock
   34 +
   35 +  hf download \
   36 +  mradermacher/Qwen3.5-35B-A3B-Claude-4.6-Opus-Reasoning-Distilled-i1-GGUF \
   37 +  Qwen3.5-35B-A3B-Claude-4.6-Opus-Reasoning-Distilled.i1-Q4_K_M.gguf \
   38 +  --local-dir /models/qwen35b
   39 +
33 40    hf download \
34 41    unsloth/Qwen3.5-35B-A3B-GGUF \
35    -  Qwen3.5-35B-A3B-UD-Q4_K_XL.gguf \
36 42    mmproj-F16.gguf \
37 43    --local-dir /models/qwen35b
38 44
@@ -68,7 +74,7 @@ spec:
68 74    - --alias
69 75    - qwen35b
70 76    - --model
71    -  - /models/qwen35b/Qwen3.5-35B-A3B-UD-Q4_K_XL.gguf
   77 +  - /models/qwen35b/Qwen3.5-35B-A3B-Claude-4.6-Opus-Reasoning-Distilled.i1-Q4_K_M.gguf
72 78    - --mmproj
73 79    - /models/qwen35b/mmproj-F16.gguf
74 80    - --ctx-size

0 commit comments

Comments
 (0)