Skip to content

Commit 4ad7e11

Browse files
committed
Added Q6_K kv cache option
1 parent c8c32fd commit 4ad7e11

File tree

3 files changed

+7
-3
lines changed

3 files changed

+7
-3
lines changed

.gitignore

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,3 +4,7 @@ __pycache__
 .gitignore
 llama.log
 llama.log
+log.txt
+tensor_overrides/Kimi-K2-Instruct-UD-IQ1_S-00001-of-00006_Kimi-K2-Instruct-UD-IQ1_S_kv=q4_0_vv=q4_0_th=24_tb=48_ctx=131072_fa_tensor_params.txt
+tensor_overrides/Kimi-K2-Instruct-UD-IQ1_S-00001-of-00006_Kimi-K2-Instruct-UD-IQ1_S_kv=q4_0_vv=q4_0_th=24_tb=48_ctx=131072_fa_tensor_params_balanced.txt
+tensor_overrides/Kimi-K2-Instruct-UD-IQ1_S-00001-of-00006_Kimi-K2-Instruct-UD-IQ1_S_kv=q4_0_vv=q4_0_th=24_tb=48_ctx=131072_fa_tensor_params_original.txt

llamacpp-server-launcher.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1063,15 +1063,15 @@ def _setup_advanced_tab(self, parent):
10631063
ttk.Label(inner, text="KV Cache Type (--cache-type-k):")\
10641064
.grid(column=0, row=r, sticky="w", padx=10, pady=3)
10651065
# Combobox state is "readonly" for selection, but not disabled
1066-
self.cache_type_k_combo = ttk.Combobox(inner, textvariable=self.cache_type_k, width=10, values=("f16","f32","q8_0","q4_0","q4_1","q5_0","q5_1"), state="readonly")
1066+
self.cache_type_k_combo = ttk.Combobox(inner, textvariable=self.cache_type_k, width=10, values=("f16","f32","q8_0","q4_0","q4_1","q5_0","q5_1","q6_k"), state="readonly")
10671067
self.cache_type_k_combo.grid(column=1, row=r, sticky="w", padx=5, pady=3); r += 1
10681068
ttk.Label(inner, text="Quantization for KV cache (f16 is default, lower Q=more memory saved)", font=("TkSmallCaptionFont"))\
10691069
.grid(column=2, row=r-1, columnspan=2, sticky="w", padx=5, pady=3);
10701070

10711071
ttk.Label(inner, text="V Cache Type (--cache-type-v):")\
10721072
.grid(column=0, row=r, sticky="w", padx=10, pady=3)
10731073
# Combobox state is "readonly" for selection, but not disabled
1074-
self.cache_type_v_combo = ttk.Combobox(inner, textvariable=self.cache_type_v, width=10, values=("f16","f32","q8_0","q4_0","q4_1","q5_0","q5_1"), state="readonly")
1074+
self.cache_type_v_combo = ttk.Combobox(inner, textvariable=self.cache_type_v, width=10, values=("f16","f32","q8_0","q4_0","q4_1","q5_0","q5_1","q6_k"), state="readonly")
10751075
self.cache_type_v_combo.grid(column=1, row=r, sticky="w", padx=5, pady=3); r += 1
10761076
ttk.Label(inner, text="Quantization for V cache (f16 is default, lower Q=more memory saved)", font=("TkSmallCaptionFont"))\
10771077
.grid(column=2, row=r-1, columnspan=2, sticky="w", padx=5, pady=3);

version

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
-2025-07-12-2
+2025-07-22-0

0 commit comments

Comments
 (0)