|
5 | 5 | "profiles": [ |
6 | 6 | { |
7 | 7 | "name": "thinking", |
8 | | - "command": "./llama-cli -hf Qwen/Qwen3-8B-GGUF:Q8_0 --jinja -fa --temp 0.6 --top-k 20 --top-p 0.95 --min-p 0 -c 40960 -n 32768 --no-context-shift", |
| 8 | + "command": "./llama-cli --model bartowski/Qwen_Qwen3-8B-GGUF/Qwen_Qwen3-8B-Q3_K_M.gguf --jinja --flash-attn --temp 0.6 --top-k 20 --top-p 0.95 --min-p 0 --ctx-size 40960 --predict 32768 --no-context-shift", |
9 | 9 | "references": [ |
10 | 10 | "https://qwen.readthedocs.io/en/latest/run_locally/llama.cpp.html#llama-cli", |
11 | 11 | "https://huggingface.co/Qwen/Qwen3-235B-A22B#switching-between-thinking-and-non-thinking-mode" |
12 | 12 | ] |
13 | 13 | }, |
14 | 14 | { |
15 | 15 | "name": "non thinking", |
16 | | - "command": "./llama-cli -hf Qwen/Qwen3-8B-GGUF:Q8_0 --jinja -fa --temp 0.7 --top-k 20 --top-p 0.8 --min-p 0 -c 40960 -n 32768 --no-context-shift", |
| 16 | + "command": "./llama-cli --model bartowski/Qwen_Qwen3-8B-GGUF/Qwen_Qwen3-8B-Q3_K_M.gguf --jinja --flash-attn --temp 0.7 --top-k 20 --top-p 0.8 --min-p 0 --ctx-size 40960 --predict 32768 --no-context-shift", |
17 | 17 | "references": [ |
18 | 18 | "https://qwen.readthedocs.io/en/latest/run_locally/llama.cpp.html#llama-cli", |
19 | 19 | "https://huggingface.co/Qwen/Qwen3-235B-A22B#switching-between-thinking-and-non-thinking-mode" |
|
26 | 26 | "profiles": [ |
27 | 27 | { |
28 | 28 | "name": "chat", |
29 | | - "command": "./llama-cli --model unsloth-QwQ-32B-GGUF/QwQ-32B-Q4_K_M.gguf --ctx-size 16384 --temp 0.6 --repeat-penalty 1.1 --dry-multiplier 0.5 --min-p 0.01 --top-k 40 --top-p 0.95 --samplers \"top_k;top_p;min_p;temperature;dry;typ_p;xtc\"", |
| 29 | + "command": "./llama-cli --model unsloth/QwQ-32B-GGUF/QwQ-32B-Q4_K_M.gguf --ctx-size 32768 --temp 0.6 --repeat-penalty 1.1 --dry-multiplier 0.5 --min-p 0.01 --top-k 40 --top-p 0.95 --samplers \"top_k;top_p;min_p;temperature;dry;typ_p;xtc\"", |
30 | 30 | "references": [ |
31 | 31 | "https://modelscope.cn/models/Qwen/QwQ-32B", |
32 | 32 | "https://huggingface.co/Qwen/QwQ-32B", |
|
40 | 40 | "profiles": [ |
41 | 41 | { |
42 | 42 | "name": "chat", |
43 | | - "command": "./llama-cli --model unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF/Llama-4-Scout-17B-16E-Instruct-UD-IQ2_XXS.gguf --ctx-size 16384 -ot \".ffn_.*_exps.=CPU\" --temp 0.6 --min-p 0.01 --top-p 0.9", |
| 43 | + "command": "./llama-cli --model unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF/Llama-4-Scout-17B-16E-Instruct-UD-IQ2_XXS.gguf --ctx-size 10485760 --temp 0.6 --min-p 0.01 --top-p 0.9", |
44 | 44 | "references": [ |
45 | 45 | "https://www.llama.com/docs/llama-everywhere/running-meta-llama-on-linux/", |
46 | 46 | "https://docs.unsloth.ai/basics/llama-4-how-to-run-and-fine-tune" |
|
53 | 53 | "profiles": [ |
54 | 54 | { |
55 | 55 | "name": "chat", |
56 | | - "command": "./llama-cli --model bartowski/google_gemma-3-27b-it-qat-GGUF/gemma-3-27b-it-Q4_K_M.gguf --ctx-size 16384 --temp 1.0 --repeat-penalty 1.0 --min-p 0.01 --top-k 64 --top-p 0.95", |
| 56 | + "command": "./llama-cli --model bartowski/google_gemma-3-27b-it-qat-GGUF/google_gemma-3-27b-it-qat-Q4_K_M.gguf --ctx-size 131072 --temp 1.0 --repeat-penalty 1.0 --min-p 0.01 --top-k 64 --top-p 0.95", |
57 | 57 | "references": [ |
58 | 58 | "https://ollama.com/library/gemma3/blobs/3116c5225075", |
59 | 59 | "https://docs.unsloth.ai/basics/gemma-3-how-to-run-and-fine-tune" |
|
78 | 78 | "profiles": [ |
79 | 79 | { |
80 | 80 | "name": "chat", |
81 | | - "command": "./llama-cli --model bartowski/agentica-org_DeepCoder-14B-Preview-GGUF/agentica-org_DeepCoder-14B-Preview-Q6_K.gguf --ctx-size 64000 --temp 0.6 --top-p 0.95", |
| 81 | + "command": "./llama-cli --model bartowski/agentica-org_DeepCoder-14B-Preview-GGUF/agentica-org_DeepCoder-14B-Preview-Q6_K.gguf --ctx-size 131072 --temp 0.6 --top-p 0.95", |
82 | 82 | "references": [ |
83 | 83 | "https://huggingface.co/agentica-org/DeepCoder-14B-Preview" |
84 | 84 | ], |
|
0 commit comments