|
15 | 15 | "export", "file", "frequency-penalty", "grammar", "grammar-file", "hellaswag", |
16 | 16 | "hellaswag-tasks", "ignore-eos", "in-prefix", "in-prefix-bos", "in-suffix", |
17 | 17 | "interactive", "interactive-first", "keep", "logdir", "logit-bias", "lora", "lora-base", |
18 | | - "low-vram", "main-gpu", "memory-f32", "mirostat", "mirostat-ent", "mirostat-lr", "mlock", |
| 18 | + "low-vram", "main-gpu", "mirostat", "mirostat-ent", "mirostat-lr", "mlock", |
19 | 19 | "model", "multiline-input", "n-gpu-layers", "n-predict", "no-mmap", "no-mul-mat-q", |
20 | 20 | "np-penalize-nl", "numa", "ppl-output-type", "ppl-stride", "presence-penalty", "prompt", |
21 | 21 | "prompt-cache", "prompt-cache-all", "prompt-cache-ro", "repeat-last-n", |
|
25 | 25 | ] |
26 | 26 |
|
27 | 27 | CLI_ARGS_LLAMA_BENCH = [ |
28 | | - "batch-size", "memory-f32", "low-vram", "model", "mul-mat-q", "n-gen", "n-gpu-layers", |
| 28 | + "batch-size", "low-vram", "model", "mul-mat-q", "n-gen", "n-gpu-layers", |
29 | 29 | "n-prompt", "output", "repetitions", "tensor-split", "threads", "verbose" |
30 | 30 | ] |
31 | 31 |
|
32 | 32 | CLI_ARGS_LLAMA_SERVER = [ |
33 | | - "alias", "batch-size", "ctx-size", "embedding", "host", "memory-f32", "lora", "lora-base", |
| 33 | + "alias", "batch-size", "ctx-size", "embedding", "host", "lora", "lora-base", |
34 | 34 | "low-vram", "main-gpu", "mlock", "model", "n-gpu-layers", "n-probs", "no-mmap", "no-mul-mat-q", |
35 | 35 | "numa", "path", "port", "rope-freq-base", "timeout", "rope-freq-scale", "tensor-split", |
36 | 36 | "threads", "verbose" |
|
0 commit comments