|
15 | 15 | "export", "file", "frequency-penalty", "grammar", "grammar-file", "hellaswag",
|
16 | 16 | "hellaswag-tasks", "ignore-eos", "in-prefix", "in-prefix-bos", "in-suffix",
|
17 | 17 | "interactive", "interactive-first", "keep", "logdir", "logit-bias", "lora", "lora-base",
|
18 |
| - "low-vram", "main-gpu", "memory-f32", "mirostat", "mirostat-ent", "mirostat-lr", "mlock", |
| 18 | + "low-vram", "main-gpu", "mirostat", "mirostat-ent", "mirostat-lr", "mlock", |
19 | 19 | "model", "multiline-input", "n-gpu-layers", "n-predict", "no-mmap", "no-mul-mat-q",
|
20 | 20 | "np-penalize-nl", "numa", "ppl-output-type", "ppl-stride", "presence-penalty", "prompt",
|
21 | 21 | "prompt-cache", "prompt-cache-all", "prompt-cache-ro", "repeat-last-n",
|
|
25 | 25 | ]
|
26 | 26 |
|
27 | 27 | CLI_ARGS_LLAMA_BENCH = [
|
28 |
| - "batch-size", "memory-f32", "low-vram", "model", "mul-mat-q", "n-gen", "n-gpu-layers", |
| 28 | + "batch-size", "low-vram", "model", "mul-mat-q", "n-gen", "n-gpu-layers", |
29 | 29 | "n-prompt", "output", "repetitions", "tensor-split", "threads", "verbose"
|
30 | 30 | ]
|
31 | 31 |
|
32 | 32 | CLI_ARGS_LLAMA_SERVER = [
|
33 |
| - "alias", "batch-size", "ctx-size", "embedding", "host", "memory-f32", "lora", "lora-base", |
| 33 | + "alias", "batch-size", "ctx-size", "embedding", "host", "lora", "lora-base", |
34 | 34 | "low-vram", "main-gpu", "mlock", "model", "n-gpu-layers", "n-probs", "no-mmap", "no-mul-mat-q",
|
35 | 35 | "numa", "path", "port", "rope-freq-base", "timeout", "rope-freq-scale", "tensor-split",
|
36 | 36 | "threads", "verbose"
|
|
0 commit comments