14
14
# - Might be unstable!
15
15
#
16
16
# Usage:
17
- # ./server-llm.sh [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose]
17
+ # ./server-llm.sh [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose] [--non-interactive]
18
18
#
19
- # --port: port number, default is 8888
20
- # --repo: path to a repo containing GGUF model files
21
- # --wtype: weights type (f16, q8_0, q4_0, q4_1), default is user-input
22
- # --backend: cpu, cuda, metal, opencl, depends on the OS
23
- # --gpu-id: gpu id, default is 0
24
- # --n-parallel: number of parallel requests, default is 8
25
- # --n-kv: KV cache size, default is 4096
26
- # --verbose: verbose output
19
+ # --port: port number, default is 8888
20
+ # --repo: path to a repo containing GGUF model files
21
+ # --wtype: weights type (f16, q8_0, q4_0, q4_1), default is user-input
22
+ # --backend: cpu, cuda, metal, opencl, depends on the OS
23
+ # --gpu-id: gpu id, default is 0
24
+ # --n-parallel: number of parallel requests, default is 8
25
+ # --n-kv: KV cache size, default is 4096
26
+ # --verbose: verbose output
27
+ # --non-interactive: run without asking for permission
27
28
#
28
29
# Example:
29
30
#
@@ -67,8 +68,7 @@ verbose=0
67
68
68
69
function print_usage {
69
70
printf " Usage:\n"
70
- printf " ./server-llm.sh [-interactive] [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose]\n\n"
71
- printf " --non-interactive: run without asking a permision to run\n"
71
+ printf " ./server-llm.sh [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose] [-non-interactive]\n\n"
72
72
printf " --port: port number, default is 8888\n"
73
73
printf " --repo: path to a repo containing GGUF model files\n"
74
74
printf " --wtype: weights type (f16, q8_0, q4_0, q4_1), default is user-input\n"
@@ -77,6 +77,7 @@ function print_usage {
77
77
printf " --n-parallel: number of parallel requests, default is 8\n"
78
78
printf " --n-kv: KV cache size, default is 4096\n"
79
79
printf " --verbose: verbose output\n\n"
80
+ printf " --non-interactive: run without asking a permission to run\n"
80
81
printf " Example:\n\n"
81
82
printf ' bash -c "$(curl -s https://ggml.ai/server-llm.sh)"\n\n'
82
83
}
0 commit comments