Skip to content

Commit e9c70d5

Browse files
ggerganov authored and hodlen committed
scripts : fix typos, cleanup (ggml-org#5303)
1 parent 9873e98 commit e9c70d5

File tree

1 file changed

+12
-11
lines changed

1 file changed

+12
-11
lines changed

scripts/server-llm.sh

Lines changed: 12 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -14,16 +14,17 @@
1414
# - Might be unstable!
1515
#
1616
# Usage:
17-
# ./server-llm.sh [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose]
17+
# ./server-llm.sh [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose] [--non-interactive]
1818
#
19-
# --port: port number, default is 8888
20-
# --repo: path to a repo containing GGUF model files
21-
# --wtype: weights type (f16, q8_0, q4_0, q4_1), default is user-input
22-
# --backend: cpu, cuda, metal, opencl, depends on the OS
23-
# --gpu-id: gpu id, default is 0
24-
# --n-parallel: number of parallel requests, default is 8
25-
# --n-kv: KV cache size, default is 4096
26-
# --verbose: verbose output
19+
# --port: port number, default is 8888
20+
# --repo: path to a repo containing GGUF model files
21+
# --wtype: weights type (f16, q8_0, q4_0, q4_1), default is user-input
22+
# --backend: cpu, cuda, metal, opencl, depends on the OS
23+
# --gpu-id: gpu id, default is 0
24+
# --n-parallel: number of parallel requests, default is 8
25+
# --n-kv: KV cache size, default is 4096
26+
# --verbose: verbose output
27+
# --non-interactive: run without asking for permission
2728
#
2829
# Example:
2930
#
@@ -67,8 +68,7 @@ verbose=0
6768

6869
function print_usage {
6970
printf "Usage:\n"
70-
printf " ./server-llm.sh [-interactive] [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose]\n\n"
71-
printf " --non-interactive: run without asking a permision to run\n"
71+
printf " ./server-llm.sh [--port] [--repo] [--wtype] [--backend] [--gpu-id] [--n-parallel] [--n-kv] [--verbose] [-non-interactive]\n\n"
7272
printf " --port: port number, default is 8888\n"
7373
printf " --repo: path to a repo containing GGUF model files\n"
7474
printf " --wtype: weights type (f16, q8_0, q4_0, q4_1), default is user-input\n"
@@ -77,6 +77,7 @@ function print_usage {
7777
printf " --n-parallel: number of parallel requests, default is 8\n"
7878
printf " --n-kv: KV cache size, default is 4096\n"
7979
printf " --verbose: verbose output\n\n"
80+
printf " --non-interactive: run without asking a permission to run\n"
8081
printf "Example:\n\n"
8182
printf ' bash -c "$(curl -s https://ggml.ai/server-llm.sh)"\n\n'
8283
}

0 commit comments

Comments
 (0)