Skip to content

Commit c8047d5

Browse files
scripts: update compare_llama_bench.py [no ci] (#7673)
1 parent 30e238b commit c8047d5

File tree

1 file changed

+10
-10
lines changed

1 file changed

+10
-10
lines changed

scripts/compare-llama-bench.py

Lines changed: 10 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -19,22 +19,22 @@
19 19

20 20
# Properties by which to differentiate results per commit:
21 21
KEY_PROPERTIES = [
22-
"cpu_info", "gpu_info", "n_gpu_layers", "main_gpu", "cuda", "opencl", "metal", "gpu_blas",
23-
"blas", "model_filename", "model_type", "model_size", "model_n_params", "n_batch", "n_threads",
24-
"type_k", "type_v", "no_kv_offload", "tensor_split", "n_prompt", "n_gen"
22+
"cpu_info", "gpu_info", "n_gpu_layers", "cuda", "opencl", "vulkan", "kompute", "metal", "sycl", "rpc", "gpu_blas",
23+
"blas", "model_filename", "model_type", "model_size", "model_n_params", "n_batch", "n_ubatch", "embeddings", "n_threads",
24+
"type_k", "type_v", "use_mmap", "no_kv_offload", "split_mode", "main_gpu", "tensor_split", "flash_attn", "n_prompt", "n_gen"
25 25
]
26 26

27 27
# Properties that are boolean and are converted to Yes/No for the table:
28-
BOOL_PROPERTIES = ["cuda", "opencl", "metal", "gpu_blas", "blas"]
28+
BOOL_PROPERTIES = ["cuda", "opencl", "vulkan", "kompute", "metal", "sycl", "gpu_blas", "blas", "embeddings", "use_mmap", "no_kv_offload", "flash_attn"]
29 29

30 30
# Header names for the table:
31 31
PRETTY_NAMES = {
32-
"cuda": "CUDA", "opencl": "OpenCL", "metal": "Metal", "gpu_blas": "GPU BLAS", "blas": "BLAS",
33-
"cpu_info": "CPU", "gpu_info": "GPU", "model_filename": "File", "model_type": "Model",
34-
"model_size": "Model Size [GiB]", "model_n_params": "Num. of Parameters",
35-
"n_batch": "Batch size", "n_threads": "Threads", "type_k": "K type", "type_v": "V type",
36-
"n_gpu_layers": "GPU layers", "main_gpu": "Main GPU", "no_kv_offload": "NKVO",
37-
"tensor_split": "Tensor split"
32+
"cuda": "CUDA", "opencl": "OpenCL", "vulkan": "Vulkan", "kompute": "Kompute", "metal": "Metal", "sycl": "SYCL", "rpc": "RPC",
33+
"gpu_blas": "GPU BLAS", "blas": "BLAS", "cpu_info": "CPU", "gpu_info": "GPU", "model_filename": "File", "model_type": "Model",
34+
"model_size": "Model Size [GiB]", "model_n_params": "Num. of Par.", "n_batch": "Batch size", "n_ubatch": "Microbatch size",
35+
"n_threads": "Threads", "type_k": "K type", "type_v": "V type", "n_gpu_layers": "GPU layers", "split_mode": "Split mode",
36+
"main_gpu": "Main GPU", "no_kv_offload": "NKVO", "flash_attn": "FlashAttention", "tensor_split": "Tensor split",
37+
"use_mmap": "Use mmap", "embeddings": "Embeddings",
38 38
}
39 39

40 40
DEFAULT_SHOW = ["model_type"] # Always show these properties by default.

0 commit comments

Comments
 (0)