|
19 | 19 |
|
20 | 20 | # Properties by which to differentiate results per commit:
|
21 | 21 | KEY_PROPERTIES = [
|
22 |
| - "cpu_info", "gpu_info", "n_gpu_layers", "main_gpu", "cuda", "opencl", "metal", "gpu_blas", |
23 |
| - "blas", "model_filename", "model_type", "model_size", "model_n_params", "n_batch", "n_threads", |
24 |
| - "type_k", "type_v", "no_kv_offload", "tensor_split", "n_prompt", "n_gen" |
| 22 | + "cpu_info", "gpu_info", "n_gpu_layers", "cuda", "opencl", "vulkan", "kompute", "metal", "sycl", "rpc", "gpu_blas", |
| 23 | + "blas", "model_filename", "model_type", "model_size", "model_n_params", "n_batch", "n_ubatch", "embeddings", "n_threads", |
| 24 | + "type_k", "type_v", "use_mmap", "no_kv_offload", "split_mode", "main_gpu", "tensor_split", "flash_attn", "n_prompt", "n_gen" |
25 | 25 | ]
|
26 | 26 |
|
27 | 27 | # Properties that are boolean and are converted to Yes/No for the table:
|
28 |
| -BOOL_PROPERTIES = ["cuda", "opencl", "metal", "gpu_blas", "blas"] |
| 28 | +BOOL_PROPERTIES = ["cuda", "opencl", "vulkan", "kompute", "metal", "sycl", "gpu_blas", "blas", "embeddings", "use_mmap", "no_kv_offload", "flash_attn"] |
29 | 29 |
|
30 | 30 | # Header names for the table:
|
31 | 31 | PRETTY_NAMES = {
|
32 |
| - "cuda": "CUDA", "opencl": "OpenCL", "metal": "Metal", "gpu_blas": "GPU BLAS", "blas": "BLAS", |
33 |
| - "cpu_info": "CPU", "gpu_info": "GPU", "model_filename": "File", "model_type": "Model", |
34 |
| - "model_size": "Model Size [GiB]", "model_n_params": "Num. of Parameters", |
35 |
| - "n_batch": "Batch size", "n_threads": "Threads", "type_k": "K type", "type_v": "V type", |
36 |
| - "n_gpu_layers": "GPU layers", "main_gpu": "Main GPU", "no_kv_offload": "NKVO", |
37 |
| - "tensor_split": "Tensor split" |
| 32 | + "cuda": "CUDA", "opencl": "OpenCL", "vulkan": "Vulkan", "kompute": "Kompute", "metal": "Metal", "sycl": "SYCL", "rpc": "RPC", |
| 33 | + "gpu_blas": "GPU BLAS", "blas": "BLAS", "cpu_info": "CPU", "gpu_info": "GPU", "model_filename": "File", "model_type": "Model", |
| 34 | + "model_size": "Model Size [GiB]", "model_n_params": "Num. of Par.", "n_batch": "Batch size", "n_ubatch": "Microbatch size", |
| 35 | + "n_threads": "Threads", "type_k": "K type", "type_v": "V type", "n_gpu_layers": "GPU layers", "split_mode": "Split mode", |
| 36 | + "main_gpu": "Main GPU", "no_kv_offload": "NKVO", "flash_attn": "FlashAttention", "tensor_split": "Tensor split", |
| 37 | + "use_mmap": "Use mmap", "embeddings": "Embeddings", |
38 | 38 | }
|
39 | 39 |
|
40 | 40 | DEFAULT_SHOW = ["model_type"] # Always show these properties by default.
|
|
0 commit comments