Skip to content

Commit b772bba

Browse files
CUDA: fixed cmake F16 option (#2471)
1 parent 0728c5a commit b772bba

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

CMakeLists.txt

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -73,7 +73,7 @@ set(LLAMA_CUDA_MMQ_Y "64" CACHE STRING "llama: y tile size for mmq CUDA kernels")
 option(LLAMA_CUDA_FORCE_DMMV "llama: use dmmv instead of mmvq CUDA kernels" OFF)
 set(LLAMA_CUDA_DMMV_X "32" CACHE STRING "llama: x stride for dmmv CUDA kernels")
 set(LLAMA_CUDA_MMV_Y "1" CACHE STRING "llama: y block size for mmv CUDA kernels")
-option(LLAMA_CUDA_DMMV_F16 "llama: use 16 bit floats for dmmv CUDA kernels" OFF)
+option(LLAMA_CUDA_F16 "llama: use 16 bit floats for some calculations" OFF)
 set(LLAMA_CUDA_KQUANTS_ITER "2" CACHE STRING "llama: iters./thread per block for Q2_K/Q6_K")
 option(LLAMA_CLBLAST "llama: use CLBlast" OFF)
 option(LLAMA_METAL "llama: use Metal" OFF)
@@ -265,8 +265,8 @@ if (LLAMA_CUBLAS)
 if (DEFINED LLAMA_CUDA_DMMV_Y)
     add_compile_definitions(GGML_CUDA_MMV_Y=${LLAMA_CUDA_DMMV_Y}) # for backwards compatibility
 endif()
-if (LLAMA_CUDA_DMMV_F16)
-    add_compile_definitions(GGML_CUDA_DMMV_F16)
+if (LLAMA_CUDA_F16 OR LLAMA_CUDA_DMMV_F16)
+    add_compile_definitions(GGML_CUDA_F16)
 endif()
 add_compile_definitions(K_QUANTS_PER_ITERATION=${LLAMA_CUDA_KQUANTS_ITER})

0 commit comments

Comments
 (0)