Skip to content

Commit 6266f14

Browse files
CUDA: mul_mat_q RDNA2 tunings
1 parent 230d46c commit 6266f14

File tree

3 files changed

+255
-40
lines changed

3 files changed

+255
-40
lines changed

CMakeLists.txt

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -377,7 +377,6 @@ if (LLAMA_HIPBLAS)
377 377   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_DMMV_X=${LLAMA_CUDA_DMMV_X})
378 378   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_MMV_Y=${LLAMA_CUDA_MMV_Y})
379 379   target_compile_definitions(ggml-rocm PRIVATE K_QUANTS_PER_ITERATION=${LLAMA_CUDA_KQUANTS_ITER})
380     - target_compile_definitions(ggml-rocm PRIVATE CC_TURING=1000000000)
381 380   set_source_files_properties(ggml-cuda.cu PROPERTIES LANGUAGE CXX)
382 381   target_link_libraries(ggml-rocm PRIVATE hip::device PUBLIC hip::host roc::rocblas roc::hipblas)
383 382

Makefile

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -295,7 +295,6 @@ ifdef LLAMA_HIPBLAS
295 295   HIPFLAGS += -DGGML_CUDA_DMMV_X=$(LLAMA_CUDA_DMMV_X)
296 296   HIPFLAGS += -DGGML_CUDA_MMV_Y=$(LLAMA_CUDA_MMV_Y)
297 297   HIPFLAGS += -DK_QUANTS_PER_ITERATION=$(LLAMA_CUDA_KQUANTS_ITER)
298     - HIPFLAGS += -DCC_TURING=1000000000
299 298   ifdef LLAMA_CUDA_FORCE_DMMV
300 299   HIPFLAGS += -DGGML_CUDA_FORCE_DMMV
301 300   endif # LLAMA_CUDA_FORCE_DMMV

0 commit comments

Comments
 (0)