Skip to content

Commit 0e018fe

Browse files
committed
ggml : fix Q4_3 cuBLAS
1 parent 857308d commit 0e018fe

File tree

2 files changed

+5
-0
lines changed

2 files changed

+5
-0
lines changed

CMakeLists.txt

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -312,6 +312,7 @@ add_library(ggml OBJECT
312312
target_include_directories(ggml PUBLIC .)
313313
target_compile_features(ggml PUBLIC c_std_11) # don't bump
314314
target_link_libraries(ggml PUBLIC Threads::Threads ${LLAMA_EXTRA_LIBS})
315+
315316
if (BUILD_SHARED_LIBS)
316317
set_target_properties(ggml PROPERTIES POSITION_INDEPENDENT_CODE ON)
317318
endif()
@@ -324,6 +325,7 @@ add_library(llama
324325
target_include_directories(llama PUBLIC .)
325326
target_compile_features(llama PUBLIC cxx_std_11) # don't bump
326327
target_link_libraries(llama PRIVATE ggml ${LLAMA_EXTRA_LIBS})
328+
327329
if (BUILD_SHARED_LIBS)
328330
set_target_properties(llama PROPERTIES POSITION_INDEPENDENT_CODE ON)
329331
target_compile_definitions(llama PRIVATE LLAMA_SHARED LLAMA_BUILD)

ggml.c

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7992,6 +7992,9 @@ static void ggml_compute_forward_mul_mat_q_f32(
79927992
else if (type == GGML_TYPE_Q4_2) {
79937993
dequantize_row_q_cuda = dequantize_row_q4_2_cuda;
79947994
}
7995+
else if (type == GGML_TYPE_Q4_3) {
7996+
dequantize_row_q_cuda = dequantize_row_q4_3_cuda;
7997+
}
79957998
else {
79967999
GGML_ASSERT(false);
79978000
}

0 commit comments

Comments
 (0)