Skip to content

Commit 0640427

Browse files
committed
limit to GGML_ALLOW_CUDA_GRAPHS defined in llama.cpp cmake
1 parent 4087596 commit 0640427

File tree

2 files changed

+2
-1
lines changed

2 files changed

+2
-1
lines changed

CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -413,6 +413,7 @@ if (LLAMA_CUDA)
413 | 413 |   | list(APPEND GGML_SOURCES_CUDA "ggml-cuda.cu")
414 | 414 |   |
415 | 415 |   | add_compile_definitions(GGML_USE_CUDA)
    | 416 | + | add_compile_definitions(GGML_ALLOW_CUDA_GRAPHS)
416 | 417 |   | if (LLAMA_CUDA_FORCE_DMMV)
417 | 418 |   | add_compile_definitions(GGML_CUDA_FORCE_DMMV)
418 | 419 |   | endif()

ggml-cuda.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2405,7 +2405,7 @@ GGML_CALL static void ggml_backend_cuda_synchronize(ggml_backend_t backend) {
2405 | 2405 |   | GGML_UNUSED(backend);
2406 | 2406 |   | }
2407 | 2407 |   |
2408 |      | - | #if (CUDART_VERSION >= 12000)
     | 2408 | + | #if (CUDART_VERSION >= 12000) && defined(GGML_ALLOW_CUDA_GRAPHS)
2409 | 2409 |   | #define USE_CUDA_GRAPH
2410 | 2410 |   | #endif
2411 | 2411 |   |

0 commit comments

Comments
 (0)