Skip to content

Commit 91bb39c

Browse files
authored
cuda: fix vmm oom issue on NVIDIA AGX Orin (#4687)
Signed-off-by: hydai <[email protected]>
1 parent 04ac060 commit 91bb39c

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml-cuda.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6662,7 +6662,7 @@ static void ggml_cuda_pool_free_leg(int device, void * ptr, size_t size) {
 // pool with virtual memory
 static CUdeviceptr g_cuda_pool_addr[GGML_CUDA_MAX_DEVICES] = {0};
 static size_t g_cuda_pool_used[GGML_CUDA_MAX_DEVICES] = {0};
-static const size_t CUDA_POOL_VMM_MAX_SIZE = 1ull << 36; // 64 GB
+static const size_t CUDA_POOL_VMM_MAX_SIZE = 1ull << 35; // 32 GB
 
 static void * ggml_cuda_pool_malloc_vmm(int device, size_t size, size_t * actual_size) {
     scoped_spin_lock lock(g_cuda_pool_lock);

0 commit comments

Comments
 (0)