Skip to content

Commit a76cada

Browse files
committed
use recommended granularity instead of minimum
1 parent 2c3fbf9 commit a76cada

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml-cuda.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6840,7 +6840,7 @@ void ggml_init_cublas() {
6840 6840
alloc_prop.type = CU_MEM_ALLOCATION_TYPE_PINNED;
6841 6841
alloc_prop.location.type = CU_MEM_LOCATION_TYPE_DEVICE;
6842 6842
alloc_prop.location.id = id;
6843-
CU_CHECK(cuMemGetAllocationGranularity(&g_device_caps[id].vmm_granularity, &alloc_prop, CU_MEM_ALLOC_GRANULARITY_MINIMUM));
6843+
CU_CHECK(cuMemGetAllocationGranularity(&g_device_caps[id].vmm_granularity, &alloc_prop, CU_MEM_ALLOC_GRANULARITY_RECOMMENDED));
6844 6844
}
6845 6845
#endif // !defined(GGML_USE_HIPBLAS)
6846 6846
g_device_caps[id].vmm = !!device_vmm;

0 commit comments

Comments
 (0)