Skip to content

Commit 95a2041

Browse files
committed
Rebase to CTK 11.7
1 parent a6511d5 commit 95a2041

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

75 files changed

+79715
-48647
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ Dependencies of the CUDA-Python bindings and some versions that are known to
88
work are as follows:
99

1010
* Driver: Linux (450.80.02 or later), Windows (456.38 or later)
11-
* CUDA Toolkit 11.0 to 11.6
11+
* CUDA Toolkit 11.0 to 11.7
1212
* Cython - e.g. 0.29.21
1313

1414
### Compilation

cuda/_cuda/ccuda.pxd

Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -421,6 +421,16 @@ cdef CUresult _cuStreamWriteValue64(CUstream stream, CUdeviceptr addr, cuuint64_
421421

422422
cdef CUresult _cuStreamBatchMemOp(CUstream stream, unsigned int count, CUstreamBatchMemOpParams* paramArray, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
423423

424+
cdef CUresult _cuStreamWaitValue32_v2(CUstream stream, CUdeviceptr addr, cuuint32_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
425+
426+
cdef CUresult _cuStreamWaitValue64_v2(CUstream stream, CUdeviceptr addr, cuuint64_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
427+
428+
cdef CUresult _cuStreamWriteValue32_v2(CUstream stream, CUdeviceptr addr, cuuint32_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
429+
430+
cdef CUresult _cuStreamWriteValue64_v2(CUstream stream, CUdeviceptr addr, cuuint64_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
431+
432+
cdef CUresult _cuStreamBatchMemOp_v2(CUstream stream, unsigned int count, CUstreamBatchMemOpParams* paramArray, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
433+
424434
cdef CUresult _cuFuncGetAttribute(int* pi, CUfunction_attribute attrib, CUfunction hfunc) nogil except ?CUDA_ERROR_NOT_FOUND
425435

426436
cdef CUresult _cuFuncSetAttribute(CUfunction hfunc, CUfunction_attribute attrib, int value) nogil except ?CUDA_ERROR_NOT_FOUND
@@ -515,6 +525,14 @@ cdef CUresult _cuGraphExternalSemaphoresWaitNodeGetParams(CUgraphNode hNode, CUD
515525

516526
cdef CUresult _cuGraphExternalSemaphoresWaitNodeSetParams(CUgraphNode hNode, const CUDA_EXT_SEM_WAIT_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
517527

528+
cdef CUresult _cuGraphAddBatchMemOpNode(CUgraphNode* phGraphNode, CUgraph hGraph, const CUgraphNode* dependencies, size_t numDependencies, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
529+
530+
cdef CUresult _cuGraphBatchMemOpNodeGetParams(CUgraphNode hNode, CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams_out) nogil except ?CUDA_ERROR_NOT_FOUND
531+
532+
cdef CUresult _cuGraphBatchMemOpNodeSetParams(CUgraphNode hNode, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
533+
534+
cdef CUresult _cuGraphExecBatchMemOpNodeSetParams(CUgraphExec hGraphExec, CUgraphNode hNode, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
535+
518536
cdef CUresult _cuGraphAddMemAllocNode(CUgraphNode* phGraphNode, CUgraph hGraph, const CUgraphNode* dependencies, size_t numDependencies, CUDA_MEM_ALLOC_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
519537

520538
cdef CUresult _cuGraphMemAllocNodeGetParams(CUgraphNode hNode, CUDA_MEM_ALLOC_NODE_PARAMS* params_out) nogil except ?CUDA_ERROR_NOT_FOUND
@@ -713,6 +731,10 @@ cdef CUresult _cuGraphicsUnmapResources(unsigned int count, CUgraphicsResource*
713731

714732
cdef CUresult _cuGetProcAddress(const char* symbol, void** pfn, int cudaVersion, cuuint64_t flags) nogil except ?CUDA_ERROR_NOT_FOUND
715733

734+
cdef CUresult _cuModuleGetLoadingMode(CUmoduleLoadingMode* mode) nogil except ?CUDA_ERROR_NOT_FOUND
735+
736+
cdef CUresult _cuMemGetHandleForAddressRange(void* handle, CUdeviceptr dptr, size_t size, CUmemRangeHandleType handleType, unsigned long long flags) nogil except ?CUDA_ERROR_NOT_FOUND
737+
716738
cdef CUresult _cuGetExportTable(const void** ppExportTable, const CUuuid* pExportTableId) nogil except ?CUDA_ERROR_NOT_FOUND
717739

718740
cdef CUresult _cuProfilerInitialize(const char* configFile, const char* outputFile, CUoutput_mode outputMode) nogil except ?CUDA_ERROR_NOT_FOUND

cuda/_cuda/ccuda.pyx

Lines changed: 217 additions & 0 deletions
Large diffs are not rendered by default.

cuda/ccuda.pxd

Lines changed: 81 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -203,10 +203,17 @@ cdef enum CUstreamBatchMemOpType_enum:
203203
CU_STREAM_MEM_OP_WRITE_VALUE_32 = 2
204204
CU_STREAM_MEM_OP_WAIT_VALUE_64 = 4
205205
CU_STREAM_MEM_OP_WRITE_VALUE_64 = 5
206+
CU_STREAM_MEM_OP_BARRIER = 6
206207
CU_STREAM_MEM_OP_FLUSH_REMOTE_WRITES = 3
207208

208209
ctypedef CUstreamBatchMemOpType_enum CUstreamBatchMemOpType
209210

211+
cdef enum CUstreamMemoryBarrier_flags_enum:
212+
CU_STREAM_MEMORY_BARRIER_TYPE_SYS = 0
213+
CU_STREAM_MEMORY_BARRIER_TYPE_GPU = 1
214+
215+
ctypedef CUstreamMemoryBarrier_flags_enum CUstreamMemoryBarrier_flags
216+
210217
cdef struct CUstreamMemOpWaitValueParams_st:
211218
CUstreamBatchMemOpType operation
212219
CUdeviceptr address
@@ -225,17 +232,30 @@ cdef struct CUstreamMemOpFlushRemoteWritesParams_st:
225232
CUstreamBatchMemOpType operation
226233
unsigned int flags
227234

235+
cdef struct CUstreamMemOpMemoryBarrierParams_st:
236+
CUstreamBatchMemOpType operation
237+
unsigned int flags
238+
228239
cdef union CUstreamBatchMemOpParams_union:
229240
CUstreamBatchMemOpType operation
230241
CUstreamMemOpWaitValueParams_st waitValue
231242
CUstreamMemOpWriteValueParams_st writeValue
232243
CUstreamMemOpFlushRemoteWritesParams_st flushRemoteWrites
244+
CUstreamMemOpMemoryBarrierParams_st memoryBarrier
233245
cuuint64_t pad[6]
234246

235247
ctypedef CUstreamBatchMemOpParams_union CUstreamBatchMemOpParams_v1
236248

237249
ctypedef CUstreamBatchMemOpParams_v1 CUstreamBatchMemOpParams
238250

251+
cdef struct CUDA_BATCH_MEM_OP_NODE_PARAMS_st:
252+
CUcontext ctx
253+
unsigned int count
254+
CUstreamBatchMemOpParams* paramArray
255+
unsigned int flags
256+
257+
ctypedef CUDA_BATCH_MEM_OP_NODE_PARAMS_st CUDA_BATCH_MEM_OP_NODE_PARAMS
258+
239259
cdef enum CUoccupancy_flags_enum:
240260
CU_OCCUPANCY_DEFAULT = 0
241261
CU_OCCUPANCY_DISABLE_CACHING_OVERRIDE = 1
@@ -428,7 +448,10 @@ cdef enum CUdevice_attribute_enum:
428448
CU_DEVICE_ATTRIBUTE_GPU_DIRECT_RDMA_WRITES_ORDERING = 118
429449
CU_DEVICE_ATTRIBUTE_MEMPOOL_SUPPORTED_HANDLE_TYPES = 119
430450
CU_DEVICE_ATTRIBUTE_DEFERRED_MAPPING_CUDA_ARRAY_SUPPORTED = 121
431-
CU_DEVICE_ATTRIBUTE_MAX = 122
451+
CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS_V2 = 122
452+
CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR_V2 = 123
453+
CU_DEVICE_ATTRIBUTE_DMA_BUF_SUPPORTED = 124
454+
CU_DEVICE_ATTRIBUTE_MAX = 125
432455

433456
ctypedef CUdevice_attribute_enum CUdevice_attribute
434457

@@ -466,6 +489,9 @@ cdef enum CUpointer_attribute_enum:
466489
CU_POINTER_ATTRIBUTE_IS_GPU_DIRECT_RDMA_CAPABLE = 15
467490
CU_POINTER_ATTRIBUTE_ACCESS_FLAGS = 16
468491
CU_POINTER_ATTRIBUTE_MEMPOOL_HANDLE = 17
492+
CU_POINTER_ATTRIBUTE_MAPPING_SIZE = 18
493+
CU_POINTER_ATTRIBUTE_MAPPING_BASE_ADDR = 19
494+
CU_POINTER_ATTRIBUTE_MEMORY_BLOCK_ID = 20
469495

470496
ctypedef CUpointer_attribute_enum CUpointer_attribute
471497

@@ -565,7 +591,12 @@ cdef enum CUjit_option_enum:
565591
CU_JIT_PREC_DIV = 22
566592
CU_JIT_PREC_SQRT = 23
567593
CU_JIT_FMA = 24
568-
CU_JIT_NUM_OPTIONS = 25
594+
CU_JIT_REFERENCED_KERNEL_NAMES = 25
595+
CU_JIT_REFERENCED_KERNEL_COUNT = 26
596+
CU_JIT_REFERENCED_VARIABLE_NAMES = 27
597+
CU_JIT_REFERENCED_VARIABLE_COUNT = 28
598+
CU_JIT_OPTIMIZE_UNUSED_DEVICE_VARIABLES = 29
599+
CU_JIT_NUM_OPTIONS = 30
569600

570601
ctypedef CUjit_option_enum CUjit_option
571602

@@ -587,6 +618,7 @@ cdef enum CUjit_target_enum:
587618
CU_TARGET_COMPUTE_75 = 75
588619
CU_TARGET_COMPUTE_80 = 80
589620
CU_TARGET_COMPUTE_86 = 86
621+
CU_TARGET_COMPUTE_87 = 87
590622

591623
ctypedef CUjit_target_enum CUjit_target
592624

@@ -734,6 +766,7 @@ cdef enum CUgraphNodeType_enum:
734766
CU_GRAPH_NODE_TYPE_EXT_SEMAS_WAIT = 9
735767
CU_GRAPH_NODE_TYPE_MEM_ALLOC = 10
736768
CU_GRAPH_NODE_TYPE_MEM_FREE = 11
769+
CU_GRAPH_NODE_TYPE_BATCH_MEM_OP = 12
737770

738771
ctypedef CUgraphNodeType_enum CUgraphNodeType
739772

@@ -748,12 +781,14 @@ ctypedef CUsynchronizationPolicy_enum CUsynchronizationPolicy
748781
cdef enum CUkernelNodeAttrID_enum:
749782
CU_KERNEL_NODE_ATTRIBUTE_ACCESS_POLICY_WINDOW = 1
750783
CU_KERNEL_NODE_ATTRIBUTE_COOPERATIVE = 2
784+
CU_KERNEL_NODE_ATTRIBUTE_PRIORITY = 8
751785

752786
ctypedef CUkernelNodeAttrID_enum CUkernelNodeAttrID
753787

754788
cdef union CUkernelNodeAttrValue_union:
755789
CUaccessPolicyWindow accessPolicyWindow
756790
int cooperative
791+
int priority
757792

758793
ctypedef CUkernelNodeAttrValue_union CUkernelNodeAttrValue_v1
759794

@@ -829,6 +864,7 @@ cdef enum cudaError_enum:
829864
CUDA_ERROR_PROFILER_ALREADY_STARTED = 7
830865
CUDA_ERROR_PROFILER_ALREADY_STOPPED = 8
831866
CUDA_ERROR_STUB_LIBRARY = 34
867+
CUDA_ERROR_DEVICE_UNAVAILABLE = 46
832868
CUDA_ERROR_NO_DEVICE = 100
833869
CUDA_ERROR_INVALID_DEVICE = 101
834870
CUDA_ERROR_DEVICE_NOT_LICENSED = 102
@@ -1388,6 +1424,12 @@ cdef enum CUmemAllocationGranularity_flags_enum:
13881424

13891425
ctypedef CUmemAllocationGranularity_flags_enum CUmemAllocationGranularity_flags
13901426

1427+
cdef enum CUmemRangeHandleType_enum:
1428+
CU_MEM_RANGE_HANDLE_TYPE_DMA_BUF_FD = 1
1429+
CU_MEM_RANGE_HANDLE_TYPE_MAX = 2147483647
1430+
1431+
ctypedef CUmemRangeHandleType_enum CUmemRangeHandleType
1432+
13911433
cdef enum CUarraySparseSubresourceType_enum:
13921434
CU_ARRAY_SPARSE_SUBRESOURCE_TYPE_SPARSE_LEVEL = 0
13931435
CU_ARRAY_SPARSE_SUBRESOURCE_TYPE_MIPTAIL = 1
@@ -1585,6 +1627,7 @@ cdef enum CUgraphDebugDot_flags_enum:
15851627
CU_GRAPH_DEBUG_DOT_FLAGS_HANDLES = 1024
15861628
CU_GRAPH_DEBUG_DOT_FLAGS_MEM_ALLOC_NODE_PARAMS = 2048
15871629
CU_GRAPH_DEBUG_DOT_FLAGS_MEM_FREE_NODE_PARAMS = 4096
1630+
CU_GRAPH_DEBUG_DOT_FLAGS_BATCH_MEM_OP_NODE_PARAMS = 8192
15881631

15891632
ctypedef CUgraphDebugDot_flags_enum CUgraphDebugDot_flags
15901633

@@ -1600,6 +1643,7 @@ ctypedef CUuserObjectRetain_flags_enum CUuserObjectRetain_flags
16001643

16011644
cdef enum CUgraphInstantiate_flags_enum:
16021645
CUDA_GRAPH_INSTANTIATE_FLAG_AUTO_FREE_ON_LAUNCH = 1
1646+
CUDA_GRAPH_INSTANTIATE_FLAG_USE_NODE_PRIORITY = 8
16031647

16041648
ctypedef CUgraphInstantiate_flags_enum CUgraphInstantiate_flags
16051649

@@ -2017,6 +2061,16 @@ cdef CUresult cuStreamWriteValue64(CUstream stream, CUdeviceptr addr, cuuint64_t
20172061

20182062
cdef CUresult cuStreamBatchMemOp(CUstream stream, unsigned int count, CUstreamBatchMemOpParams* paramArray, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
20192063

2064+
cdef CUresult cuStreamWaitValue32_v2(CUstream stream, CUdeviceptr addr, cuuint32_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
2065+
2066+
cdef CUresult cuStreamWaitValue64_v2(CUstream stream, CUdeviceptr addr, cuuint64_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
2067+
2068+
cdef CUresult cuStreamWriteValue32_v2(CUstream stream, CUdeviceptr addr, cuuint32_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
2069+
2070+
cdef CUresult cuStreamWriteValue64_v2(CUstream stream, CUdeviceptr addr, cuuint64_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
2071+
2072+
cdef CUresult cuStreamBatchMemOp_v2(CUstream stream, unsigned int count, CUstreamBatchMemOpParams* paramArray, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND
2073+
20202074
cdef CUresult cuFuncGetAttribute(int* pi, CUfunction_attribute attrib, CUfunction hfunc) nogil except ?CUDA_ERROR_NOT_FOUND
20212075

20222076
cdef CUresult cuFuncSetAttribute(CUfunction hfunc, CUfunction_attribute attrib, int value) nogil except ?CUDA_ERROR_NOT_FOUND
@@ -2111,6 +2165,14 @@ cdef CUresult cuGraphExternalSemaphoresWaitNodeGetParams(CUgraphNode hNode, CUDA
21112165

21122166
cdef CUresult cuGraphExternalSemaphoresWaitNodeSetParams(CUgraphNode hNode, const CUDA_EXT_SEM_WAIT_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
21132167

2168+
cdef CUresult cuGraphAddBatchMemOpNode(CUgraphNode* phGraphNode, CUgraph hGraph, const CUgraphNode* dependencies, size_t numDependencies, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
2169+
2170+
cdef CUresult cuGraphBatchMemOpNodeGetParams(CUgraphNode hNode, CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams_out) nogil except ?CUDA_ERROR_NOT_FOUND
2171+
2172+
cdef CUresult cuGraphBatchMemOpNodeSetParams(CUgraphNode hNode, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
2173+
2174+
cdef CUresult cuGraphExecBatchMemOpNodeSetParams(CUgraphExec hGraphExec, CUgraphNode hNode, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
2175+
21142176
cdef CUresult cuGraphAddMemAllocNode(CUgraphNode* phGraphNode, CUgraph hGraph, const CUgraphNode* dependencies, size_t numDependencies, CUDA_MEM_ALLOC_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND
21152177

21162178
cdef CUresult cuGraphMemAllocNodeGetParams(CUgraphNode hNode, CUDA_MEM_ALLOC_NODE_PARAMS* params_out) nogil except ?CUDA_ERROR_NOT_FOUND
@@ -2309,6 +2371,16 @@ cdef CUresult cuGraphicsUnmapResources(unsigned int count, CUgraphicsResource* r
23092371

23102372
cdef CUresult cuGetProcAddress(const char* symbol, void** pfn, int cudaVersion, cuuint64_t flags) nogil except ?CUDA_ERROR_NOT_FOUND
23112373

2374+
cdef enum CUmoduleLoadingMode_enum:
2375+
CU_MODULE_EAGER_LOADING = 1
2376+
CU_MODULE_LAZY_LOADING = 2
2377+
2378+
ctypedef CUmoduleLoadingMode_enum CUmoduleLoadingMode
2379+
2380+
cdef CUresult cuModuleGetLoadingMode(CUmoduleLoadingMode* mode) nogil except ?CUDA_ERROR_NOT_FOUND
2381+
2382+
cdef CUresult cuMemGetHandleForAddressRange(void* handle, CUdeviceptr dptr, size_t size, CUmemRangeHandleType handleType, unsigned long long flags) nogil except ?CUDA_ERROR_NOT_FOUND
2383+
23122384
cdef CUresult cuGetExportTable(const void** ppExportTable, const CUuuid* pExportTableId) nogil except ?CUDA_ERROR_NOT_FOUND
23132385

23142386
cdef enum CUoutput_mode_enum:
@@ -2562,7 +2634,7 @@ cdef enum CUGLmap_flags_enum:
25622634

25632635
ctypedef CUGLmap_flags_enum CUGLmap_flags
25642636

2565-
cdef enum: CUDA_VERSION = 11060
2637+
cdef enum: CUDA_VERSION = 11070
25662638

25672639
cdef enum: CU_IPC_HANDLE_SIZE = 64
25682640

@@ -2632,10 +2704,16 @@ cdef enum: CU_TRSF_DISABLE_TRILINEAR_OPTIMIZATION = 32
26322704

26332705
cdef enum: CU_TRSF_SEAMLESS_CUBEMAP = 64
26342706

2707+
cdef enum: CU_LAUNCH_PARAM_END_AS_INT = 0
2708+
26352709
cdef enum: CU_LAUNCH_PARAM_END = 0
26362710

2711+
cdef enum: CU_LAUNCH_PARAM_BUFFER_POINTER_AS_INT = 1
2712+
26372713
cdef enum: CU_LAUNCH_PARAM_BUFFER_POINTER = 1
26382714

2715+
cdef enum: CU_LAUNCH_PARAM_BUFFER_SIZE_AS_INT = 2
2716+
26392717
cdef enum: CU_LAUNCH_PARAM_BUFFER_SIZE = 2
26402718

26412719
cdef enum: CU_PARAM_TR_DEFAULT = -1

cuda/ccuda.pyx

Lines changed: 33 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -628,6 +628,21 @@ cdef CUresult cuStreamWriteValue64(CUstream stream, CUdeviceptr addr, cuuint64_t
628628
cdef CUresult cuStreamBatchMemOp(CUstream stream, unsigned int count, CUstreamBatchMemOpParams* paramArray, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND:
629629
return ccuda._cuStreamBatchMemOp(stream, count, paramArray, flags)
630630

631+
cdef CUresult cuStreamWaitValue32_v2(CUstream stream, CUdeviceptr addr, cuuint32_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND:
632+
return ccuda._cuStreamWaitValue32_v2(stream, addr, value, flags)
633+
634+
cdef CUresult cuStreamWaitValue64_v2(CUstream stream, CUdeviceptr addr, cuuint64_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND:
635+
return ccuda._cuStreamWaitValue64_v2(stream, addr, value, flags)
636+
637+
cdef CUresult cuStreamWriteValue32_v2(CUstream stream, CUdeviceptr addr, cuuint32_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND:
638+
return ccuda._cuStreamWriteValue32_v2(stream, addr, value, flags)
639+
640+
cdef CUresult cuStreamWriteValue64_v2(CUstream stream, CUdeviceptr addr, cuuint64_t value, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND:
641+
return ccuda._cuStreamWriteValue64_v2(stream, addr, value, flags)
642+
643+
cdef CUresult cuStreamBatchMemOp_v2(CUstream stream, unsigned int count, CUstreamBatchMemOpParams* paramArray, unsigned int flags) nogil except ?CUDA_ERROR_NOT_FOUND:
644+
return ccuda._cuStreamBatchMemOp_v2(stream, count, paramArray, flags)
645+
631646
cdef CUresult cuFuncGetAttribute(int* pi, CUfunction_attribute attrib, CUfunction hfunc) nogil except ?CUDA_ERROR_NOT_FOUND:
632647
return ccuda._cuFuncGetAttribute(pi, attrib, hfunc)
633648

@@ -769,6 +784,18 @@ cdef CUresult cuGraphExternalSemaphoresWaitNodeGetParams(CUgraphNode hNode, CUDA
769784
cdef CUresult cuGraphExternalSemaphoresWaitNodeSetParams(CUgraphNode hNode, const CUDA_EXT_SEM_WAIT_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND:
770785
return ccuda._cuGraphExternalSemaphoresWaitNodeSetParams(hNode, nodeParams)
771786

787+
cdef CUresult cuGraphAddBatchMemOpNode(CUgraphNode* phGraphNode, CUgraph hGraph, const CUgraphNode* dependencies, size_t numDependencies, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND:
788+
return ccuda._cuGraphAddBatchMemOpNode(phGraphNode, hGraph, dependencies, numDependencies, nodeParams)
789+
790+
cdef CUresult cuGraphBatchMemOpNodeGetParams(CUgraphNode hNode, CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams_out) nogil except ?CUDA_ERROR_NOT_FOUND:
791+
return ccuda._cuGraphBatchMemOpNodeGetParams(hNode, nodeParams_out)
792+
793+
cdef CUresult cuGraphBatchMemOpNodeSetParams(CUgraphNode hNode, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND:
794+
return ccuda._cuGraphBatchMemOpNodeSetParams(hNode, nodeParams)
795+
796+
cdef CUresult cuGraphExecBatchMemOpNodeSetParams(CUgraphExec hGraphExec, CUgraphNode hNode, const CUDA_BATCH_MEM_OP_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND:
797+
return ccuda._cuGraphExecBatchMemOpNodeSetParams(hGraphExec, hNode, nodeParams)
798+
772799
cdef CUresult cuGraphAddMemAllocNode(CUgraphNode* phGraphNode, CUgraph hGraph, const CUgraphNode* dependencies, size_t numDependencies, CUDA_MEM_ALLOC_NODE_PARAMS* nodeParams) nogil except ?CUDA_ERROR_NOT_FOUND:
773800
return ccuda._cuGraphAddMemAllocNode(phGraphNode, hGraph, dependencies, numDependencies, nodeParams)
774801

@@ -1066,6 +1093,12 @@ cdef CUresult cuGraphicsUnmapResources(unsigned int count, CUgraphicsResource* r
10661093
cdef CUresult cuGetProcAddress(const char* symbol, void** pfn, int cudaVersion, cuuint64_t flags) nogil except ?CUDA_ERROR_NOT_FOUND:
10671094
return ccuda._cuGetProcAddress(symbol, pfn, cudaVersion, flags)
10681095

1096+
cdef CUresult cuModuleGetLoadingMode(CUmoduleLoadingMode* mode) nogil except ?CUDA_ERROR_NOT_FOUND:
1097+
return ccuda._cuModuleGetLoadingMode(mode)
1098+
1099+
cdef CUresult cuMemGetHandleForAddressRange(void* handle, CUdeviceptr dptr, size_t size, CUmemRangeHandleType handleType, unsigned long long flags) nogil except ?CUDA_ERROR_NOT_FOUND:
1100+
return ccuda._cuMemGetHandleForAddressRange(handle, dptr, size, handleType, flags)
1101+
10691102
cdef CUresult cuGetExportTable(const void** ppExportTable, const CUuuid* pExportTableId) nogil except ?CUDA_ERROR_NOT_FOUND:
10701103
return ccuda._cuGetExportTable(ppExportTable, pExportTableId)
10711104

0 commit comments

Comments
 (0)