tinygrad 0.10.2__py3-none-any.whl → 0.11.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (131)
  1. tinygrad/__init__.py +1 -1
  2. tinygrad/apps/llm.py +206 -0
  3. tinygrad/codegen/__init__.py +116 -0
  4. tinygrad/codegen/devectorizer.py +315 -172
  5. tinygrad/codegen/expander.py +8 -16
  6. tinygrad/codegen/gpudims.py +89 -0
  7. tinygrad/codegen/linearize.py +205 -203
  8. tinygrad/codegen/lowerer.py +92 -139
  9. tinygrad/codegen/opt/__init__.py +38 -0
  10. tinygrad/codegen/opt/heuristic.py +125 -0
  11. tinygrad/codegen/opt/kernel.py +510 -0
  12. tinygrad/{engine → codegen/opt}/search.py +51 -35
  13. tinygrad/codegen/opt/swizzler.py +134 -0
  14. tinygrad/codegen/opt/tc.py +127 -0
  15. tinygrad/codegen/quantize.py +67 -0
  16. tinygrad/device.py +122 -132
  17. tinygrad/dtype.py +152 -35
  18. tinygrad/engine/jit.py +81 -54
  19. tinygrad/engine/memory.py +46 -27
  20. tinygrad/engine/realize.py +82 -41
  21. tinygrad/engine/schedule.py +70 -445
  22. tinygrad/frontend/__init__.py +0 -0
  23. tinygrad/frontend/onnx.py +1253 -0
  24. tinygrad/frontend/torch.py +5 -0
  25. tinygrad/gradient.py +19 -27
  26. tinygrad/helpers.py +95 -47
  27. tinygrad/nn/__init__.py +7 -8
  28. tinygrad/nn/optim.py +72 -41
  29. tinygrad/nn/state.py +37 -23
  30. tinygrad/renderer/__init__.py +40 -60
  31. tinygrad/renderer/cstyle.py +143 -128
  32. tinygrad/renderer/llvmir.py +113 -62
  33. tinygrad/renderer/ptx.py +50 -32
  34. tinygrad/renderer/wgsl.py +27 -23
  35. tinygrad/runtime/autogen/am/am.py +5861 -0
  36. tinygrad/runtime/autogen/am/pm4_nv.py +962 -0
  37. tinygrad/runtime/autogen/am/pm4_soc15.py +931 -0
  38. tinygrad/runtime/autogen/am/sdma_4_0_0.py +5209 -0
  39. tinygrad/runtime/autogen/am/sdma_4_4_2.py +5209 -0
  40. tinygrad/runtime/autogen/am/sdma_5_0_0.py +7103 -0
  41. tinygrad/runtime/autogen/am/sdma_6_0_0.py +8085 -0
  42. tinygrad/runtime/autogen/am/smu_v13_0_0.py +3068 -0
  43. tinygrad/runtime/autogen/am/smu_v14_0_2.py +3605 -0
  44. tinygrad/runtime/autogen/amd_gpu.py +1433 -67197
  45. tinygrad/runtime/autogen/comgr.py +35 -9
  46. tinygrad/runtime/autogen/comgr_3.py +906 -0
  47. tinygrad/runtime/autogen/cuda.py +2419 -494
  48. tinygrad/runtime/autogen/hsa.py +57 -16
  49. tinygrad/runtime/autogen/ib.py +7171 -0
  50. tinygrad/runtime/autogen/io_uring.py +917 -118
  51. tinygrad/runtime/autogen/kfd.py +748 -26
  52. tinygrad/runtime/autogen/libc.py +613 -218
  53. tinygrad/runtime/autogen/libusb.py +1643 -0
  54. tinygrad/runtime/autogen/nv/nv.py +8602 -0
  55. tinygrad/runtime/autogen/nv_gpu.py +7218 -2072
  56. tinygrad/runtime/autogen/opencl.py +2 -4
  57. tinygrad/runtime/autogen/sqtt.py +1789 -0
  58. tinygrad/runtime/autogen/vfio.py +3 -3
  59. tinygrad/runtime/autogen/webgpu.py +273 -264
  60. tinygrad/runtime/graph/cuda.py +3 -3
  61. tinygrad/runtime/graph/hcq.py +68 -29
  62. tinygrad/runtime/graph/metal.py +29 -13
  63. tinygrad/runtime/graph/remote.py +114 -0
  64. tinygrad/runtime/ops_amd.py +537 -320
  65. tinygrad/runtime/ops_cpu.py +108 -7
  66. tinygrad/runtime/ops_cuda.py +12 -14
  67. tinygrad/runtime/ops_disk.py +13 -10
  68. tinygrad/runtime/ops_dsp.py +47 -40
  69. tinygrad/runtime/ops_gpu.py +13 -11
  70. tinygrad/runtime/ops_hip.py +6 -9
  71. tinygrad/runtime/ops_llvm.py +35 -15
  72. tinygrad/runtime/ops_metal.py +29 -19
  73. tinygrad/runtime/ops_npy.py +5 -3
  74. tinygrad/runtime/ops_null.py +28 -0
  75. tinygrad/runtime/ops_nv.py +306 -234
  76. tinygrad/runtime/ops_python.py +62 -52
  77. tinygrad/runtime/ops_qcom.py +28 -39
  78. tinygrad/runtime/ops_remote.py +482 -0
  79. tinygrad/runtime/ops_webgpu.py +28 -28
  80. tinygrad/runtime/support/am/amdev.py +114 -249
  81. tinygrad/runtime/support/am/ip.py +211 -172
  82. tinygrad/runtime/support/amd.py +138 -0
  83. tinygrad/runtime/support/{compiler_hip.py → compiler_amd.py} +40 -8
  84. tinygrad/runtime/support/compiler_cuda.py +8 -11
  85. tinygrad/runtime/support/elf.py +2 -1
  86. tinygrad/runtime/support/hcq.py +184 -97
  87. tinygrad/runtime/support/ib.py +172 -0
  88. tinygrad/runtime/support/llvm.py +3 -4
  89. tinygrad/runtime/support/memory.py +251 -0
  90. tinygrad/runtime/support/nv/__init__.py +0 -0
  91. tinygrad/runtime/support/nv/ip.py +581 -0
  92. tinygrad/runtime/support/nv/nvdev.py +183 -0
  93. tinygrad/runtime/support/system.py +170 -0
  94. tinygrad/runtime/support/usb.py +268 -0
  95. tinygrad/runtime/support/webgpu.py +18 -0
  96. tinygrad/schedule/__init__.py +0 -0
  97. tinygrad/schedule/grouper.py +119 -0
  98. tinygrad/schedule/kernelize.py +368 -0
  99. tinygrad/schedule/multi.py +231 -0
  100. tinygrad/shape/shapetracker.py +40 -46
  101. tinygrad/shape/view.py +88 -52
  102. tinygrad/tensor.py +968 -542
  103. tinygrad/uop/__init__.py +117 -0
  104. tinygrad/{codegen/transcendental.py → uop/decompositions.py} +125 -38
  105. tinygrad/uop/mathtraits.py +169 -0
  106. tinygrad/uop/ops.py +1021 -0
  107. tinygrad/uop/spec.py +228 -0
  108. tinygrad/{codegen → uop}/symbolic.py +239 -216
  109. tinygrad/uop/upat.py +163 -0
  110. tinygrad/viz/assets/cdnjs.cloudflare.com/ajax/libs/highlight.js/11.10.0/languages/x86asm.min.js +19 -0
  111. tinygrad/viz/assets/d3js.org/d3.v7.min.js +2 -0
  112. tinygrad/viz/assets/dagrejs.github.io/project/dagre/latest/dagre.min.js +801 -0
  113. tinygrad/viz/index.html +203 -403
  114. tinygrad/viz/js/index.js +718 -0
  115. tinygrad/viz/js/worker.js +29 -0
  116. tinygrad/viz/serve.py +224 -102
  117. {tinygrad-0.10.2.dist-info → tinygrad-0.11.0.dist-info}/METADATA +24 -16
  118. tinygrad-0.11.0.dist-info/RECORD +141 -0
  119. {tinygrad-0.10.2.dist-info → tinygrad-0.11.0.dist-info}/WHEEL +1 -1
  120. tinygrad/codegen/kernel.py +0 -693
  121. tinygrad/engine/multi.py +0 -161
  122. tinygrad/ops.py +0 -1003
  123. tinygrad/runtime/ops_cloud.py +0 -220
  124. tinygrad/runtime/support/allocator.py +0 -94
  125. tinygrad/spec.py +0 -155
  126. tinygrad/viz/assets/d3js.org/d3.v5.min.js +0 -2
  127. tinygrad/viz/assets/dagrejs.github.io/project/dagre-d3/latest/dagre-d3.min.js +0 -4816
  128. tinygrad/viz/perfetto.html +0 -178
  129. tinygrad-0.10.2.dist-info/RECORD +0 -99
  130. {tinygrad-0.10.2.dist-info → tinygrad-0.11.0.dist-info/licenses}/LICENSE +0 -0
  131. {tinygrad-0.10.2.dist-info → tinygrad-0.11.0.dist-info}/top_level.txt +0 -0
@@ -1,7 +1,7 @@
1
1
  # mypy: ignore-errors
2
2
  # -*- coding: utf-8 -*-
3
3
  #
4
- # TARGET arch is: []
4
+ # TARGET arch is: ['-D__CUDA_API_VERSION_INTERNAL']
5
5
  # WORD_SIZE is: 8
6
6
  # POINTER_SIZE is: 8
7
7
  # LONGDOUBLE_SIZE is: 16
@@ -166,6 +166,14 @@ class struct_CUfunc_st(Structure):
166
166
  pass
167
167
 
168
168
  CUfunction = ctypes.POINTER(struct_CUfunc_st)
169
+ class struct_CUlib_st(Structure):
170
+ pass
171
+
172
+ CUlibrary = ctypes.POINTER(struct_CUlib_st)
173
+ class struct_CUkern_st(Structure):
174
+ pass
175
+
176
+ CUkernel = ctypes.POINTER(struct_CUkern_st)
169
177
  class struct_CUarray_st(Structure):
170
178
  pass
171
179
 
@@ -303,6 +311,51 @@ CUctx_flags_enum = ctypes.c_uint32 # enum
303
311
  CUctx_flags = CUctx_flags_enum
304
312
  CUctx_flags__enumvalues = CUctx_flags_enum__enumvalues
305
313
 
314
+ # values for enumeration 'CUevent_sched_flags_enum'
315
+ CUevent_sched_flags_enum__enumvalues = {
316
+ 0: 'CU_EVENT_SCHED_AUTO',
317
+ 1: 'CU_EVENT_SCHED_SPIN',
318
+ 2: 'CU_EVENT_SCHED_YIELD',
319
+ 4: 'CU_EVENT_SCHED_BLOCKING_SYNC',
320
+ }
321
+ CU_EVENT_SCHED_AUTO = 0
322
+ CU_EVENT_SCHED_SPIN = 1
323
+ CU_EVENT_SCHED_YIELD = 2
324
+ CU_EVENT_SCHED_BLOCKING_SYNC = 4
325
+ CUevent_sched_flags_enum = ctypes.c_uint32 # enum
326
+ CUevent_sched_flags = CUevent_sched_flags_enum
327
+ CUevent_sched_flags__enumvalues = CUevent_sched_flags_enum__enumvalues
328
+
329
+ # values for enumeration 'cl_event_flags_enum'
330
+ cl_event_flags_enum__enumvalues = {
331
+ 0: 'NVCL_EVENT_SCHED_AUTO',
332
+ 1: 'NVCL_EVENT_SCHED_SPIN',
333
+ 2: 'NVCL_EVENT_SCHED_YIELD',
334
+ 4: 'NVCL_EVENT_SCHED_BLOCKING_SYNC',
335
+ }
336
+ NVCL_EVENT_SCHED_AUTO = 0
337
+ NVCL_EVENT_SCHED_SPIN = 1
338
+ NVCL_EVENT_SCHED_YIELD = 2
339
+ NVCL_EVENT_SCHED_BLOCKING_SYNC = 4
340
+ cl_event_flags_enum = ctypes.c_uint32 # enum
341
+ cl_event_flags = cl_event_flags_enum
342
+ cl_event_flags__enumvalues = cl_event_flags_enum__enumvalues
343
+
344
+ # values for enumeration 'cl_context_flags_enum'
345
+ cl_context_flags_enum__enumvalues = {
346
+ 0: 'NVCL_CTX_SCHED_AUTO',
347
+ 1: 'NVCL_CTX_SCHED_SPIN',
348
+ 2: 'NVCL_CTX_SCHED_YIELD',
349
+ 4: 'NVCL_CTX_SCHED_BLOCKING_SYNC',
350
+ }
351
+ NVCL_CTX_SCHED_AUTO = 0
352
+ NVCL_CTX_SCHED_SPIN = 1
353
+ NVCL_CTX_SCHED_YIELD = 2
354
+ NVCL_CTX_SCHED_BLOCKING_SYNC = 4
355
+ cl_context_flags_enum = ctypes.c_uint32 # enum
356
+ cl_context_flags = cl_context_flags_enum
357
+ cl_context_flags__enumvalues = cl_context_flags_enum__enumvalues
358
+
306
359
  # values for enumeration 'CUstream_flags_enum'
307
360
  CUstream_flags_enum__enumvalues = {
308
361
  0: 'CU_STREAM_DEFAULT',
@@ -385,16 +438,29 @@ CUstreamBatchMemOpType_enum__enumvalues = {
385
438
  2: 'CU_STREAM_MEM_OP_WRITE_VALUE_32',
386
439
  4: 'CU_STREAM_MEM_OP_WAIT_VALUE_64',
387
440
  5: 'CU_STREAM_MEM_OP_WRITE_VALUE_64',
441
+ 6: 'CU_STREAM_MEM_OP_BARRIER',
388
442
  3: 'CU_STREAM_MEM_OP_FLUSH_REMOTE_WRITES',
389
443
  }
390
444
  CU_STREAM_MEM_OP_WAIT_VALUE_32 = 1
391
445
  CU_STREAM_MEM_OP_WRITE_VALUE_32 = 2
392
446
  CU_STREAM_MEM_OP_WAIT_VALUE_64 = 4
393
447
  CU_STREAM_MEM_OP_WRITE_VALUE_64 = 5
448
+ CU_STREAM_MEM_OP_BARRIER = 6
394
449
  CU_STREAM_MEM_OP_FLUSH_REMOTE_WRITES = 3
395
450
  CUstreamBatchMemOpType_enum = ctypes.c_uint32 # enum
396
451
  CUstreamBatchMemOpType = CUstreamBatchMemOpType_enum
397
452
  CUstreamBatchMemOpType__enumvalues = CUstreamBatchMemOpType_enum__enumvalues
453
+
454
+ # values for enumeration 'CUstreamMemoryBarrier_flags_enum'
455
+ CUstreamMemoryBarrier_flags_enum__enumvalues = {
456
+ 0: 'CU_STREAM_MEMORY_BARRIER_TYPE_SYS',
457
+ 1: 'CU_STREAM_MEMORY_BARRIER_TYPE_GPU',
458
+ }
459
+ CU_STREAM_MEMORY_BARRIER_TYPE_SYS = 0
460
+ CU_STREAM_MEMORY_BARRIER_TYPE_GPU = 1
461
+ CUstreamMemoryBarrier_flags_enum = ctypes.c_uint32 # enum
462
+ CUstreamMemoryBarrier_flags = CUstreamMemoryBarrier_flags_enum
463
+ CUstreamMemoryBarrier_flags__enumvalues = CUstreamMemoryBarrier_flags_enum__enumvalues
398
464
  class union_CUstreamBatchMemOpParams_union(Union):
399
465
  pass
400
466
 
@@ -455,17 +521,41 @@ struct_CUstreamMemOpFlushRemoteWritesParams_st._fields_ = [
455
521
  ('flags', ctypes.c_uint32),
456
522
  ]
457
523
 
524
+ class struct_CUstreamMemOpMemoryBarrierParams_st(Structure):
525
+ pass
526
+
527
+ struct_CUstreamMemOpMemoryBarrierParams_st._pack_ = 1 # source:False
528
+ struct_CUstreamMemOpMemoryBarrierParams_st._fields_ = [
529
+ ('operation', CUstreamBatchMemOpType),
530
+ ('flags', ctypes.c_uint32),
531
+ ]
532
+
458
533
  union_CUstreamBatchMemOpParams_union._pack_ = 1 # source:False
459
534
  union_CUstreamBatchMemOpParams_union._fields_ = [
460
535
  ('operation', CUstreamBatchMemOpType),
461
536
  ('waitValue', struct_CUstreamMemOpWaitValueParams_st),
462
537
  ('writeValue', struct_CUstreamMemOpWriteValueParams_st),
463
538
  ('flushRemoteWrites', struct_CUstreamMemOpFlushRemoteWritesParams_st),
539
+ ('memoryBarrier', struct_CUstreamMemOpMemoryBarrierParams_st),
464
540
  ('pad', ctypes.c_uint64 * 6),
465
541
  ]
466
542
 
467
543
  CUstreamBatchMemOpParams_v1 = union_CUstreamBatchMemOpParams_union
468
544
  CUstreamBatchMemOpParams = union_CUstreamBatchMemOpParams_union
545
+ class struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st(Structure):
546
+ pass
547
+
548
+ struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st._pack_ = 1 # source:False
549
+ struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st._fields_ = [
550
+ ('ctx', ctypes.POINTER(struct_CUctx_st)),
551
+ ('count', ctypes.c_uint32),
552
+ ('PADDING_0', ctypes.c_ubyte * 4),
553
+ ('paramArray', ctypes.POINTER(union_CUstreamBatchMemOpParams_union)),
554
+ ('flags', ctypes.c_uint32),
555
+ ('PADDING_1', ctypes.c_ubyte * 4),
556
+ ]
557
+
558
+ CUDA_BATCH_MEM_OP_NODE_PARAMS = struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st
469
559
 
470
560
  # values for enumeration 'CUoccupancy_flags_enum'
471
561
  CUoccupancy_flags_enum__enumvalues = {
@@ -690,9 +780,9 @@ CUdevice_attribute_enum__enumvalues = {
690
780
  89: 'CU_DEVICE_ATTRIBUTE_CONCURRENT_MANAGED_ACCESS',
691
781
  90: 'CU_DEVICE_ATTRIBUTE_COMPUTE_PREEMPTION_SUPPORTED',
692
782
  91: 'CU_DEVICE_ATTRIBUTE_CAN_USE_HOST_POINTER_FOR_REGISTERED_MEM',
693
- 92: 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_MEM_OPS',
694
- 93: 'CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS',
695
- 94: 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR',
783
+ 92: 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_MEM_OPS_V1',
784
+ 93: 'CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS_V1',
785
+ 94: 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR_V1',
696
786
  95: 'CU_DEVICE_ATTRIBUTE_COOPERATIVE_LAUNCH',
697
787
  96: 'CU_DEVICE_ATTRIBUTE_COOPERATIVE_MULTI_DEVICE_LAUNCH',
698
788
  97: 'CU_DEVICE_ATTRIBUTE_MAX_SHARED_MEMORY_PER_BLOCK_OPTIN',
@@ -719,7 +809,16 @@ CUdevice_attribute_enum__enumvalues = {
719
809
  117: 'CU_DEVICE_ATTRIBUTE_GPU_DIRECT_RDMA_FLUSH_WRITES_OPTIONS',
720
810
  118: 'CU_DEVICE_ATTRIBUTE_GPU_DIRECT_RDMA_WRITES_ORDERING',
721
811
  119: 'CU_DEVICE_ATTRIBUTE_MEMPOOL_SUPPORTED_HANDLE_TYPES',
722
- 120: 'CU_DEVICE_ATTRIBUTE_MAX',
812
+ 120: 'CU_DEVICE_ATTRIBUTE_CLUSTER_LAUNCH',
813
+ 121: 'CU_DEVICE_ATTRIBUTE_DEFERRED_MAPPING_CUDA_ARRAY_SUPPORTED',
814
+ 122: 'CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS',
815
+ 123: 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR',
816
+ 124: 'CU_DEVICE_ATTRIBUTE_DMA_BUF_SUPPORTED',
817
+ 125: 'CU_DEVICE_ATTRIBUTE_IPC_EVENT_SUPPORTED',
818
+ 126: 'CU_DEVICE_ATTRIBUTE_MEM_SYNC_DOMAIN_COUNT',
819
+ 127: 'CU_DEVICE_ATTRIBUTE_TENSOR_MAP_ACCESS_SUPPORTED',
820
+ 129: 'CU_DEVICE_ATTRIBUTE_UNIFIED_FUNCTION_POINTERS',
821
+ 130: 'CU_DEVICE_ATTRIBUTE_MAX',
723
822
  }
724
823
  CU_DEVICE_ATTRIBUTE_MAX_THREADS_PER_BLOCK = 1
725
824
  CU_DEVICE_ATTRIBUTE_MAX_BLOCK_DIM_X = 2
@@ -817,9 +916,9 @@ CU_DEVICE_ATTRIBUTE_PAGEABLE_MEMORY_ACCESS = 88
817
916
  CU_DEVICE_ATTRIBUTE_CONCURRENT_MANAGED_ACCESS = 89
818
917
  CU_DEVICE_ATTRIBUTE_COMPUTE_PREEMPTION_SUPPORTED = 90
819
918
  CU_DEVICE_ATTRIBUTE_CAN_USE_HOST_POINTER_FOR_REGISTERED_MEM = 91
820
- CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_MEM_OPS = 92
821
- CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS = 93
822
- CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR = 94
919
+ CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_MEM_OPS_V1 = 92
920
+ CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS_V1 = 93
921
+ CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR_V1 = 94
823
922
  CU_DEVICE_ATTRIBUTE_COOPERATIVE_LAUNCH = 95
824
923
  CU_DEVICE_ATTRIBUTE_COOPERATIVE_MULTI_DEVICE_LAUNCH = 96
825
924
  CU_DEVICE_ATTRIBUTE_MAX_SHARED_MEMORY_PER_BLOCK_OPTIN = 97
@@ -846,7 +945,16 @@ CU_DEVICE_ATTRIBUTE_GPU_DIRECT_RDMA_SUPPORTED = 116
846
945
  CU_DEVICE_ATTRIBUTE_GPU_DIRECT_RDMA_FLUSH_WRITES_OPTIONS = 117
847
946
  CU_DEVICE_ATTRIBUTE_GPU_DIRECT_RDMA_WRITES_ORDERING = 118
848
947
  CU_DEVICE_ATTRIBUTE_MEMPOOL_SUPPORTED_HANDLE_TYPES = 119
849
- CU_DEVICE_ATTRIBUTE_MAX = 120
948
+ CU_DEVICE_ATTRIBUTE_CLUSTER_LAUNCH = 120
949
+ CU_DEVICE_ATTRIBUTE_DEFERRED_MAPPING_CUDA_ARRAY_SUPPORTED = 121
950
+ CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS = 122
951
+ CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR = 123
952
+ CU_DEVICE_ATTRIBUTE_DMA_BUF_SUPPORTED = 124
953
+ CU_DEVICE_ATTRIBUTE_IPC_EVENT_SUPPORTED = 125
954
+ CU_DEVICE_ATTRIBUTE_MEM_SYNC_DOMAIN_COUNT = 126
955
+ CU_DEVICE_ATTRIBUTE_TENSOR_MAP_ACCESS_SUPPORTED = 127
956
+ CU_DEVICE_ATTRIBUTE_UNIFIED_FUNCTION_POINTERS = 129
957
+ CU_DEVICE_ATTRIBUTE_MAX = 130
850
958
  CUdevice_attribute_enum = ctypes.c_uint32 # enum
851
959
  CUdevice_attribute = CUdevice_attribute_enum
852
960
  CUdevice_attribute__enumvalues = CUdevice_attribute_enum__enumvalues
@@ -889,6 +997,9 @@ CUpointer_attribute_enum__enumvalues = {
889
997
  15: 'CU_POINTER_ATTRIBUTE_IS_GPU_DIRECT_RDMA_CAPABLE',
890
998
  16: 'CU_POINTER_ATTRIBUTE_ACCESS_FLAGS',
891
999
  17: 'CU_POINTER_ATTRIBUTE_MEMPOOL_HANDLE',
1000
+ 18: 'CU_POINTER_ATTRIBUTE_MAPPING_SIZE',
1001
+ 19: 'CU_POINTER_ATTRIBUTE_MAPPING_BASE_ADDR',
1002
+ 20: 'CU_POINTER_ATTRIBUTE_MEMORY_BLOCK_ID',
892
1003
  }
893
1004
  CU_POINTER_ATTRIBUTE_CONTEXT = 1
894
1005
  CU_POINTER_ATTRIBUTE_MEMORY_TYPE = 2
@@ -907,6 +1018,9 @@ CU_POINTER_ATTRIBUTE_ALLOWED_HANDLE_TYPES = 14
907
1018
  CU_POINTER_ATTRIBUTE_IS_GPU_DIRECT_RDMA_CAPABLE = 15
908
1019
  CU_POINTER_ATTRIBUTE_ACCESS_FLAGS = 16
909
1020
  CU_POINTER_ATTRIBUTE_MEMPOOL_HANDLE = 17
1021
+ CU_POINTER_ATTRIBUTE_MAPPING_SIZE = 18
1022
+ CU_POINTER_ATTRIBUTE_MAPPING_BASE_ADDR = 19
1023
+ CU_POINTER_ATTRIBUTE_MEMORY_BLOCK_ID = 20
910
1024
  CUpointer_attribute_enum = ctypes.c_uint32 # enum
911
1025
  CUpointer_attribute = CUpointer_attribute_enum
912
1026
  CUpointer_attribute__enumvalues = CUpointer_attribute_enum__enumvalues
@@ -923,7 +1037,13 @@ CUfunction_attribute_enum__enumvalues = {
923
1037
  7: 'CU_FUNC_ATTRIBUTE_CACHE_MODE_CA',
924
1038
  8: 'CU_FUNC_ATTRIBUTE_MAX_DYNAMIC_SHARED_SIZE_BYTES',
925
1039
  9: 'CU_FUNC_ATTRIBUTE_PREFERRED_SHARED_MEMORY_CARVEOUT',
926
- 10: 'CU_FUNC_ATTRIBUTE_MAX',
1040
+ 10: 'CU_FUNC_ATTRIBUTE_CLUSTER_SIZE_MUST_BE_SET',
1041
+ 11: 'CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_WIDTH',
1042
+ 12: 'CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_HEIGHT',
1043
+ 13: 'CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_DEPTH',
1044
+ 14: 'CU_FUNC_ATTRIBUTE_NON_PORTABLE_CLUSTER_SIZE_ALLOWED',
1045
+ 15: 'CU_FUNC_ATTRIBUTE_CLUSTER_SCHEDULING_POLICY_PREFERENCE',
1046
+ 16: 'CU_FUNC_ATTRIBUTE_MAX',
927
1047
  }
928
1048
  CU_FUNC_ATTRIBUTE_MAX_THREADS_PER_BLOCK = 0
929
1049
  CU_FUNC_ATTRIBUTE_SHARED_SIZE_BYTES = 1
@@ -935,7 +1055,13 @@ CU_FUNC_ATTRIBUTE_BINARY_VERSION = 6
935
1055
  CU_FUNC_ATTRIBUTE_CACHE_MODE_CA = 7
936
1056
  CU_FUNC_ATTRIBUTE_MAX_DYNAMIC_SHARED_SIZE_BYTES = 8
937
1057
  CU_FUNC_ATTRIBUTE_PREFERRED_SHARED_MEMORY_CARVEOUT = 9
938
- CU_FUNC_ATTRIBUTE_MAX = 10
1058
+ CU_FUNC_ATTRIBUTE_CLUSTER_SIZE_MUST_BE_SET = 10
1059
+ CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_WIDTH = 11
1060
+ CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_HEIGHT = 12
1061
+ CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_DEPTH = 13
1062
+ CU_FUNC_ATTRIBUTE_NON_PORTABLE_CLUSTER_SIZE_ALLOWED = 14
1063
+ CU_FUNC_ATTRIBUTE_CLUSTER_SCHEDULING_POLICY_PREFERENCE = 15
1064
+ CU_FUNC_ATTRIBUTE_MAX = 16
939
1065
  CUfunction_attribute_enum = ctypes.c_uint32 # enum
940
1066
  CUfunction_attribute = CUfunction_attribute_enum
941
1067
  CUfunction_attribute__enumvalues = CUfunction_attribute_enum__enumvalues
@@ -1070,7 +1196,13 @@ CUjit_option_enum__enumvalues = {
1070
1196
  22: 'CU_JIT_PREC_DIV',
1071
1197
  23: 'CU_JIT_PREC_SQRT',
1072
1198
  24: 'CU_JIT_FMA',
1073
- 25: 'CU_JIT_NUM_OPTIONS',
1199
+ 25: 'CU_JIT_REFERENCED_KERNEL_NAMES',
1200
+ 26: 'CU_JIT_REFERENCED_KERNEL_COUNT',
1201
+ 27: 'CU_JIT_REFERENCED_VARIABLE_NAMES',
1202
+ 28: 'CU_JIT_REFERENCED_VARIABLE_COUNT',
1203
+ 29: 'CU_JIT_OPTIMIZE_UNUSED_DEVICE_VARIABLES',
1204
+ 30: 'CU_JIT_POSITION_INDEPENDENT_CODE',
1205
+ 31: 'CU_JIT_NUM_OPTIONS',
1074
1206
  }
1075
1207
  CU_JIT_MAX_REGISTERS = 0
1076
1208
  CU_JIT_THREADS_PER_BLOCK = 1
@@ -1097,15 +1229,19 @@ CU_JIT_FTZ = 21
1097
1229
  CU_JIT_PREC_DIV = 22
1098
1230
  CU_JIT_PREC_SQRT = 23
1099
1231
  CU_JIT_FMA = 24
1100
- CU_JIT_NUM_OPTIONS = 25
1232
+ CU_JIT_REFERENCED_KERNEL_NAMES = 25
1233
+ CU_JIT_REFERENCED_KERNEL_COUNT = 26
1234
+ CU_JIT_REFERENCED_VARIABLE_NAMES = 27
1235
+ CU_JIT_REFERENCED_VARIABLE_COUNT = 28
1236
+ CU_JIT_OPTIMIZE_UNUSED_DEVICE_VARIABLES = 29
1237
+ CU_JIT_POSITION_INDEPENDENT_CODE = 30
1238
+ CU_JIT_NUM_OPTIONS = 31
1101
1239
  CUjit_option_enum = ctypes.c_uint32 # enum
1102
1240
  CUjit_option = CUjit_option_enum
1103
1241
  CUjit_option__enumvalues = CUjit_option_enum__enumvalues
1104
1242
 
1105
1243
  # values for enumeration 'CUjit_target_enum'
1106
1244
  CUjit_target_enum__enumvalues = {
1107
- 20: 'CU_TARGET_COMPUTE_20',
1108
- 21: 'CU_TARGET_COMPUTE_21',
1109
1245
  30: 'CU_TARGET_COMPUTE_30',
1110
1246
  32: 'CU_TARGET_COMPUTE_32',
1111
1247
  35: 'CU_TARGET_COMPUTE_35',
@@ -1121,9 +1257,11 @@ CUjit_target_enum__enumvalues = {
1121
1257
  75: 'CU_TARGET_COMPUTE_75',
1122
1258
  80: 'CU_TARGET_COMPUTE_80',
1123
1259
  86: 'CU_TARGET_COMPUTE_86',
1260
+ 87: 'CU_TARGET_COMPUTE_87',
1261
+ 89: 'CU_TARGET_COMPUTE_89',
1262
+ 90: 'CU_TARGET_COMPUTE_90',
1263
+ 65626: 'CU_TARGET_COMPUTE_90A',
1124
1264
  }
1125
- CU_TARGET_COMPUTE_20 = 20
1126
- CU_TARGET_COMPUTE_21 = 21
1127
1265
  CU_TARGET_COMPUTE_30 = 30
1128
1266
  CU_TARGET_COMPUTE_32 = 32
1129
1267
  CU_TARGET_COMPUTE_35 = 35
@@ -1139,6 +1277,10 @@ CU_TARGET_COMPUTE_72 = 72
1139
1277
  CU_TARGET_COMPUTE_75 = 75
1140
1278
  CU_TARGET_COMPUTE_80 = 80
1141
1279
  CU_TARGET_COMPUTE_86 = 86
1280
+ CU_TARGET_COMPUTE_87 = 87
1281
+ CU_TARGET_COMPUTE_89 = 89
1282
+ CU_TARGET_COMPUTE_90 = 90
1283
+ CU_TARGET_COMPUTE_90A = 65626
1142
1284
  CUjit_target_enum = ctypes.c_uint32 # enum
1143
1285
  CUjit_target = CUjit_target_enum
1144
1286
  CUjit_target__enumvalues = CUjit_target_enum__enumvalues
@@ -1326,7 +1468,28 @@ struct_CUDA_KERNEL_NODE_PARAMS_st._fields_ = [
1326
1468
  ]
1327
1469
 
1328
1470
  CUDA_KERNEL_NODE_PARAMS_v1 = struct_CUDA_KERNEL_NODE_PARAMS_st
1329
- CUDA_KERNEL_NODE_PARAMS = struct_CUDA_KERNEL_NODE_PARAMS_st
1471
+ class struct_CUDA_KERNEL_NODE_PARAMS_v2_st(Structure):
1472
+ pass
1473
+
1474
+ struct_CUDA_KERNEL_NODE_PARAMS_v2_st._pack_ = 1 # source:False
1475
+ struct_CUDA_KERNEL_NODE_PARAMS_v2_st._fields_ = [
1476
+ ('func', ctypes.POINTER(struct_CUfunc_st)),
1477
+ ('gridDimX', ctypes.c_uint32),
1478
+ ('gridDimY', ctypes.c_uint32),
1479
+ ('gridDimZ', ctypes.c_uint32),
1480
+ ('blockDimX', ctypes.c_uint32),
1481
+ ('blockDimY', ctypes.c_uint32),
1482
+ ('blockDimZ', ctypes.c_uint32),
1483
+ ('sharedMemBytes', ctypes.c_uint32),
1484
+ ('PADDING_0', ctypes.c_ubyte * 4),
1485
+ ('kernelParams', ctypes.POINTER(ctypes.POINTER(None))),
1486
+ ('extra', ctypes.POINTER(ctypes.POINTER(None))),
1487
+ ('kern', ctypes.POINTER(struct_CUkern_st)),
1488
+ ('ctx', ctypes.POINTER(struct_CUctx_st)),
1489
+ ]
1490
+
1491
+ CUDA_KERNEL_NODE_PARAMS_v2 = struct_CUDA_KERNEL_NODE_PARAMS_v2_st
1492
+ CUDA_KERNEL_NODE_PARAMS = struct_CUDA_KERNEL_NODE_PARAMS_v2_st
1330
1493
  class struct_CUDA_MEMSET_NODE_PARAMS_st(Structure):
1331
1494
  pass
1332
1495
 
@@ -1368,6 +1531,7 @@ CUgraphNodeType_enum__enumvalues = {
1368
1531
  9: 'CU_GRAPH_NODE_TYPE_EXT_SEMAS_WAIT',
1369
1532
  10: 'CU_GRAPH_NODE_TYPE_MEM_ALLOC',
1370
1533
  11: 'CU_GRAPH_NODE_TYPE_MEM_FREE',
1534
+ 12: 'CU_GRAPH_NODE_TYPE_BATCH_MEM_OP',
1371
1535
  }
1372
1536
  CU_GRAPH_NODE_TYPE_KERNEL = 0
1373
1537
  CU_GRAPH_NODE_TYPE_MEMCPY = 1
@@ -1381,10 +1545,41 @@ CU_GRAPH_NODE_TYPE_EXT_SEMAS_SIGNAL = 8
1381
1545
  CU_GRAPH_NODE_TYPE_EXT_SEMAS_WAIT = 9
1382
1546
  CU_GRAPH_NODE_TYPE_MEM_ALLOC = 10
1383
1547
  CU_GRAPH_NODE_TYPE_MEM_FREE = 11
1548
+ CU_GRAPH_NODE_TYPE_BATCH_MEM_OP = 12
1384
1549
  CUgraphNodeType_enum = ctypes.c_uint32 # enum
1385
1550
  CUgraphNodeType = CUgraphNodeType_enum
1386
1551
  CUgraphNodeType__enumvalues = CUgraphNodeType_enum__enumvalues
1387
1552
 
1553
+ # values for enumeration 'CUgraphInstantiateResult_enum'
1554
+ CUgraphInstantiateResult_enum__enumvalues = {
1555
+ 0: 'CUDA_GRAPH_INSTANTIATE_SUCCESS',
1556
+ 1: 'CUDA_GRAPH_INSTANTIATE_ERROR',
1557
+ 2: 'CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE',
1558
+ 3: 'CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED',
1559
+ 4: 'CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED',
1560
+ }
1561
+ CUDA_GRAPH_INSTANTIATE_SUCCESS = 0
1562
+ CUDA_GRAPH_INSTANTIATE_ERROR = 1
1563
+ CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE = 2
1564
+ CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED = 3
1565
+ CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED = 4
1566
+ CUgraphInstantiateResult_enum = ctypes.c_uint32 # enum
1567
+ CUgraphInstantiateResult = CUgraphInstantiateResult_enum
1568
+ CUgraphInstantiateResult__enumvalues = CUgraphInstantiateResult_enum__enumvalues
1569
+ class struct_CUDA_GRAPH_INSTANTIATE_PARAMS_st(Structure):
1570
+ pass
1571
+
1572
+ struct_CUDA_GRAPH_INSTANTIATE_PARAMS_st._pack_ = 1 # source:False
1573
+ struct_CUDA_GRAPH_INSTANTIATE_PARAMS_st._fields_ = [
1574
+ ('flags', ctypes.c_uint64),
1575
+ ('hUploadStream', ctypes.POINTER(struct_CUstream_st)),
1576
+ ('hErrNode_out', ctypes.POINTER(struct_CUgraphNode_st)),
1577
+ ('result_out', CUgraphInstantiateResult),
1578
+ ('PADDING_0', ctypes.c_ubyte * 4),
1579
+ ]
1580
+
1581
+ CUDA_GRAPH_INSTANTIATE_PARAMS = struct_CUDA_GRAPH_INSTANTIATE_PARAMS_st
1582
+
1388
1583
  # values for enumeration 'CUsynchronizationPolicy_enum'
1389
1584
  CUsynchronizationPolicy_enum__enumvalues = {
1390
1585
  1: 'CU_SYNC_POLICY_AUTO',
@@ -1400,28 +1595,143 @@ CUsynchronizationPolicy_enum = ctypes.c_uint32 # enum
1400
1595
  CUsynchronizationPolicy = CUsynchronizationPolicy_enum
1401
1596
  CUsynchronizationPolicy__enumvalues = CUsynchronizationPolicy_enum__enumvalues
1402
1597
 
1403
- # values for enumeration 'CUkernelNodeAttrID_enum'
1404
- CUkernelNodeAttrID_enum__enumvalues = {
1405
- 1: 'CU_KERNEL_NODE_ATTRIBUTE_ACCESS_POLICY_WINDOW',
1406
- 2: 'CU_KERNEL_NODE_ATTRIBUTE_COOPERATIVE',
1598
+ # values for enumeration 'CUclusterSchedulingPolicy_enum'
1599
+ CUclusterSchedulingPolicy_enum__enumvalues = {
1600
+ 0: 'CU_CLUSTER_SCHEDULING_POLICY_DEFAULT',
1601
+ 1: 'CU_CLUSTER_SCHEDULING_POLICY_SPREAD',
1602
+ 2: 'CU_CLUSTER_SCHEDULING_POLICY_LOAD_BALANCING',
1603
+ }
1604
+ CU_CLUSTER_SCHEDULING_POLICY_DEFAULT = 0
1605
+ CU_CLUSTER_SCHEDULING_POLICY_SPREAD = 1
1606
+ CU_CLUSTER_SCHEDULING_POLICY_LOAD_BALANCING = 2
1607
+ CUclusterSchedulingPolicy_enum = ctypes.c_uint32 # enum
1608
+ CUclusterSchedulingPolicy = CUclusterSchedulingPolicy_enum
1609
+ CUclusterSchedulingPolicy__enumvalues = CUclusterSchedulingPolicy_enum__enumvalues
1610
+
1611
+ # values for enumeration 'CUlaunchMemSyncDomain_enum'
1612
+ CUlaunchMemSyncDomain_enum__enumvalues = {
1613
+ 0: 'CU_LAUNCH_MEM_SYNC_DOMAIN_DEFAULT',
1614
+ 1: 'CU_LAUNCH_MEM_SYNC_DOMAIN_REMOTE',
1615
+ }
1616
+ CU_LAUNCH_MEM_SYNC_DOMAIN_DEFAULT = 0
1617
+ CU_LAUNCH_MEM_SYNC_DOMAIN_REMOTE = 1
1618
+ CUlaunchMemSyncDomain_enum = ctypes.c_uint32 # enum
1619
+ CUlaunchMemSyncDomain = CUlaunchMemSyncDomain_enum
1620
+ CUlaunchMemSyncDomain__enumvalues = CUlaunchMemSyncDomain_enum__enumvalues
1621
+ class struct_CUlaunchMemSyncDomainMap_st(Structure):
1622
+ pass
1623
+
1624
+ struct_CUlaunchMemSyncDomainMap_st._pack_ = 1 # source:False
1625
+ struct_CUlaunchMemSyncDomainMap_st._fields_ = [
1626
+ ('default_', ctypes.c_ubyte),
1627
+ ('remote', ctypes.c_ubyte),
1628
+ ]
1629
+
1630
+ CUlaunchMemSyncDomainMap = struct_CUlaunchMemSyncDomainMap_st
1631
+
1632
+ # values for enumeration 'CUlaunchAttributeID_enum'
1633
+ CUlaunchAttributeID_enum__enumvalues = {
1634
+ 0: 'CU_LAUNCH_ATTRIBUTE_IGNORE',
1635
+ 1: 'CU_LAUNCH_ATTRIBUTE_ACCESS_POLICY_WINDOW',
1636
+ 2: 'CU_LAUNCH_ATTRIBUTE_COOPERATIVE',
1637
+ 3: 'CU_LAUNCH_ATTRIBUTE_SYNCHRONIZATION_POLICY',
1638
+ 4: 'CU_LAUNCH_ATTRIBUTE_CLUSTER_DIMENSION',
1639
+ 5: 'CU_LAUNCH_ATTRIBUTE_CLUSTER_SCHEDULING_POLICY_PREFERENCE',
1640
+ 6: 'CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_STREAM_SERIALIZATION',
1641
+ 7: 'CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_EVENT',
1642
+ 8: 'CU_LAUNCH_ATTRIBUTE_PRIORITY',
1643
+ 9: 'CU_LAUNCH_ATTRIBUTE_MEM_SYNC_DOMAIN_MAP',
1644
+ 10: 'CU_LAUNCH_ATTRIBUTE_MEM_SYNC_DOMAIN',
1407
1645
  }
1408
- CU_KERNEL_NODE_ATTRIBUTE_ACCESS_POLICY_WINDOW = 1
1409
- CU_KERNEL_NODE_ATTRIBUTE_COOPERATIVE = 2
1410
- CUkernelNodeAttrID_enum = ctypes.c_uint32 # enum
1411
- CUkernelNodeAttrID = CUkernelNodeAttrID_enum
1412
- CUkernelNodeAttrID__enumvalues = CUkernelNodeAttrID_enum__enumvalues
1413
- class union_CUkernelNodeAttrValue_union(Union):
1646
+ CU_LAUNCH_ATTRIBUTE_IGNORE = 0
1647
+ CU_LAUNCH_ATTRIBUTE_ACCESS_POLICY_WINDOW = 1
1648
+ CU_LAUNCH_ATTRIBUTE_COOPERATIVE = 2
1649
+ CU_LAUNCH_ATTRIBUTE_SYNCHRONIZATION_POLICY = 3
1650
+ CU_LAUNCH_ATTRIBUTE_CLUSTER_DIMENSION = 4
1651
+ CU_LAUNCH_ATTRIBUTE_CLUSTER_SCHEDULING_POLICY_PREFERENCE = 5
1652
+ CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_STREAM_SERIALIZATION = 6
1653
+ CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_EVENT = 7
1654
+ CU_LAUNCH_ATTRIBUTE_PRIORITY = 8
1655
+ CU_LAUNCH_ATTRIBUTE_MEM_SYNC_DOMAIN_MAP = 9
1656
+ CU_LAUNCH_ATTRIBUTE_MEM_SYNC_DOMAIN = 10
1657
+ CUlaunchAttributeID_enum = ctypes.c_uint32 # enum
1658
+ CUlaunchAttributeID = CUlaunchAttributeID_enum
1659
+ CUlaunchAttributeID__enumvalues = CUlaunchAttributeID_enum__enumvalues
1660
+ class union_CUlaunchAttributeValue_union(Union):
1661
+ pass
1662
+
1663
+ class struct_CUlaunchAttributeValue_union_clusterDim(Structure):
1664
+ pass
1665
+
1666
+ struct_CUlaunchAttributeValue_union_clusterDim._pack_ = 1 # source:False
1667
+ struct_CUlaunchAttributeValue_union_clusterDim._fields_ = [
1668
+ ('x', ctypes.c_uint32),
1669
+ ('y', ctypes.c_uint32),
1670
+ ('z', ctypes.c_uint32),
1671
+ ]
1672
+
1673
+ class struct_CUlaunchAttributeValue_union_programmaticEvent(Structure):
1414
1674
  pass
1415
1675
 
1416
- union_CUkernelNodeAttrValue_union._pack_ = 1 # source:False
1417
- union_CUkernelNodeAttrValue_union._fields_ = [
1676
+ struct_CUlaunchAttributeValue_union_programmaticEvent._pack_ = 1 # source:False
1677
+ struct_CUlaunchAttributeValue_union_programmaticEvent._fields_ = [
1678
+ ('event', ctypes.POINTER(struct_CUevent_st)),
1679
+ ('flags', ctypes.c_int32),
1680
+ ('triggerAtBlockStart', ctypes.c_int32),
1681
+ ]
1682
+
1683
+ union_CUlaunchAttributeValue_union._pack_ = 1 # source:False
1684
+ union_CUlaunchAttributeValue_union._fields_ = [
1685
+ ('pad', ctypes.c_char * 64),
1418
1686
  ('accessPolicyWindow', CUaccessPolicyWindow),
1419
1687
  ('cooperative', ctypes.c_int32),
1420
- ('PADDING_0', ctypes.c_ubyte * 28),
1688
+ ('syncPolicy', CUsynchronizationPolicy),
1689
+ ('clusterDim', struct_CUlaunchAttributeValue_union_clusterDim),
1690
+ ('clusterSchedulingPolicyPreference', CUclusterSchedulingPolicy),
1691
+ ('programmaticStreamSerializationAllowed', ctypes.c_int32),
1692
+ ('programmaticEvent', struct_CUlaunchAttributeValue_union_programmaticEvent),
1693
+ ('priority', ctypes.c_int32),
1694
+ ('memSyncDomainMap', CUlaunchMemSyncDomainMap),
1695
+ ('memSyncDomain', CUlaunchMemSyncDomain),
1696
+ ('PADDING_0', ctypes.c_ubyte * 60),
1697
+ ]
1698
+
1699
+ CUlaunchAttributeValue = union_CUlaunchAttributeValue_union
1700
+ class struct_CUlaunchAttribute_st(Structure):
1701
+ pass
1702
+
1703
+ struct_CUlaunchAttribute_st._pack_ = 1 # source:False
1704
+ struct_CUlaunchAttribute_st._fields_ = [
1705
+ ('id', CUlaunchAttributeID),
1706
+ ('pad', ctypes.c_char * 4),
1707
+ ('value', CUlaunchAttributeValue),
1708
+ ]
1709
+
1710
+ CUlaunchAttribute = struct_CUlaunchAttribute_st
1711
+ class struct_CUlaunchConfig_st(Structure):
1712
+ pass
1713
+
1714
+ struct_CUlaunchConfig_st._pack_ = 1 # source:False
1715
+ struct_CUlaunchConfig_st._fields_ = [
1716
+ ('gridDimX', ctypes.c_uint32),
1717
+ ('gridDimY', ctypes.c_uint32),
1718
+ ('gridDimZ', ctypes.c_uint32),
1719
+ ('blockDimX', ctypes.c_uint32),
1720
+ ('blockDimY', ctypes.c_uint32),
1721
+ ('blockDimZ', ctypes.c_uint32),
1722
+ ('sharedMemBytes', ctypes.c_uint32),
1723
+ ('PADDING_0', ctypes.c_ubyte * 4),
1724
+ ('hStream', ctypes.POINTER(struct_CUstream_st)),
1725
+ ('attrs', ctypes.POINTER(struct_CUlaunchAttribute_st)),
1726
+ ('numAttrs', ctypes.c_uint32),
1727
+ ('PADDING_1', ctypes.c_ubyte * 4),
1421
1728
  ]
1422
1729
 
1423
- CUkernelNodeAttrValue_v1 = union_CUkernelNodeAttrValue_union
1424
- CUkernelNodeAttrValue = union_CUkernelNodeAttrValue_union
1730
+ CUlaunchConfig = struct_CUlaunchConfig_st
1731
+ CUkernelNodeAttrID = CUlaunchAttributeID_enum
1732
+ CUkernelNodeAttrID__enumvalues = CUlaunchAttributeID_enum__enumvalues
1733
+ CUkernelNodeAttrValue_v1 = union_CUlaunchAttributeValue_union
1734
+ CUkernelNodeAttrValue = union_CUlaunchAttributeValue_union
1425
1735
 
1426
1736
  # values for enumeration 'CUstreamCaptureStatus_enum'
1427
1737
  CUstreamCaptureStatus_enum__enumvalues = {
@@ -1448,29 +1758,10 @@ CU_STREAM_CAPTURE_MODE_RELAXED = 2
1448
1758
  CUstreamCaptureMode_enum = ctypes.c_uint32 # enum
1449
1759
  CUstreamCaptureMode = CUstreamCaptureMode_enum
1450
1760
  CUstreamCaptureMode__enumvalues = CUstreamCaptureMode_enum__enumvalues
1451
-
1452
- # values for enumeration 'CUstreamAttrID_enum'
1453
- CUstreamAttrID_enum__enumvalues = {
1454
- 1: 'CU_STREAM_ATTRIBUTE_ACCESS_POLICY_WINDOW',
1455
- 3: 'CU_STREAM_ATTRIBUTE_SYNCHRONIZATION_POLICY',
1456
- }
1457
- CU_STREAM_ATTRIBUTE_ACCESS_POLICY_WINDOW = 1
1458
- CU_STREAM_ATTRIBUTE_SYNCHRONIZATION_POLICY = 3
1459
- CUstreamAttrID_enum = ctypes.c_uint32 # enum
1460
- CUstreamAttrID = CUstreamAttrID_enum
1461
- CUstreamAttrID__enumvalues = CUstreamAttrID_enum__enumvalues
1462
- class union_CUstreamAttrValue_union(Union):
1463
- pass
1464
-
1465
- union_CUstreamAttrValue_union._pack_ = 1 # source:False
1466
- union_CUstreamAttrValue_union._fields_ = [
1467
- ('accessPolicyWindow', CUaccessPolicyWindow),
1468
- ('syncPolicy', CUsynchronizationPolicy),
1469
- ('PADDING_0', ctypes.c_ubyte * 28),
1470
- ]
1471
-
1472
- CUstreamAttrValue_v1 = union_CUstreamAttrValue_union
1473
- CUstreamAttrValue = union_CUstreamAttrValue_union
1761
+ CUstreamAttrID = CUlaunchAttributeID_enum
1762
+ CUstreamAttrID__enumvalues = CUlaunchAttributeID_enum__enumvalues
1763
+ CUstreamAttrValue_v1 = union_CUlaunchAttributeValue_union
1764
+ CUstreamAttrValue = union_CUlaunchAttributeValue_union
1474
1765
 
1475
1766
  # values for enumeration 'CUdriverProcAddress_flags_enum'
1476
1767
  CUdriverProcAddress_flags_enum__enumvalues = {
@@ -1485,6 +1776,19 @@ CUdriverProcAddress_flags_enum = ctypes.c_uint32 # enum
1485
1776
  CUdriverProcAddress_flags = CUdriverProcAddress_flags_enum
1486
1777
  CUdriverProcAddress_flags__enumvalues = CUdriverProcAddress_flags_enum__enumvalues
1487
1778
 
1779
+ # values for enumeration 'CUdriverProcAddressQueryResult_enum'
1780
+ CUdriverProcAddressQueryResult_enum__enumvalues = {
1781
+ 0: 'CU_GET_PROC_ADDRESS_SUCCESS',
1782
+ 1: 'CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND',
1783
+ 2: 'CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT',
1784
+ }
1785
+ CU_GET_PROC_ADDRESS_SUCCESS = 0
1786
+ CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND = 1
1787
+ CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT = 2
1788
+ CUdriverProcAddressQueryResult_enum = ctypes.c_uint32 # enum
1789
+ CUdriverProcAddressQueryResult = CUdriverProcAddressQueryResult_enum
1790
+ CUdriverProcAddressQueryResult__enumvalues = CUdriverProcAddressQueryResult_enum__enumvalues
1791
+
1488
1792
  # values for enumeration 'CUexecAffinityType_enum'
1489
1793
  CUexecAffinityType_enum__enumvalues = {
1490
1794
  0: 'CU_EXEC_AFFINITY_TYPE_SM_COUNT',
@@ -1523,6 +1827,31 @@ struct_CUexecAffinityParam_st._fields_ = [
1523
1827
  CUexecAffinityParam_v1 = struct_CUexecAffinityParam_st
1524
1828
  CUexecAffinityParam = struct_CUexecAffinityParam_st
1525
1829
 
1830
+ # values for enumeration 'CUlibraryOption_enum'
1831
+ CUlibraryOption_enum__enumvalues = {
1832
+ 0: 'CU_LIBRARY_HOST_UNIVERSAL_FUNCTION_AND_DATA_TABLE',
1833
+ 1: 'CU_LIBRARY_BINARY_IS_PRESERVED',
1834
+ 2: 'CU_LIBRARY_NUM_OPTIONS',
1835
+ }
1836
+ CU_LIBRARY_HOST_UNIVERSAL_FUNCTION_AND_DATA_TABLE = 0
1837
+ CU_LIBRARY_BINARY_IS_PRESERVED = 1
1838
+ CU_LIBRARY_NUM_OPTIONS = 2
1839
+ CUlibraryOption_enum = ctypes.c_uint32 # enum
1840
+ CUlibraryOption = CUlibraryOption_enum
1841
+ CUlibraryOption__enumvalues = CUlibraryOption_enum__enumvalues
1842
+ class struct_CUlibraryHostUniversalFunctionAndDataTable_st(Structure):
1843
+ pass
1844
+
1845
+ struct_CUlibraryHostUniversalFunctionAndDataTable_st._pack_ = 1 # source:False
1846
+ struct_CUlibraryHostUniversalFunctionAndDataTable_st._fields_ = [
1847
+ ('functionTable', ctypes.POINTER(None)),
1848
+ ('functionWindowSize', ctypes.c_uint64),
1849
+ ('dataTable', ctypes.POINTER(None)),
1850
+ ('dataWindowSize', ctypes.c_uint64),
1851
+ ]
1852
+
1853
+ CUlibraryHostUniversalFunctionAndDataTable = struct_CUlibraryHostUniversalFunctionAndDataTable_st
1854
+
1526
1855
  # values for enumeration 'cudaError_enum'
1527
1856
  cudaError_enum__enumvalues = {
1528
1857
  0: 'CUDA_SUCCESS',
@@ -1535,6 +1864,7 @@ cudaError_enum__enumvalues = {
1535
1864
  7: 'CUDA_ERROR_PROFILER_ALREADY_STARTED',
1536
1865
  8: 'CUDA_ERROR_PROFILER_ALREADY_STOPPED',
1537
1866
  34: 'CUDA_ERROR_STUB_LIBRARY',
1867
+ 46: 'CUDA_ERROR_DEVICE_UNAVAILABLE',
1538
1868
  100: 'CUDA_ERROR_NO_DEVICE',
1539
1869
  101: 'CUDA_ERROR_INVALID_DEVICE',
1540
1870
  102: 'CUDA_ERROR_DEVICE_NOT_LICENSED',
@@ -1599,6 +1929,9 @@ cudaError_enum__enumvalues = {
1599
1929
  807: 'CUDA_ERROR_MPS_SERVER_NOT_READY',
1600
1930
  808: 'CUDA_ERROR_MPS_MAX_CLIENTS_REACHED',
1601
1931
  809: 'CUDA_ERROR_MPS_MAX_CONNECTIONS_REACHED',
1932
+ 810: 'CUDA_ERROR_MPS_CLIENT_TERMINATED',
1933
+ 811: 'CUDA_ERROR_CDP_NOT_SUPPORTED',
1934
+ 812: 'CUDA_ERROR_CDP_VERSION_MISMATCH',
1602
1935
  900: 'CUDA_ERROR_STREAM_CAPTURE_UNSUPPORTED',
1603
1936
  901: 'CUDA_ERROR_STREAM_CAPTURE_INVALIDATED',
1604
1937
  902: 'CUDA_ERROR_STREAM_CAPTURE_MERGE',
@@ -1611,6 +1944,7 @@ cudaError_enum__enumvalues = {
1611
1944
  909: 'CUDA_ERROR_TIMEOUT',
1612
1945
  910: 'CUDA_ERROR_GRAPH_EXEC_UPDATE_FAILURE',
1613
1946
  911: 'CUDA_ERROR_EXTERNAL_DEVICE',
1947
+ 912: 'CUDA_ERROR_INVALID_CLUSTER_SIZE',
1614
1948
  999: 'CUDA_ERROR_UNKNOWN',
1615
1949
  }
1616
1950
  CUDA_SUCCESS = 0
@@ -1623,6 +1957,7 @@ CUDA_ERROR_PROFILER_NOT_INITIALIZED = 6
1623
1957
  CUDA_ERROR_PROFILER_ALREADY_STARTED = 7
1624
1958
  CUDA_ERROR_PROFILER_ALREADY_STOPPED = 8
1625
1959
  CUDA_ERROR_STUB_LIBRARY = 34
1960
+ CUDA_ERROR_DEVICE_UNAVAILABLE = 46
1626
1961
  CUDA_ERROR_NO_DEVICE = 100
1627
1962
  CUDA_ERROR_INVALID_DEVICE = 101
1628
1963
  CUDA_ERROR_DEVICE_NOT_LICENSED = 102
@@ -1687,6 +2022,9 @@ CUDA_ERROR_MPS_RPC_FAILURE = 806
1687
2022
  CUDA_ERROR_MPS_SERVER_NOT_READY = 807
1688
2023
  CUDA_ERROR_MPS_MAX_CLIENTS_REACHED = 808
1689
2024
  CUDA_ERROR_MPS_MAX_CONNECTIONS_REACHED = 809
2025
+ CUDA_ERROR_MPS_CLIENT_TERMINATED = 810
2026
+ CUDA_ERROR_CDP_NOT_SUPPORTED = 811
2027
+ CUDA_ERROR_CDP_VERSION_MISMATCH = 812
1690
2028
  CUDA_ERROR_STREAM_CAPTURE_UNSUPPORTED = 900
1691
2029
  CUDA_ERROR_STREAM_CAPTURE_INVALIDATED = 901
1692
2030
  CUDA_ERROR_STREAM_CAPTURE_MERGE = 902
@@ -1699,6 +2037,7 @@ CUDA_ERROR_STREAM_CAPTURE_WRONG_THREAD = 908
1699
2037
  CUDA_ERROR_TIMEOUT = 909
1700
2038
  CUDA_ERROR_GRAPH_EXEC_UPDATE_FAILURE = 910
1701
2039
  CUDA_ERROR_EXTERNAL_DEVICE = 911
2040
+ CUDA_ERROR_INVALID_CLUSTER_SIZE = 912
1702
2041
  CUDA_ERROR_UNKNOWN = 999
1703
2042
  cudaError_enum = ctypes.c_uint32 # enum
1704
2043
  CUresult = cudaError_enum
@@ -1875,6 +2214,18 @@ struct_CUDA_ARRAY_SPARSE_PROPERTIES_st._fields_ = [
1875
2214
 
1876
2215
  CUDA_ARRAY_SPARSE_PROPERTIES_v1 = struct_CUDA_ARRAY_SPARSE_PROPERTIES_st
1877
2216
  CUDA_ARRAY_SPARSE_PROPERTIES = struct_CUDA_ARRAY_SPARSE_PROPERTIES_st
2217
+ class struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st(Structure):
2218
+ pass
2219
+
2220
+ struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st._pack_ = 1 # source:False
2221
+ struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st._fields_ = [
2222
+ ('size', ctypes.c_uint64),
2223
+ ('alignment', ctypes.c_uint64),
2224
+ ('reserved', ctypes.c_uint32 * 4),
2225
+ ]
2226
+
2227
+ CUDA_ARRAY_MEMORY_REQUIREMENTS_v1 = struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st
2228
+ CUDA_ARRAY_MEMORY_REQUIREMENTS = struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st
1878
2229
  class struct_CUDA_RESOURCE_DESC_st(Structure):
1879
2230
  pass
1880
2231
 
@@ -2064,6 +2415,102 @@ struct_CUDA_RESOURCE_VIEW_DESC_st._fields_ = [
2064
2415
 
2065
2416
  CUDA_RESOURCE_VIEW_DESC_v1 = struct_CUDA_RESOURCE_VIEW_DESC_st
2066
2417
  CUDA_RESOURCE_VIEW_DESC = struct_CUDA_RESOURCE_VIEW_DESC_st
2418
+ class struct_CUtensorMap_st(Structure):
2419
+ pass
2420
+
2421
+ struct_CUtensorMap_st._pack_ = 1 # source:False
2422
+ struct_CUtensorMap_st._fields_ = [
2423
+ ('opaque', ctypes.c_uint64 * 16),
2424
+ ]
2425
+
2426
+ CUtensorMap = struct_CUtensorMap_st
2427
+
2428
+ # values for enumeration 'CUtensorMapDataType_enum'
2429
+ CUtensorMapDataType_enum__enumvalues = {
2430
+ 0: 'CU_TENSOR_MAP_DATA_TYPE_UINT8',
2431
+ 1: 'CU_TENSOR_MAP_DATA_TYPE_UINT16',
2432
+ 2: 'CU_TENSOR_MAP_DATA_TYPE_UINT32',
2433
+ 3: 'CU_TENSOR_MAP_DATA_TYPE_INT32',
2434
+ 4: 'CU_TENSOR_MAP_DATA_TYPE_UINT64',
2435
+ 5: 'CU_TENSOR_MAP_DATA_TYPE_INT64',
2436
+ 6: 'CU_TENSOR_MAP_DATA_TYPE_FLOAT16',
2437
+ 7: 'CU_TENSOR_MAP_DATA_TYPE_FLOAT32',
2438
+ 8: 'CU_TENSOR_MAP_DATA_TYPE_FLOAT64',
2439
+ 9: 'CU_TENSOR_MAP_DATA_TYPE_BFLOAT16',
2440
+ 10: 'CU_TENSOR_MAP_DATA_TYPE_FLOAT32_FTZ',
2441
+ 11: 'CU_TENSOR_MAP_DATA_TYPE_TFLOAT32',
2442
+ 12: 'CU_TENSOR_MAP_DATA_TYPE_TFLOAT32_FTZ',
2443
+ }
2444
+ CU_TENSOR_MAP_DATA_TYPE_UINT8 = 0
2445
+ CU_TENSOR_MAP_DATA_TYPE_UINT16 = 1
2446
+ CU_TENSOR_MAP_DATA_TYPE_UINT32 = 2
2447
+ CU_TENSOR_MAP_DATA_TYPE_INT32 = 3
2448
+ CU_TENSOR_MAP_DATA_TYPE_UINT64 = 4
2449
+ CU_TENSOR_MAP_DATA_TYPE_INT64 = 5
2450
+ CU_TENSOR_MAP_DATA_TYPE_FLOAT16 = 6
2451
+ CU_TENSOR_MAP_DATA_TYPE_FLOAT32 = 7
2452
+ CU_TENSOR_MAP_DATA_TYPE_FLOAT64 = 8
2453
+ CU_TENSOR_MAP_DATA_TYPE_BFLOAT16 = 9
2454
+ CU_TENSOR_MAP_DATA_TYPE_FLOAT32_FTZ = 10
2455
+ CU_TENSOR_MAP_DATA_TYPE_TFLOAT32 = 11
2456
+ CU_TENSOR_MAP_DATA_TYPE_TFLOAT32_FTZ = 12
2457
+ CUtensorMapDataType_enum = ctypes.c_uint32 # enum
2458
+ CUtensorMapDataType = CUtensorMapDataType_enum
2459
+ CUtensorMapDataType__enumvalues = CUtensorMapDataType_enum__enumvalues
2460
+
2461
+ # values for enumeration 'CUtensorMapInterleave_enum'
2462
+ CUtensorMapInterleave_enum__enumvalues = {
2463
+ 0: 'CU_TENSOR_MAP_INTERLEAVE_NONE',
2464
+ 1: 'CU_TENSOR_MAP_INTERLEAVE_16B',
2465
+ 2: 'CU_TENSOR_MAP_INTERLEAVE_32B',
2466
+ }
2467
+ CU_TENSOR_MAP_INTERLEAVE_NONE = 0
2468
+ CU_TENSOR_MAP_INTERLEAVE_16B = 1
2469
+ CU_TENSOR_MAP_INTERLEAVE_32B = 2
2470
+ CUtensorMapInterleave_enum = ctypes.c_uint32 # enum
2471
+ CUtensorMapInterleave = CUtensorMapInterleave_enum
2472
+ CUtensorMapInterleave__enumvalues = CUtensorMapInterleave_enum__enumvalues
2473
+
2474
+ # values for enumeration 'CUtensorMapSwizzle_enum'
2475
+ CUtensorMapSwizzle_enum__enumvalues = {
2476
+ 0: 'CU_TENSOR_MAP_SWIZZLE_NONE',
2477
+ 1: 'CU_TENSOR_MAP_SWIZZLE_32B',
2478
+ 2: 'CU_TENSOR_MAP_SWIZZLE_64B',
2479
+ 3: 'CU_TENSOR_MAP_SWIZZLE_128B',
2480
+ }
2481
+ CU_TENSOR_MAP_SWIZZLE_NONE = 0
2482
+ CU_TENSOR_MAP_SWIZZLE_32B = 1
2483
+ CU_TENSOR_MAP_SWIZZLE_64B = 2
2484
+ CU_TENSOR_MAP_SWIZZLE_128B = 3
2485
+ CUtensorMapSwizzle_enum = ctypes.c_uint32 # enum
2486
+ CUtensorMapSwizzle = CUtensorMapSwizzle_enum
2487
+ CUtensorMapSwizzle__enumvalues = CUtensorMapSwizzle_enum__enumvalues
2488
+
2489
+ # values for enumeration 'CUtensorMapL2promotion_enum'
2490
+ CUtensorMapL2promotion_enum__enumvalues = {
2491
+ 0: 'CU_TENSOR_MAP_L2_PROMOTION_NONE',
2492
+ 1: 'CU_TENSOR_MAP_L2_PROMOTION_L2_64B',
2493
+ 2: 'CU_TENSOR_MAP_L2_PROMOTION_L2_128B',
2494
+ 3: 'CU_TENSOR_MAP_L2_PROMOTION_L2_256B',
2495
+ }
2496
+ CU_TENSOR_MAP_L2_PROMOTION_NONE = 0
2497
+ CU_TENSOR_MAP_L2_PROMOTION_L2_64B = 1
2498
+ CU_TENSOR_MAP_L2_PROMOTION_L2_128B = 2
2499
+ CU_TENSOR_MAP_L2_PROMOTION_L2_256B = 3
2500
+ CUtensorMapL2promotion_enum = ctypes.c_uint32 # enum
2501
+ CUtensorMapL2promotion = CUtensorMapL2promotion_enum
2502
+ CUtensorMapL2promotion__enumvalues = CUtensorMapL2promotion_enum__enumvalues
2503
+
2504
+ # values for enumeration 'CUtensorMapFloatOOBfill_enum'
2505
+ CUtensorMapFloatOOBfill_enum__enumvalues = {
2506
+ 0: 'CU_TENSOR_MAP_FLOAT_OOB_FILL_NONE',
2507
+ 1: 'CU_TENSOR_MAP_FLOAT_OOB_FILL_NAN_REQUEST_ZERO_FMA',
2508
+ }
2509
+ CU_TENSOR_MAP_FLOAT_OOB_FILL_NONE = 0
2510
+ CU_TENSOR_MAP_FLOAT_OOB_FILL_NAN_REQUEST_ZERO_FMA = 1
2511
+ CUtensorMapFloatOOBfill_enum = ctypes.c_uint32 # enum
2512
+ CUtensorMapFloatOOBfill = CUtensorMapFloatOOBfill_enum
2513
+ CUtensorMapFloatOOBfill__enumvalues = CUtensorMapFloatOOBfill_enum__enumvalues
2067
2514
  class struct_CUDA_POINTER_ATTRIBUTE_P2P_TOKENS_st(Structure):
2068
2515
  pass
2069
2516
 
@@ -2456,6 +2903,17 @@ CUmemAllocationGranularity_flags_enum = ctypes.c_uint32 # enum
2456
2903
  CUmemAllocationGranularity_flags = CUmemAllocationGranularity_flags_enum
2457
2904
  CUmemAllocationGranularity_flags__enumvalues = CUmemAllocationGranularity_flags_enum__enumvalues
2458
2905
 
2906
+ # values for enumeration 'CUmemRangeHandleType_enum'
2907
+ CUmemRangeHandleType_enum__enumvalues = {
2908
+ 1: 'CU_MEM_RANGE_HANDLE_TYPE_DMA_BUF_FD',
2909
+ 2147483647: 'CU_MEM_RANGE_HANDLE_TYPE_MAX',
2910
+ }
2911
+ CU_MEM_RANGE_HANDLE_TYPE_DMA_BUF_FD = 1
2912
+ CU_MEM_RANGE_HANDLE_TYPE_MAX = 2147483647
2913
+ CUmemRangeHandleType_enum = ctypes.c_uint32 # enum
2914
+ CUmemRangeHandleType = CUmemRangeHandleType_enum
2915
+ CUmemRangeHandleType__enumvalues = CUmemRangeHandleType_enum__enumvalues
2916
+
2459
2917
  # values for enumeration 'CUarraySparseSubresourceType_enum'
2460
2918
  CUarraySparseSubresourceType_enum__enumvalues = {
2461
2919
  0: 'CU_ARRAY_SPARSE_SUBRESOURCE_TYPE_SPARSE_LEVEL',
@@ -2628,6 +3086,7 @@ CUgraphExecUpdateResult_enum__enumvalues = {
2628
3086
  5: 'CU_GRAPH_EXEC_UPDATE_ERROR_PARAMETERS_CHANGED',
2629
3087
  6: 'CU_GRAPH_EXEC_UPDATE_ERROR_NOT_SUPPORTED',
2630
3088
  7: 'CU_GRAPH_EXEC_UPDATE_ERROR_UNSUPPORTED_FUNCTION_CHANGE',
3089
+ 8: 'CU_GRAPH_EXEC_UPDATE_ERROR_ATTRIBUTES_CHANGED',
2631
3090
  }
2632
3091
  CU_GRAPH_EXEC_UPDATE_SUCCESS = 0
2633
3092
  CU_GRAPH_EXEC_UPDATE_ERROR = 1
@@ -2637,9 +3096,23 @@ CU_GRAPH_EXEC_UPDATE_ERROR_FUNCTION_CHANGED = 4
2637
3096
  CU_GRAPH_EXEC_UPDATE_ERROR_PARAMETERS_CHANGED = 5
2638
3097
  CU_GRAPH_EXEC_UPDATE_ERROR_NOT_SUPPORTED = 6
2639
3098
  CU_GRAPH_EXEC_UPDATE_ERROR_UNSUPPORTED_FUNCTION_CHANGE = 7
3099
+ CU_GRAPH_EXEC_UPDATE_ERROR_ATTRIBUTES_CHANGED = 8
2640
3100
  CUgraphExecUpdateResult_enum = ctypes.c_uint32 # enum
2641
3101
  CUgraphExecUpdateResult = CUgraphExecUpdateResult_enum
2642
3102
  CUgraphExecUpdateResult__enumvalues = CUgraphExecUpdateResult_enum__enumvalues
3103
+ class struct_CUgraphExecUpdateResultInfo_st(Structure):
3104
+ pass
3105
+
3106
+ struct_CUgraphExecUpdateResultInfo_st._pack_ = 1 # source:False
3107
+ struct_CUgraphExecUpdateResultInfo_st._fields_ = [
3108
+ ('result', CUgraphExecUpdateResult),
3109
+ ('PADDING_0', ctypes.c_ubyte * 4),
3110
+ ('errorNode', ctypes.POINTER(struct_CUgraphNode_st)),
3111
+ ('errorFromNode', ctypes.POINTER(struct_CUgraphNode_st)),
3112
+ ]
3113
+
3114
+ CUgraphExecUpdateResultInfo_v1 = struct_CUgraphExecUpdateResultInfo_st
3115
+ CUgraphExecUpdateResultInfo = struct_CUgraphExecUpdateResultInfo_st
2643
3116
 
2644
3117
  # values for enumeration 'CUmemPool_attribute_enum'
2645
3118
  CUmemPool_attribute_enum__enumvalues = {
@@ -2775,6 +3248,8 @@ CUgraphDebugDot_flags_enum__enumvalues = {
2775
3248
  1024: 'CU_GRAPH_DEBUG_DOT_FLAGS_HANDLES',
2776
3249
  2048: 'CU_GRAPH_DEBUG_DOT_FLAGS_MEM_ALLOC_NODE_PARAMS',
2777
3250
  4096: 'CU_GRAPH_DEBUG_DOT_FLAGS_MEM_FREE_NODE_PARAMS',
3251
+ 8192: 'CU_GRAPH_DEBUG_DOT_FLAGS_BATCH_MEM_OP_NODE_PARAMS',
3252
+ 16384: 'CU_GRAPH_DEBUG_DOT_FLAGS_EXTRA_TOPO_INFO',
2778
3253
  }
2779
3254
  CU_GRAPH_DEBUG_DOT_FLAGS_VERBOSE = 1
2780
3255
  CU_GRAPH_DEBUG_DOT_FLAGS_RUNTIME_TYPES = 2
@@ -2789,6 +3264,8 @@ CU_GRAPH_DEBUG_DOT_FLAGS_KERNEL_NODE_ATTRIBUTES = 512
2789
3264
  CU_GRAPH_DEBUG_DOT_FLAGS_HANDLES = 1024
2790
3265
  CU_GRAPH_DEBUG_DOT_FLAGS_MEM_ALLOC_NODE_PARAMS = 2048
2791
3266
  CU_GRAPH_DEBUG_DOT_FLAGS_MEM_FREE_NODE_PARAMS = 4096
3267
+ CU_GRAPH_DEBUG_DOT_FLAGS_BATCH_MEM_OP_NODE_PARAMS = 8192
3268
+ CU_GRAPH_DEBUG_DOT_FLAGS_EXTRA_TOPO_INFO = 16384
2792
3269
  CUgraphDebugDot_flags_enum = ctypes.c_uint32 # enum
2793
3270
  CUgraphDebugDot_flags = CUgraphDebugDot_flags_enum
2794
3271
  CUgraphDebugDot_flags__enumvalues = CUgraphDebugDot_flags_enum__enumvalues
@@ -2814,8 +3291,14 @@ CUuserObjectRetain_flags__enumvalues = CUuserObjectRetain_flags_enum__enumvalues
2814
3291
  # values for enumeration 'CUgraphInstantiate_flags_enum'
2815
3292
  CUgraphInstantiate_flags_enum__enumvalues = {
2816
3293
  1: 'CUDA_GRAPH_INSTANTIATE_FLAG_AUTO_FREE_ON_LAUNCH',
3294
+ 2: 'CUDA_GRAPH_INSTANTIATE_FLAG_UPLOAD',
3295
+ 4: 'CUDA_GRAPH_INSTANTIATE_FLAG_DEVICE_LAUNCH',
3296
+ 8: 'CUDA_GRAPH_INSTANTIATE_FLAG_USE_NODE_PRIORITY',
2817
3297
  }
2818
3298
  CUDA_GRAPH_INSTANTIATE_FLAG_AUTO_FREE_ON_LAUNCH = 1
3299
+ CUDA_GRAPH_INSTANTIATE_FLAG_UPLOAD = 2
3300
+ CUDA_GRAPH_INSTANTIATE_FLAG_DEVICE_LAUNCH = 4
3301
+ CUDA_GRAPH_INSTANTIATE_FLAG_USE_NODE_PRIORITY = 8
2819
3302
  CUgraphInstantiate_flags_enum = ctypes.c_uint32 # enum
2820
3303
  CUgraphInstantiate_flags = CUgraphInstantiate_flags_enum
2821
3304
  CUgraphInstantiate_flags__enumvalues = CUgraphInstantiate_flags_enum__enumvalues
@@ -2921,6 +3404,12 @@ try:
2921
3404
  cuDeviceGetDefaultMemPool.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUmemPoolHandle_st)), CUdevice]
2922
3405
  except AttributeError:
2923
3406
  pass
3407
+ try:
3408
+ cuDeviceGetExecAffinitySupport = _libraries['libcuda.so'].cuDeviceGetExecAffinitySupport
3409
+ cuDeviceGetExecAffinitySupport.restype = CUresult
3410
+ cuDeviceGetExecAffinitySupport.argtypes = [ctypes.POINTER(ctypes.c_int32), CUexecAffinityType, CUdevice]
3411
+ except AttributeError:
3412
+ pass
2924
3413
  try:
2925
3414
  cuFlushGPUDirectRDMAWrites = _libraries['libcuda.so'].cuFlushGPUDirectRDMAWrites
2926
3415
  cuFlushGPUDirectRDMAWrites.restype = CUresult
@@ -2969,12 +3458,6 @@ try:
2969
3458
  cuDevicePrimaryCtxReset_v2.argtypes = [CUdevice]
2970
3459
  except AttributeError:
2971
3460
  pass
2972
- try:
2973
- cuDeviceGetExecAffinitySupport = _libraries['libcuda.so'].cuDeviceGetExecAffinitySupport
2974
- cuDeviceGetExecAffinitySupport.restype = CUresult
2975
- cuDeviceGetExecAffinitySupport.argtypes = [ctypes.POINTER(ctypes.c_int32), CUexecAffinityType, CUdevice]
2976
- except AttributeError:
2977
- pass
2978
3461
  try:
2979
3462
  cuCtxCreate_v2 = _libraries['libcuda.so'].cuCtxCreate_v2
2980
3463
  cuCtxCreate_v2.restype = CUresult
@@ -3029,6 +3512,12 @@ try:
3029
3512
  cuCtxGetFlags.argtypes = [ctypes.POINTER(ctypes.c_uint32)]
3030
3513
  except AttributeError:
3031
3514
  pass
3515
+ try:
3516
+ cuCtxGetId = _libraries['libcuda.so'].cuCtxGetId
3517
+ cuCtxGetId.restype = CUresult
3518
+ cuCtxGetId.argtypes = [CUcontext, ctypes.POINTER(ctypes.c_uint64)]
3519
+ except AttributeError:
3520
+ pass
3032
3521
  try:
3033
3522
  cuCtxSynchronize = _libraries['libcuda.so'].cuCtxSynchronize
3034
3523
  cuCtxSynchronize.restype = CUresult
@@ -3138,6 +3627,23 @@ try:
3138
3627
  cuModuleUnload.argtypes = [CUmodule]
3139
3628
  except AttributeError:
3140
3629
  pass
3630
+
3631
+ # values for enumeration 'CUmoduleLoadingMode_enum'
3632
+ CUmoduleLoadingMode_enum__enumvalues = {
3633
+ 1: 'CU_MODULE_EAGER_LOADING',
3634
+ 2: 'CU_MODULE_LAZY_LOADING',
3635
+ }
3636
+ CU_MODULE_EAGER_LOADING = 1
3637
+ CU_MODULE_LAZY_LOADING = 2
3638
+ CUmoduleLoadingMode_enum = ctypes.c_uint32 # enum
3639
+ CUmoduleLoadingMode = CUmoduleLoadingMode_enum
3640
+ CUmoduleLoadingMode__enumvalues = CUmoduleLoadingMode_enum__enumvalues
3641
+ try:
3642
+ cuModuleGetLoadingMode = _libraries['libcuda.so'].cuModuleGetLoadingMode
3643
+ cuModuleGetLoadingMode.restype = CUresult
3644
+ cuModuleGetLoadingMode.argtypes = [ctypes.POINTER(CUmoduleLoadingMode_enum)]
3645
+ except AttributeError:
3646
+ pass
3141
3647
  try:
3142
3648
  cuModuleGetFunction = _libraries['libcuda.so'].cuModuleGetFunction
3143
3649
  cuModuleGetFunction.restype = CUresult
@@ -3150,18 +3656,6 @@ try:
3150
3656
  cuModuleGetGlobal_v2.argtypes = [ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.c_uint64), CUmodule, ctypes.POINTER(ctypes.c_char)]
3151
3657
  except AttributeError:
3152
3658
  pass
3153
- try:
3154
- cuModuleGetTexRef = _libraries['libcuda.so'].cuModuleGetTexRef
3155
- cuModuleGetTexRef.restype = CUresult
3156
- cuModuleGetTexRef.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUtexref_st)), CUmodule, ctypes.POINTER(ctypes.c_char)]
3157
- except AttributeError:
3158
- pass
3159
- try:
3160
- cuModuleGetSurfRef = _libraries['libcuda.so'].cuModuleGetSurfRef
3161
- cuModuleGetSurfRef.restype = CUresult
3162
- cuModuleGetSurfRef.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUsurfref_st)), CUmodule, ctypes.POINTER(ctypes.c_char)]
3163
- except AttributeError:
3164
- pass
3165
3659
  try:
3166
3660
  cuLinkCreate_v2 = _libraries['libcuda.so'].cuLinkCreate_v2
3167
3661
  cuLinkCreate_v2.restype = CUresult
@@ -3192,6 +3686,90 @@ try:
3192
3686
  cuLinkDestroy.argtypes = [CUlinkState]
3193
3687
  except AttributeError:
3194
3688
  pass
3689
+ try:
3690
+ cuModuleGetTexRef = _libraries['libcuda.so'].cuModuleGetTexRef
3691
+ cuModuleGetTexRef.restype = CUresult
3692
+ cuModuleGetTexRef.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUtexref_st)), CUmodule, ctypes.POINTER(ctypes.c_char)]
3693
+ except AttributeError:
3694
+ pass
3695
+ try:
3696
+ cuModuleGetSurfRef = _libraries['libcuda.so'].cuModuleGetSurfRef
3697
+ cuModuleGetSurfRef.restype = CUresult
3698
+ cuModuleGetSurfRef.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUsurfref_st)), CUmodule, ctypes.POINTER(ctypes.c_char)]
3699
+ except AttributeError:
3700
+ pass
3701
+ try:
3702
+ cuLibraryLoadData = _libraries['libcuda.so'].cuLibraryLoadData
3703
+ cuLibraryLoadData.restype = CUresult
3704
+ cuLibraryLoadData.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUlib_st)), ctypes.POINTER(None), ctypes.POINTER(CUjit_option_enum), ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_uint32, ctypes.POINTER(CUlibraryOption_enum), ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_uint32]
3705
+ except AttributeError:
3706
+ pass
3707
+ try:
3708
+ cuLibraryLoadFromFile = _libraries['libcuda.so'].cuLibraryLoadFromFile
3709
+ cuLibraryLoadFromFile.restype = CUresult
3710
+ cuLibraryLoadFromFile.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUlib_st)), ctypes.POINTER(ctypes.c_char), ctypes.POINTER(CUjit_option_enum), ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_uint32, ctypes.POINTER(CUlibraryOption_enum), ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_uint32]
3711
+ except AttributeError:
3712
+ pass
3713
+ try:
3714
+ cuLibraryUnload = _libraries['libcuda.so'].cuLibraryUnload
3715
+ cuLibraryUnload.restype = CUresult
3716
+ cuLibraryUnload.argtypes = [CUlibrary]
3717
+ except AttributeError:
3718
+ pass
3719
+ try:
3720
+ cuLibraryGetKernel = _libraries['libcuda.so'].cuLibraryGetKernel
3721
+ cuLibraryGetKernel.restype = CUresult
3722
+ cuLibraryGetKernel.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUkern_st)), CUlibrary, ctypes.POINTER(ctypes.c_char)]
3723
+ except AttributeError:
3724
+ pass
3725
+ try:
3726
+ cuLibraryGetModule = _libraries['libcuda.so'].cuLibraryGetModule
3727
+ cuLibraryGetModule.restype = CUresult
3728
+ cuLibraryGetModule.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUmod_st)), CUlibrary]
3729
+ except AttributeError:
3730
+ pass
3731
+ try:
3732
+ cuKernelGetFunction = _libraries['libcuda.so'].cuKernelGetFunction
3733
+ cuKernelGetFunction.restype = CUresult
3734
+ cuKernelGetFunction.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUfunc_st)), CUkernel]
3735
+ except AttributeError:
3736
+ pass
3737
+ try:
3738
+ cuLibraryGetGlobal = _libraries['libcuda.so'].cuLibraryGetGlobal
3739
+ cuLibraryGetGlobal.restype = CUresult
3740
+ cuLibraryGetGlobal.argtypes = [ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.c_uint64), CUlibrary, ctypes.POINTER(ctypes.c_char)]
3741
+ except AttributeError:
3742
+ pass
3743
+ try:
3744
+ cuLibraryGetManaged = _libraries['libcuda.so'].cuLibraryGetManaged
3745
+ cuLibraryGetManaged.restype = CUresult
3746
+ cuLibraryGetManaged.argtypes = [ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.c_uint64), CUlibrary, ctypes.POINTER(ctypes.c_char)]
3747
+ except AttributeError:
3748
+ pass
3749
+ try:
3750
+ cuLibraryGetUnifiedFunction = _libraries['libcuda.so'].cuLibraryGetUnifiedFunction
3751
+ cuLibraryGetUnifiedFunction.restype = CUresult
3752
+ cuLibraryGetUnifiedFunction.argtypes = [ctypes.POINTER(ctypes.POINTER(None)), CUlibrary, ctypes.POINTER(ctypes.c_char)]
3753
+ except AttributeError:
3754
+ pass
3755
+ try:
3756
+ cuKernelGetAttribute = _libraries['libcuda.so'].cuKernelGetAttribute
3757
+ cuKernelGetAttribute.restype = CUresult
3758
+ cuKernelGetAttribute.argtypes = [ctypes.POINTER(ctypes.c_int32), CUfunction_attribute, CUkernel, CUdevice]
3759
+ except AttributeError:
3760
+ pass
3761
+ try:
3762
+ cuKernelSetAttribute = _libraries['libcuda.so'].cuKernelSetAttribute
3763
+ cuKernelSetAttribute.restype = CUresult
3764
+ cuKernelSetAttribute.argtypes = [CUfunction_attribute, ctypes.c_int32, CUkernel, CUdevice]
3765
+ except AttributeError:
3766
+ pass
3767
+ try:
3768
+ cuKernelSetCacheConfig = _libraries['libcuda.so'].cuKernelSetCacheConfig
3769
+ cuKernelSetCacheConfig.restype = CUresult
3770
+ cuKernelSetCacheConfig.argtypes = [CUkernel, CUfunc_cache, CUdevice]
3771
+ except AttributeError:
3772
+ pass
3195
3773
  try:
3196
3774
  cuMemGetInfo_v2 = _libraries['libcuda.so'].cuMemGetInfo_v2
3197
3775
  cuMemGetInfo_v2.restype = CUresult
@@ -3313,219 +3891,219 @@ try:
3313
3891
  except AttributeError:
3314
3892
  pass
3315
3893
  try:
3316
- cuMemcpy = _libraries['libcuda.so'].cuMemcpy
3317
- cuMemcpy.restype = CUresult
3318
- cuMemcpy.argtypes = [CUdeviceptr, CUdeviceptr, size_t]
3894
+ cuMemcpy_ptds = _libraries['libcuda.so'].cuMemcpy_ptds
3895
+ cuMemcpy_ptds.restype = CUresult
3896
+ cuMemcpy_ptds.argtypes = [CUdeviceptr, CUdeviceptr, size_t]
3319
3897
  except AttributeError:
3320
3898
  pass
3321
3899
  try:
3322
- cuMemcpyPeer = _libraries['libcuda.so'].cuMemcpyPeer
3323
- cuMemcpyPeer.restype = CUresult
3324
- cuMemcpyPeer.argtypes = [CUdeviceptr, CUcontext, CUdeviceptr, CUcontext, size_t]
3900
+ cuMemcpyPeer_ptds = _libraries['libcuda.so'].cuMemcpyPeer_ptds
3901
+ cuMemcpyPeer_ptds.restype = CUresult
3902
+ cuMemcpyPeer_ptds.argtypes = [CUdeviceptr, CUcontext, CUdeviceptr, CUcontext, size_t]
3325
3903
  except AttributeError:
3326
3904
  pass
3327
3905
  try:
3328
- cuMemcpyHtoD_v2 = _libraries['libcuda.so'].cuMemcpyHtoD_v2
3329
- cuMemcpyHtoD_v2.restype = CUresult
3330
- cuMemcpyHtoD_v2.argtypes = [CUdeviceptr, ctypes.POINTER(None), size_t]
3906
+ cuMemcpyHtoD_v2_ptds = _libraries['libcuda.so'].cuMemcpyHtoD_v2_ptds
3907
+ cuMemcpyHtoD_v2_ptds.restype = CUresult
3908
+ cuMemcpyHtoD_v2_ptds.argtypes = [CUdeviceptr, ctypes.POINTER(None), size_t]
3331
3909
  except AttributeError:
3332
3910
  pass
3333
3911
  try:
3334
- cuMemcpyDtoH_v2 = _libraries['libcuda.so'].cuMemcpyDtoH_v2
3335
- cuMemcpyDtoH_v2.restype = CUresult
3336
- cuMemcpyDtoH_v2.argtypes = [ctypes.POINTER(None), CUdeviceptr, size_t]
3912
+ cuMemcpyDtoH_v2_ptds = _libraries['libcuda.so'].cuMemcpyDtoH_v2_ptds
3913
+ cuMemcpyDtoH_v2_ptds.restype = CUresult
3914
+ cuMemcpyDtoH_v2_ptds.argtypes = [ctypes.POINTER(None), CUdeviceptr, size_t]
3337
3915
  except AttributeError:
3338
3916
  pass
3339
3917
  try:
3340
- cuMemcpyDtoD_v2 = _libraries['libcuda.so'].cuMemcpyDtoD_v2
3341
- cuMemcpyDtoD_v2.restype = CUresult
3342
- cuMemcpyDtoD_v2.argtypes = [CUdeviceptr, CUdeviceptr, size_t]
3918
+ cuMemcpyDtoD_v2_ptds = _libraries['libcuda.so'].cuMemcpyDtoD_v2_ptds
3919
+ cuMemcpyDtoD_v2_ptds.restype = CUresult
3920
+ cuMemcpyDtoD_v2_ptds.argtypes = [CUdeviceptr, CUdeviceptr, size_t]
3343
3921
  except AttributeError:
3344
3922
  pass
3345
3923
  try:
3346
- cuMemcpyDtoA_v2 = _libraries['libcuda.so'].cuMemcpyDtoA_v2
3347
- cuMemcpyDtoA_v2.restype = CUresult
3348
- cuMemcpyDtoA_v2.argtypes = [CUarray, size_t, CUdeviceptr, size_t]
3924
+ cuMemcpyDtoA_v2_ptds = _libraries['libcuda.so'].cuMemcpyDtoA_v2_ptds
3925
+ cuMemcpyDtoA_v2_ptds.restype = CUresult
3926
+ cuMemcpyDtoA_v2_ptds.argtypes = [CUarray, size_t, CUdeviceptr, size_t]
3349
3927
  except AttributeError:
3350
3928
  pass
3351
3929
  try:
3352
- cuMemcpyAtoD_v2 = _libraries['libcuda.so'].cuMemcpyAtoD_v2
3353
- cuMemcpyAtoD_v2.restype = CUresult
3354
- cuMemcpyAtoD_v2.argtypes = [CUdeviceptr, CUarray, size_t, size_t]
3930
+ cuMemcpyAtoD_v2_ptds = _libraries['libcuda.so'].cuMemcpyAtoD_v2_ptds
3931
+ cuMemcpyAtoD_v2_ptds.restype = CUresult
3932
+ cuMemcpyAtoD_v2_ptds.argtypes = [CUdeviceptr, CUarray, size_t, size_t]
3355
3933
  except AttributeError:
3356
3934
  pass
3357
3935
  try:
3358
- cuMemcpyHtoA_v2 = _libraries['libcuda.so'].cuMemcpyHtoA_v2
3359
- cuMemcpyHtoA_v2.restype = CUresult
3360
- cuMemcpyHtoA_v2.argtypes = [CUarray, size_t, ctypes.POINTER(None), size_t]
3936
+ cuMemcpyHtoA_v2_ptds = _libraries['libcuda.so'].cuMemcpyHtoA_v2_ptds
3937
+ cuMemcpyHtoA_v2_ptds.restype = CUresult
3938
+ cuMemcpyHtoA_v2_ptds.argtypes = [CUarray, size_t, ctypes.POINTER(None), size_t]
3361
3939
  except AttributeError:
3362
3940
  pass
3363
3941
  try:
3364
- cuMemcpyAtoH_v2 = _libraries['libcuda.so'].cuMemcpyAtoH_v2
3365
- cuMemcpyAtoH_v2.restype = CUresult
3366
- cuMemcpyAtoH_v2.argtypes = [ctypes.POINTER(None), CUarray, size_t, size_t]
3942
+ cuMemcpyAtoH_v2_ptds = _libraries['libcuda.so'].cuMemcpyAtoH_v2_ptds
3943
+ cuMemcpyAtoH_v2_ptds.restype = CUresult
3944
+ cuMemcpyAtoH_v2_ptds.argtypes = [ctypes.POINTER(None), CUarray, size_t, size_t]
3367
3945
  except AttributeError:
3368
3946
  pass
3369
3947
  try:
3370
- cuMemcpyAtoA_v2 = _libraries['libcuda.so'].cuMemcpyAtoA_v2
3371
- cuMemcpyAtoA_v2.restype = CUresult
3372
- cuMemcpyAtoA_v2.argtypes = [CUarray, size_t, CUarray, size_t, size_t]
3948
+ cuMemcpyAtoA_v2_ptds = _libraries['libcuda.so'].cuMemcpyAtoA_v2_ptds
3949
+ cuMemcpyAtoA_v2_ptds.restype = CUresult
3950
+ cuMemcpyAtoA_v2_ptds.argtypes = [CUarray, size_t, CUarray, size_t, size_t]
3373
3951
  except AttributeError:
3374
3952
  pass
3375
3953
  try:
3376
- cuMemcpy2D_v2 = _libraries['libcuda.so'].cuMemcpy2D_v2
3377
- cuMemcpy2D_v2.restype = CUresult
3378
- cuMemcpy2D_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st)]
3954
+ cuMemcpy2D_v2_ptds = _libraries['libcuda.so'].cuMemcpy2D_v2_ptds
3955
+ cuMemcpy2D_v2_ptds.restype = CUresult
3956
+ cuMemcpy2D_v2_ptds.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st)]
3379
3957
  except AttributeError:
3380
3958
  pass
3381
3959
  try:
3382
- cuMemcpy2DUnaligned_v2 = _libraries['libcuda.so'].cuMemcpy2DUnaligned_v2
3383
- cuMemcpy2DUnaligned_v2.restype = CUresult
3384
- cuMemcpy2DUnaligned_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st)]
3960
+ cuMemcpy2DUnaligned_v2_ptds = _libraries['libcuda.so'].cuMemcpy2DUnaligned_v2_ptds
3961
+ cuMemcpy2DUnaligned_v2_ptds.restype = CUresult
3962
+ cuMemcpy2DUnaligned_v2_ptds.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st)]
3385
3963
  except AttributeError:
3386
3964
  pass
3387
3965
  try:
3388
- cuMemcpy3D_v2 = _libraries['libcuda.so'].cuMemcpy3D_v2
3389
- cuMemcpy3D_v2.restype = CUresult
3390
- cuMemcpy3D_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_st)]
3966
+ cuMemcpy3D_v2_ptds = _libraries['libcuda.so'].cuMemcpy3D_v2_ptds
3967
+ cuMemcpy3D_v2_ptds.restype = CUresult
3968
+ cuMemcpy3D_v2_ptds.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_st)]
3391
3969
  except AttributeError:
3392
3970
  pass
3393
3971
  try:
3394
- cuMemcpy3DPeer = _libraries['libcuda.so'].cuMemcpy3DPeer
3395
- cuMemcpy3DPeer.restype = CUresult
3396
- cuMemcpy3DPeer.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_PEER_st)]
3972
+ cuMemcpy3DPeer_ptds = _libraries['libcuda.so'].cuMemcpy3DPeer_ptds
3973
+ cuMemcpy3DPeer_ptds.restype = CUresult
3974
+ cuMemcpy3DPeer_ptds.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_PEER_st)]
3397
3975
  except AttributeError:
3398
3976
  pass
3399
3977
  try:
3400
- cuMemcpyAsync = _libraries['libcuda.so'].cuMemcpyAsync
3401
- cuMemcpyAsync.restype = CUresult
3402
- cuMemcpyAsync.argtypes = [CUdeviceptr, CUdeviceptr, size_t, CUstream]
3978
+ cuMemcpyAsync_ptsz = _libraries['libcuda.so'].cuMemcpyAsync_ptsz
3979
+ cuMemcpyAsync_ptsz.restype = CUresult
3980
+ cuMemcpyAsync_ptsz.argtypes = [CUdeviceptr, CUdeviceptr, size_t, CUstream]
3403
3981
  except AttributeError:
3404
3982
  pass
3405
3983
  try:
3406
- cuMemcpyPeerAsync = _libraries['libcuda.so'].cuMemcpyPeerAsync
3407
- cuMemcpyPeerAsync.restype = CUresult
3408
- cuMemcpyPeerAsync.argtypes = [CUdeviceptr, CUcontext, CUdeviceptr, CUcontext, size_t, CUstream]
3984
+ cuMemcpyPeerAsync_ptsz = _libraries['libcuda.so'].cuMemcpyPeerAsync_ptsz
3985
+ cuMemcpyPeerAsync_ptsz.restype = CUresult
3986
+ cuMemcpyPeerAsync_ptsz.argtypes = [CUdeviceptr, CUcontext, CUdeviceptr, CUcontext, size_t, CUstream]
3409
3987
  except AttributeError:
3410
3988
  pass
3411
3989
  try:
3412
- cuMemcpyHtoDAsync_v2 = _libraries['libcuda.so'].cuMemcpyHtoDAsync_v2
3413
- cuMemcpyHtoDAsync_v2.restype = CUresult
3414
- cuMemcpyHtoDAsync_v2.argtypes = [CUdeviceptr, ctypes.POINTER(None), size_t, CUstream]
3990
+ cuMemcpyHtoDAsync_v2_ptsz = _libraries['libcuda.so'].cuMemcpyHtoDAsync_v2_ptsz
3991
+ cuMemcpyHtoDAsync_v2_ptsz.restype = CUresult
3992
+ cuMemcpyHtoDAsync_v2_ptsz.argtypes = [CUdeviceptr, ctypes.POINTER(None), size_t, CUstream]
3415
3993
  except AttributeError:
3416
3994
  pass
3417
3995
  try:
3418
- cuMemcpyDtoHAsync_v2 = _libraries['libcuda.so'].cuMemcpyDtoHAsync_v2
3419
- cuMemcpyDtoHAsync_v2.restype = CUresult
3420
- cuMemcpyDtoHAsync_v2.argtypes = [ctypes.POINTER(None), CUdeviceptr, size_t, CUstream]
3996
+ cuMemcpyDtoHAsync_v2_ptsz = _libraries['libcuda.so'].cuMemcpyDtoHAsync_v2_ptsz
3997
+ cuMemcpyDtoHAsync_v2_ptsz.restype = CUresult
3998
+ cuMemcpyDtoHAsync_v2_ptsz.argtypes = [ctypes.POINTER(None), CUdeviceptr, size_t, CUstream]
3421
3999
  except AttributeError:
3422
4000
  pass
3423
4001
  try:
3424
- cuMemcpyDtoDAsync_v2 = _libraries['libcuda.so'].cuMemcpyDtoDAsync_v2
3425
- cuMemcpyDtoDAsync_v2.restype = CUresult
3426
- cuMemcpyDtoDAsync_v2.argtypes = [CUdeviceptr, CUdeviceptr, size_t, CUstream]
4002
+ cuMemcpyDtoDAsync_v2_ptsz = _libraries['libcuda.so'].cuMemcpyDtoDAsync_v2_ptsz
4003
+ cuMemcpyDtoDAsync_v2_ptsz.restype = CUresult
4004
+ cuMemcpyDtoDAsync_v2_ptsz.argtypes = [CUdeviceptr, CUdeviceptr, size_t, CUstream]
3427
4005
  except AttributeError:
3428
4006
  pass
3429
4007
  try:
3430
- cuMemcpyHtoAAsync_v2 = _libraries['libcuda.so'].cuMemcpyHtoAAsync_v2
3431
- cuMemcpyHtoAAsync_v2.restype = CUresult
3432
- cuMemcpyHtoAAsync_v2.argtypes = [CUarray, size_t, ctypes.POINTER(None), size_t, CUstream]
4008
+ cuMemcpyHtoAAsync_v2_ptsz = _libraries['libcuda.so'].cuMemcpyHtoAAsync_v2_ptsz
4009
+ cuMemcpyHtoAAsync_v2_ptsz.restype = CUresult
4010
+ cuMemcpyHtoAAsync_v2_ptsz.argtypes = [CUarray, size_t, ctypes.POINTER(None), size_t, CUstream]
3433
4011
  except AttributeError:
3434
4012
  pass
3435
4013
  try:
3436
- cuMemcpyAtoHAsync_v2 = _libraries['libcuda.so'].cuMemcpyAtoHAsync_v2
3437
- cuMemcpyAtoHAsync_v2.restype = CUresult
3438
- cuMemcpyAtoHAsync_v2.argtypes = [ctypes.POINTER(None), CUarray, size_t, size_t, CUstream]
4014
+ cuMemcpyAtoHAsync_v2_ptsz = _libraries['libcuda.so'].cuMemcpyAtoHAsync_v2_ptsz
4015
+ cuMemcpyAtoHAsync_v2_ptsz.restype = CUresult
4016
+ cuMemcpyAtoHAsync_v2_ptsz.argtypes = [ctypes.POINTER(None), CUarray, size_t, size_t, CUstream]
3439
4017
  except AttributeError:
3440
4018
  pass
3441
4019
  try:
3442
- cuMemcpy2DAsync_v2 = _libraries['libcuda.so'].cuMemcpy2DAsync_v2
3443
- cuMemcpy2DAsync_v2.restype = CUresult
3444
- cuMemcpy2DAsync_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st), CUstream]
4020
+ cuMemcpy2DAsync_v2_ptsz = _libraries['libcuda.so'].cuMemcpy2DAsync_v2_ptsz
4021
+ cuMemcpy2DAsync_v2_ptsz.restype = CUresult
4022
+ cuMemcpy2DAsync_v2_ptsz.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st), CUstream]
3445
4023
  except AttributeError:
3446
4024
  pass
3447
4025
  try:
3448
- cuMemcpy3DAsync_v2 = _libraries['libcuda.so'].cuMemcpy3DAsync_v2
3449
- cuMemcpy3DAsync_v2.restype = CUresult
3450
- cuMemcpy3DAsync_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_st), CUstream]
4026
+ cuMemcpy3DAsync_v2_ptsz = _libraries['libcuda.so'].cuMemcpy3DAsync_v2_ptsz
4027
+ cuMemcpy3DAsync_v2_ptsz.restype = CUresult
4028
+ cuMemcpy3DAsync_v2_ptsz.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_st), CUstream]
3451
4029
  except AttributeError:
3452
4030
  pass
3453
4031
  try:
3454
- cuMemcpy3DPeerAsync = _libraries['libcuda.so'].cuMemcpy3DPeerAsync
3455
- cuMemcpy3DPeerAsync.restype = CUresult
3456
- cuMemcpy3DPeerAsync.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_PEER_st), CUstream]
4032
+ cuMemcpy3DPeerAsync_ptsz = _libraries['libcuda.so'].cuMemcpy3DPeerAsync_ptsz
4033
+ cuMemcpy3DPeerAsync_ptsz.restype = CUresult
4034
+ cuMemcpy3DPeerAsync_ptsz.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_PEER_st), CUstream]
3457
4035
  except AttributeError:
3458
4036
  pass
3459
4037
  try:
3460
- cuMemsetD8_v2 = _libraries['libcuda.so'].cuMemsetD8_v2
3461
- cuMemsetD8_v2.restype = CUresult
3462
- cuMemsetD8_v2.argtypes = [CUdeviceptr, ctypes.c_ubyte, size_t]
4038
+ cuMemsetD8_v2_ptds = _libraries['libcuda.so'].cuMemsetD8_v2_ptds
4039
+ cuMemsetD8_v2_ptds.restype = CUresult
4040
+ cuMemsetD8_v2_ptds.argtypes = [CUdeviceptr, ctypes.c_ubyte, size_t]
3463
4041
  except AttributeError:
3464
4042
  pass
3465
4043
  try:
3466
- cuMemsetD16_v2 = _libraries['libcuda.so'].cuMemsetD16_v2
3467
- cuMemsetD16_v2.restype = CUresult
3468
- cuMemsetD16_v2.argtypes = [CUdeviceptr, ctypes.c_uint16, size_t]
4044
+ cuMemsetD16_v2_ptds = _libraries['libcuda.so'].cuMemsetD16_v2_ptds
4045
+ cuMemsetD16_v2_ptds.restype = CUresult
4046
+ cuMemsetD16_v2_ptds.argtypes = [CUdeviceptr, ctypes.c_uint16, size_t]
3469
4047
  except AttributeError:
3470
4048
  pass
3471
4049
  try:
3472
- cuMemsetD32_v2 = _libraries['libcuda.so'].cuMemsetD32_v2
3473
- cuMemsetD32_v2.restype = CUresult
3474
- cuMemsetD32_v2.argtypes = [CUdeviceptr, ctypes.c_uint32, size_t]
4050
+ cuMemsetD32_v2_ptds = _libraries['libcuda.so'].cuMemsetD32_v2_ptds
4051
+ cuMemsetD32_v2_ptds.restype = CUresult
4052
+ cuMemsetD32_v2_ptds.argtypes = [CUdeviceptr, ctypes.c_uint32, size_t]
3475
4053
  except AttributeError:
3476
4054
  pass
3477
4055
  try:
3478
- cuMemsetD2D8_v2 = _libraries['libcuda.so'].cuMemsetD2D8_v2
3479
- cuMemsetD2D8_v2.restype = CUresult
3480
- cuMemsetD2D8_v2.argtypes = [CUdeviceptr, size_t, ctypes.c_ubyte, size_t, size_t]
4056
+ cuMemsetD2D8_v2_ptds = _libraries['libcuda.so'].cuMemsetD2D8_v2_ptds
4057
+ cuMemsetD2D8_v2_ptds.restype = CUresult
4058
+ cuMemsetD2D8_v2_ptds.argtypes = [CUdeviceptr, size_t, ctypes.c_ubyte, size_t, size_t]
3481
4059
  except AttributeError:
3482
4060
  pass
3483
4061
  try:
3484
- cuMemsetD2D16_v2 = _libraries['libcuda.so'].cuMemsetD2D16_v2
3485
- cuMemsetD2D16_v2.restype = CUresult
3486
- cuMemsetD2D16_v2.argtypes = [CUdeviceptr, size_t, ctypes.c_uint16, size_t, size_t]
4062
+ cuMemsetD2D16_v2_ptds = _libraries['libcuda.so'].cuMemsetD2D16_v2_ptds
4063
+ cuMemsetD2D16_v2_ptds.restype = CUresult
4064
+ cuMemsetD2D16_v2_ptds.argtypes = [CUdeviceptr, size_t, ctypes.c_uint16, size_t, size_t]
3487
4065
  except AttributeError:
3488
4066
  pass
3489
4067
  try:
3490
- cuMemsetD2D32_v2 = _libraries['libcuda.so'].cuMemsetD2D32_v2
3491
- cuMemsetD2D32_v2.restype = CUresult
3492
- cuMemsetD2D32_v2.argtypes = [CUdeviceptr, size_t, ctypes.c_uint32, size_t, size_t]
4068
+ cuMemsetD2D32_v2_ptds = _libraries['libcuda.so'].cuMemsetD2D32_v2_ptds
4069
+ cuMemsetD2D32_v2_ptds.restype = CUresult
4070
+ cuMemsetD2D32_v2_ptds.argtypes = [CUdeviceptr, size_t, ctypes.c_uint32, size_t, size_t]
3493
4071
  except AttributeError:
3494
4072
  pass
3495
4073
  try:
3496
- cuMemsetD8Async = _libraries['libcuda.so'].cuMemsetD8Async
3497
- cuMemsetD8Async.restype = CUresult
3498
- cuMemsetD8Async.argtypes = [CUdeviceptr, ctypes.c_ubyte, size_t, CUstream]
4074
+ cuMemsetD8Async_ptsz = _libraries['libcuda.so'].cuMemsetD8Async_ptsz
4075
+ cuMemsetD8Async_ptsz.restype = CUresult
4076
+ cuMemsetD8Async_ptsz.argtypes = [CUdeviceptr, ctypes.c_ubyte, size_t, CUstream]
3499
4077
  except AttributeError:
3500
4078
  pass
3501
4079
  try:
3502
- cuMemsetD16Async = _libraries['libcuda.so'].cuMemsetD16Async
3503
- cuMemsetD16Async.restype = CUresult
3504
- cuMemsetD16Async.argtypes = [CUdeviceptr, ctypes.c_uint16, size_t, CUstream]
4080
+ cuMemsetD16Async_ptsz = _libraries['libcuda.so'].cuMemsetD16Async_ptsz
4081
+ cuMemsetD16Async_ptsz.restype = CUresult
4082
+ cuMemsetD16Async_ptsz.argtypes = [CUdeviceptr, ctypes.c_uint16, size_t, CUstream]
3505
4083
  except AttributeError:
3506
4084
  pass
3507
4085
  try:
3508
- cuMemsetD32Async = _libraries['libcuda.so'].cuMemsetD32Async
3509
- cuMemsetD32Async.restype = CUresult
3510
- cuMemsetD32Async.argtypes = [CUdeviceptr, ctypes.c_uint32, size_t, CUstream]
4086
+ cuMemsetD32Async_ptsz = _libraries['libcuda.so'].cuMemsetD32Async_ptsz
4087
+ cuMemsetD32Async_ptsz.restype = CUresult
4088
+ cuMemsetD32Async_ptsz.argtypes = [CUdeviceptr, ctypes.c_uint32, size_t, CUstream]
3511
4089
  except AttributeError:
3512
4090
  pass
3513
4091
  try:
3514
- cuMemsetD2D8Async = _libraries['libcuda.so'].cuMemsetD2D8Async
3515
- cuMemsetD2D8Async.restype = CUresult
3516
- cuMemsetD2D8Async.argtypes = [CUdeviceptr, size_t, ctypes.c_ubyte, size_t, size_t, CUstream]
4092
+ cuMemsetD2D8Async_ptsz = _libraries['libcuda.so'].cuMemsetD2D8Async_ptsz
4093
+ cuMemsetD2D8Async_ptsz.restype = CUresult
4094
+ cuMemsetD2D8Async_ptsz.argtypes = [CUdeviceptr, size_t, ctypes.c_ubyte, size_t, size_t, CUstream]
3517
4095
  except AttributeError:
3518
4096
  pass
3519
4097
  try:
3520
- cuMemsetD2D16Async = _libraries['libcuda.so'].cuMemsetD2D16Async
3521
- cuMemsetD2D16Async.restype = CUresult
3522
- cuMemsetD2D16Async.argtypes = [CUdeviceptr, size_t, ctypes.c_uint16, size_t, size_t, CUstream]
4098
+ cuMemsetD2D16Async_ptsz = _libraries['libcuda.so'].cuMemsetD2D16Async_ptsz
4099
+ cuMemsetD2D16Async_ptsz.restype = CUresult
4100
+ cuMemsetD2D16Async_ptsz.argtypes = [CUdeviceptr, size_t, ctypes.c_uint16, size_t, size_t, CUstream]
3523
4101
  except AttributeError:
3524
4102
  pass
3525
4103
  try:
3526
- cuMemsetD2D32Async = _libraries['libcuda.so'].cuMemsetD2D32Async
3527
- cuMemsetD2D32Async.restype = CUresult
3528
- cuMemsetD2D32Async.argtypes = [CUdeviceptr, size_t, ctypes.c_uint32, size_t, size_t, CUstream]
4104
+ cuMemsetD2D32Async_ptsz = _libraries['libcuda.so'].cuMemsetD2D32Async_ptsz
4105
+ cuMemsetD2D32Async_ptsz.restype = CUresult
4106
+ cuMemsetD2D32Async_ptsz.argtypes = [CUdeviceptr, size_t, ctypes.c_uint32, size_t, size_t, CUstream]
3529
4107
  except AttributeError:
3530
4108
  pass
3531
4109
  try:
@@ -3552,6 +4130,18 @@ try:
3552
4130
  cuMipmappedArrayGetSparseProperties.argtypes = [ctypes.POINTER(struct_CUDA_ARRAY_SPARSE_PROPERTIES_st), CUmipmappedArray]
3553
4131
  except AttributeError:
3554
4132
  pass
4133
+ try:
4134
+ cuArrayGetMemoryRequirements = _libraries['libcuda.so'].cuArrayGetMemoryRequirements
4135
+ cuArrayGetMemoryRequirements.restype = CUresult
4136
+ cuArrayGetMemoryRequirements.argtypes = [ctypes.POINTER(struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st), CUarray, CUdevice]
4137
+ except AttributeError:
4138
+ pass
4139
+ try:
4140
+ cuMipmappedArrayGetMemoryRequirements = _libraries['libcuda.so'].cuMipmappedArrayGetMemoryRequirements
4141
+ cuMipmappedArrayGetMemoryRequirements.restype = CUresult
4142
+ cuMipmappedArrayGetMemoryRequirements.argtypes = [ctypes.POINTER(struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st), CUmipmappedArray, CUdevice]
4143
+ except AttributeError:
4144
+ pass
3555
4145
  try:
3556
4146
  cuArrayGetPlane = _libraries['libcuda.so'].cuArrayGetPlane
3557
4147
  cuArrayGetPlane.restype = CUresult
@@ -3594,6 +4184,12 @@ try:
3594
4184
  cuMipmappedArrayDestroy.argtypes = [CUmipmappedArray]
3595
4185
  except AttributeError:
3596
4186
  pass
4187
+ try:
4188
+ cuMemGetHandleForAddressRange = _libraries['libcuda.so'].cuMemGetHandleForAddressRange
4189
+ cuMemGetHandleForAddressRange.restype = CUresult
4190
+ cuMemGetHandleForAddressRange.argtypes = [ctypes.POINTER(None), CUdeviceptr, size_t, CUmemRangeHandleType, ctypes.c_uint64]
4191
+ except AttributeError:
4192
+ pass
3597
4193
  try:
3598
4194
  cuMemAddressReserve = _libraries['libcuda.so'].cuMemAddressReserve
3599
4195
  cuMemAddressReserve.restype = CUresult
@@ -3625,9 +4221,9 @@ try:
3625
4221
  except AttributeError:
3626
4222
  pass
3627
4223
  try:
3628
- cuMemMapArrayAsync = _libraries['libcuda.so'].cuMemMapArrayAsync
3629
- cuMemMapArrayAsync.restype = CUresult
3630
- cuMemMapArrayAsync.argtypes = [ctypes.POINTER(struct_CUarrayMapInfo_st), ctypes.c_uint32, CUstream]
4224
+ cuMemMapArrayAsync_ptsz = _libraries['libcuda.so'].cuMemMapArrayAsync_ptsz
4225
+ cuMemMapArrayAsync_ptsz.restype = CUresult
4226
+ cuMemMapArrayAsync_ptsz.argtypes = [ctypes.POINTER(struct_CUarrayMapInfo_st), ctypes.c_uint32, CUstream]
3631
4227
  except AttributeError:
3632
4228
  pass
3633
4229
  try:
@@ -3679,15 +4275,15 @@ try:
3679
4275
  except AttributeError:
3680
4276
  pass
3681
4277
  try:
3682
- cuMemFreeAsync = _libraries['libcuda.so'].cuMemFreeAsync
3683
- cuMemFreeAsync.restype = CUresult
3684
- cuMemFreeAsync.argtypes = [CUdeviceptr, CUstream]
4278
+ cuMemFreeAsync_ptsz = _libraries['libcuda.so'].cuMemFreeAsync_ptsz
4279
+ cuMemFreeAsync_ptsz.restype = CUresult
4280
+ cuMemFreeAsync_ptsz.argtypes = [CUdeviceptr, CUstream]
3685
4281
  except AttributeError:
3686
4282
  pass
3687
4283
  try:
3688
- cuMemAllocAsync = _libraries['libcuda.so'].cuMemAllocAsync
3689
- cuMemAllocAsync.restype = CUresult
3690
- cuMemAllocAsync.argtypes = [ctypes.POINTER(ctypes.c_uint64), size_t, CUstream]
4284
+ cuMemAllocAsync_ptsz = _libraries['libcuda.so'].cuMemAllocAsync_ptsz
4285
+ cuMemAllocAsync_ptsz.restype = CUresult
4286
+ cuMemAllocAsync_ptsz.argtypes = [ctypes.POINTER(ctypes.c_uint64), size_t, CUstream]
3691
4287
  except AttributeError:
3692
4288
  pass
3693
4289
  try:
@@ -3733,9 +4329,9 @@ try:
3733
4329
  except AttributeError:
3734
4330
  pass
3735
4331
  try:
3736
- cuMemAllocFromPoolAsync = _libraries['libcuda.so'].cuMemAllocFromPoolAsync
3737
- cuMemAllocFromPoolAsync.restype = CUresult
3738
- cuMemAllocFromPoolAsync.argtypes = [ctypes.POINTER(ctypes.c_uint64), size_t, CUmemoryPool, CUstream]
4332
+ cuMemAllocFromPoolAsync_ptsz = _libraries['libcuda.so'].cuMemAllocFromPoolAsync_ptsz
4333
+ cuMemAllocFromPoolAsync_ptsz.restype = CUresult
4334
+ cuMemAllocFromPoolAsync_ptsz.argtypes = [ctypes.POINTER(ctypes.c_uint64), size_t, CUmemoryPool, CUstream]
3739
4335
  except AttributeError:
3740
4336
  pass
3741
4337
  try:
@@ -3769,9 +4365,9 @@ try:
3769
4365
  except AttributeError:
3770
4366
  pass
3771
4367
  try:
3772
- cuMemPrefetchAsync = _libraries['libcuda.so'].cuMemPrefetchAsync
3773
- cuMemPrefetchAsync.restype = CUresult
3774
- cuMemPrefetchAsync.argtypes = [CUdeviceptr, size_t, CUdevice, CUstream]
4368
+ cuMemPrefetchAsync_ptsz = _libraries['libcuda.so'].cuMemPrefetchAsync_ptsz
4369
+ cuMemPrefetchAsync_ptsz.restype = CUresult
4370
+ cuMemPrefetchAsync_ptsz.argtypes = [CUdeviceptr, size_t, CUdevice, CUstream]
3775
4371
  except AttributeError:
3776
4372
  pass
3777
4373
  try:
@@ -3817,93 +4413,93 @@ try:
3817
4413
  except AttributeError:
3818
4414
  pass
3819
4415
  try:
3820
- cuStreamGetPriority = _libraries['libcuda.so'].cuStreamGetPriority
3821
- cuStreamGetPriority.restype = CUresult
3822
- cuStreamGetPriority.argtypes = [CUstream, ctypes.POINTER(ctypes.c_int32)]
4416
+ cuStreamGetPriority_ptsz = _libraries['libcuda.so'].cuStreamGetPriority_ptsz
4417
+ cuStreamGetPriority_ptsz.restype = CUresult
4418
+ cuStreamGetPriority_ptsz.argtypes = [CUstream, ctypes.POINTER(ctypes.c_int32)]
3823
4419
  except AttributeError:
3824
4420
  pass
3825
4421
  try:
3826
- cuStreamGetFlags = _libraries['libcuda.so'].cuStreamGetFlags
3827
- cuStreamGetFlags.restype = CUresult
3828
- cuStreamGetFlags.argtypes = [CUstream, ctypes.POINTER(ctypes.c_uint32)]
4422
+ cuStreamGetFlags_ptsz = _libraries['libcuda.so'].cuStreamGetFlags_ptsz
4423
+ cuStreamGetFlags_ptsz.restype = CUresult
4424
+ cuStreamGetFlags_ptsz.argtypes = [CUstream, ctypes.POINTER(ctypes.c_uint32)]
3829
4425
  except AttributeError:
3830
4426
  pass
3831
4427
  try:
3832
- cuStreamGetCtx = _libraries['libcuda.so'].cuStreamGetCtx
3833
- cuStreamGetCtx.restype = CUresult
3834
- cuStreamGetCtx.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUctx_st))]
4428
+ cuStreamGetId_ptsz = _libraries['libcuda.so'].cuStreamGetId_ptsz
4429
+ cuStreamGetId_ptsz.restype = CUresult
4430
+ cuStreamGetId_ptsz.argtypes = [CUstream, ctypes.POINTER(ctypes.c_uint64)]
3835
4431
  except AttributeError:
3836
4432
  pass
3837
4433
  try:
3838
- cuStreamWaitEvent = _libraries['libcuda.so'].cuStreamWaitEvent
3839
- cuStreamWaitEvent.restype = CUresult
3840
- cuStreamWaitEvent.argtypes = [CUstream, CUevent, ctypes.c_uint32]
4434
+ cuStreamGetCtx_ptsz = _libraries['libcuda.so'].cuStreamGetCtx_ptsz
4435
+ cuStreamGetCtx_ptsz.restype = CUresult
4436
+ cuStreamGetCtx_ptsz.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUctx_st))]
3841
4437
  except AttributeError:
3842
4438
  pass
3843
4439
  try:
3844
- cuStreamAddCallback = _libraries['libcuda.so'].cuStreamAddCallback
3845
- cuStreamAddCallback.restype = CUresult
3846
- cuStreamAddCallback.argtypes = [CUstream, CUstreamCallback, ctypes.POINTER(None), ctypes.c_uint32]
4440
+ cuStreamWaitEvent_ptsz = _libraries['libcuda.so'].cuStreamWaitEvent_ptsz
4441
+ cuStreamWaitEvent_ptsz.restype = CUresult
4442
+ cuStreamWaitEvent_ptsz.argtypes = [CUstream, CUevent, ctypes.c_uint32]
3847
4443
  except AttributeError:
3848
4444
  pass
3849
4445
  try:
3850
- cuStreamBeginCapture_v2 = _libraries['libcuda.so'].cuStreamBeginCapture_v2
3851
- cuStreamBeginCapture_v2.restype = CUresult
3852
- cuStreamBeginCapture_v2.argtypes = [CUstream, CUstreamCaptureMode]
4446
+ cuStreamAddCallback_ptsz = _libraries['libcuda.so'].cuStreamAddCallback_ptsz
4447
+ cuStreamAddCallback_ptsz.restype = CUresult
4448
+ cuStreamAddCallback_ptsz.argtypes = [CUstream, CUstreamCallback, ctypes.POINTER(None), ctypes.c_uint32]
3853
4449
  except AttributeError:
3854
4450
  pass
3855
4451
  try:
3856
- cuThreadExchangeStreamCaptureMode = _libraries['libcuda.so'].cuThreadExchangeStreamCaptureMode
3857
- cuThreadExchangeStreamCaptureMode.restype = CUresult
3858
- cuThreadExchangeStreamCaptureMode.argtypes = [ctypes.POINTER(CUstreamCaptureMode_enum)]
4452
+ cuStreamBeginCapture_v2_ptsz = _libraries['libcuda.so'].cuStreamBeginCapture_v2_ptsz
4453
+ cuStreamBeginCapture_v2_ptsz.restype = CUresult
4454
+ cuStreamBeginCapture_v2_ptsz.argtypes = [CUstream, CUstreamCaptureMode]
3859
4455
  except AttributeError:
3860
4456
  pass
3861
4457
  try:
3862
- cuStreamEndCapture = _libraries['libcuda.so'].cuStreamEndCapture
3863
- cuStreamEndCapture.restype = CUresult
3864
- cuStreamEndCapture.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUgraph_st))]
4458
+ cuThreadExchangeStreamCaptureMode = _libraries['libcuda.so'].cuThreadExchangeStreamCaptureMode
4459
+ cuThreadExchangeStreamCaptureMode.restype = CUresult
4460
+ cuThreadExchangeStreamCaptureMode.argtypes = [ctypes.POINTER(CUstreamCaptureMode_enum)]
3865
4461
  except AttributeError:
3866
4462
  pass
3867
4463
  try:
3868
- cuStreamIsCapturing = _libraries['libcuda.so'].cuStreamIsCapturing
3869
- cuStreamIsCapturing.restype = CUresult
3870
- cuStreamIsCapturing.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum)]
4464
+ cuStreamEndCapture_ptsz = _libraries['libcuda.so'].cuStreamEndCapture_ptsz
4465
+ cuStreamEndCapture_ptsz.restype = CUresult
4466
+ cuStreamEndCapture_ptsz.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUgraph_st))]
3871
4467
  except AttributeError:
3872
4468
  pass
3873
4469
  try:
3874
- cuStreamGetCaptureInfo = _libraries['libcuda.so'].cuStreamGetCaptureInfo
3875
- cuStreamGetCaptureInfo.restype = CUresult
3876
- cuStreamGetCaptureInfo.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum), ctypes.POINTER(ctypes.c_uint64)]
4470
+ cuStreamIsCapturing_ptsz = _libraries['libcuda.so'].cuStreamIsCapturing_ptsz
4471
+ cuStreamIsCapturing_ptsz.restype = CUresult
4472
+ cuStreamIsCapturing_ptsz.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum)]
3877
4473
  except AttributeError:
3878
4474
  pass
3879
4475
  try:
3880
- cuStreamGetCaptureInfo_v2 = _libraries['libcuda.so'].cuStreamGetCaptureInfo_v2
3881
- cuStreamGetCaptureInfo_v2.restype = CUresult
3882
- cuStreamGetCaptureInfo_v2.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum), ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.POINTER(struct_CUgraph_st)), ctypes.POINTER(ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st))), ctypes.POINTER(ctypes.c_uint64)]
4476
+ cuStreamGetCaptureInfo_v2_ptsz = _libraries['libcuda.so'].cuStreamGetCaptureInfo_v2_ptsz
4477
+ cuStreamGetCaptureInfo_v2_ptsz.restype = CUresult
4478
+ cuStreamGetCaptureInfo_v2_ptsz.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum), ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.POINTER(struct_CUgraph_st)), ctypes.POINTER(ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st))), ctypes.POINTER(ctypes.c_uint64)]
3883
4479
  except AttributeError:
3884
4480
  pass
3885
4481
  try:
3886
- cuStreamUpdateCaptureDependencies = _libraries['libcuda.so'].cuStreamUpdateCaptureDependencies
3887
- cuStreamUpdateCaptureDependencies.restype = CUresult
3888
- cuStreamUpdateCaptureDependencies.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), size_t, ctypes.c_uint32]
4482
+ cuStreamUpdateCaptureDependencies_ptsz = _libraries['libcuda.so'].cuStreamUpdateCaptureDependencies_ptsz
4483
+ cuStreamUpdateCaptureDependencies_ptsz.restype = CUresult
4484
+ cuStreamUpdateCaptureDependencies_ptsz.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), size_t, ctypes.c_uint32]
3889
4485
  except AttributeError:
3890
4486
  pass
3891
4487
  try:
3892
- cuStreamAttachMemAsync = _libraries['libcuda.so'].cuStreamAttachMemAsync
3893
- cuStreamAttachMemAsync.restype = CUresult
3894
- cuStreamAttachMemAsync.argtypes = [CUstream, CUdeviceptr, size_t, ctypes.c_uint32]
4488
+ cuStreamAttachMemAsync_ptsz = _libraries['libcuda.so'].cuStreamAttachMemAsync_ptsz
4489
+ cuStreamAttachMemAsync_ptsz.restype = CUresult
4490
+ cuStreamAttachMemAsync_ptsz.argtypes = [CUstream, CUdeviceptr, size_t, ctypes.c_uint32]
3895
4491
  except AttributeError:
3896
4492
  pass
3897
4493
  try:
3898
- cuStreamQuery = _libraries['libcuda.so'].cuStreamQuery
3899
- cuStreamQuery.restype = CUresult
3900
- cuStreamQuery.argtypes = [CUstream]
4494
+ cuStreamQuery_ptsz = _libraries['libcuda.so'].cuStreamQuery_ptsz
4495
+ cuStreamQuery_ptsz.restype = CUresult
4496
+ cuStreamQuery_ptsz.argtypes = [CUstream]
3901
4497
  except AttributeError:
3902
4498
  pass
3903
4499
  try:
3904
- cuStreamSynchronize = _libraries['libcuda.so'].cuStreamSynchronize
3905
- cuStreamSynchronize.restype = CUresult
3906
- cuStreamSynchronize.argtypes = [CUstream]
4500
+ cuStreamSynchronize_ptsz = _libraries['libcuda.so'].cuStreamSynchronize_ptsz
4501
+ cuStreamSynchronize_ptsz.restype = CUresult
4502
+ cuStreamSynchronize_ptsz.argtypes = [CUstream]
3907
4503
  except AttributeError:
3908
4504
  pass
3909
4505
  try:
@@ -3913,21 +4509,21 @@ try:
3913
4509
  except AttributeError:
3914
4510
  pass
3915
4511
  try:
3916
- cuStreamCopyAttributes = _libraries['libcuda.so'].cuStreamCopyAttributes
3917
- cuStreamCopyAttributes.restype = CUresult
3918
- cuStreamCopyAttributes.argtypes = [CUstream, CUstream]
4512
+ cuStreamCopyAttributes_ptsz = _libraries['libcuda.so'].cuStreamCopyAttributes_ptsz
4513
+ cuStreamCopyAttributes_ptsz.restype = CUresult
4514
+ cuStreamCopyAttributes_ptsz.argtypes = [CUstream, CUstream]
3919
4515
  except AttributeError:
3920
4516
  pass
3921
4517
  try:
3922
- cuStreamGetAttribute = _libraries['libcuda.so'].cuStreamGetAttribute
3923
- cuStreamGetAttribute.restype = CUresult
3924
- cuStreamGetAttribute.argtypes = [CUstream, CUstreamAttrID, ctypes.POINTER(union_CUstreamAttrValue_union)]
4518
+ cuStreamGetAttribute_ptsz = _libraries['libcuda.so'].cuStreamGetAttribute_ptsz
4519
+ cuStreamGetAttribute_ptsz.restype = CUresult
4520
+ cuStreamGetAttribute_ptsz.argtypes = [CUstream, CUstreamAttrID, ctypes.POINTER(union_CUlaunchAttributeValue_union)]
3925
4521
  except AttributeError:
3926
4522
  pass
3927
4523
  try:
3928
- cuStreamSetAttribute = _libraries['libcuda.so'].cuStreamSetAttribute
3929
- cuStreamSetAttribute.restype = CUresult
3930
- cuStreamSetAttribute.argtypes = [CUstream, CUstreamAttrID, ctypes.POINTER(union_CUstreamAttrValue_union)]
4524
+ cuStreamSetAttribute_ptsz = _libraries['libcuda.so'].cuStreamSetAttribute_ptsz
4525
+ cuStreamSetAttribute_ptsz.restype = CUresult
4526
+ cuStreamSetAttribute_ptsz.argtypes = [CUstream, CUstreamAttrID, ctypes.POINTER(union_CUlaunchAttributeValue_union)]
3931
4527
  except AttributeError:
3932
4528
  pass
3933
4529
  try:
@@ -3937,15 +4533,15 @@ try:
3937
4533
  except AttributeError:
3938
4534
  pass
3939
4535
  try:
3940
- cuEventRecord = _libraries['libcuda.so'].cuEventRecord
3941
- cuEventRecord.restype = CUresult
3942
- cuEventRecord.argtypes = [CUevent, CUstream]
4536
+ cuEventRecord_ptsz = _libraries['libcuda.so'].cuEventRecord_ptsz
4537
+ cuEventRecord_ptsz.restype = CUresult
4538
+ cuEventRecord_ptsz.argtypes = [CUevent, CUstream]
3943
4539
  except AttributeError:
3944
4540
  pass
3945
4541
  try:
3946
- cuEventRecordWithFlags = _libraries['libcuda.so'].cuEventRecordWithFlags
3947
- cuEventRecordWithFlags.restype = CUresult
3948
- cuEventRecordWithFlags.argtypes = [CUevent, CUstream, ctypes.c_uint32]
4542
+ cuEventRecordWithFlags_ptsz = _libraries['libcuda.so'].cuEventRecordWithFlags_ptsz
4543
+ cuEventRecordWithFlags_ptsz.restype = CUresult
4544
+ cuEventRecordWithFlags_ptsz.argtypes = [CUevent, CUstream, ctypes.c_uint32]
3949
4545
  except AttributeError:
3950
4546
  pass
3951
4547
  try:
@@ -4003,15 +4599,15 @@ try:
4003
4599
  except AttributeError:
4004
4600
  pass
4005
4601
  try:
4006
- cuSignalExternalSemaphoresAsync = _libraries['libcuda.so'].cuSignalExternalSemaphoresAsync
4007
- cuSignalExternalSemaphoresAsync.restype = CUresult
4008
- cuSignalExternalSemaphoresAsync.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUextSemaphore_st)), ctypes.POINTER(struct_CUDA_EXTERNAL_SEMAPHORE_SIGNAL_PARAMS_st), ctypes.c_uint32, CUstream]
4602
+ cuSignalExternalSemaphoresAsync_ptsz = _libraries['libcuda.so'].cuSignalExternalSemaphoresAsync_ptsz
4603
+ cuSignalExternalSemaphoresAsync_ptsz.restype = CUresult
4604
+ cuSignalExternalSemaphoresAsync_ptsz.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUextSemaphore_st)), ctypes.POINTER(struct_CUDA_EXTERNAL_SEMAPHORE_SIGNAL_PARAMS_st), ctypes.c_uint32, CUstream]
4009
4605
  except AttributeError:
4010
4606
  pass
4011
4607
  try:
4012
- cuWaitExternalSemaphoresAsync = _libraries['libcuda.so'].cuWaitExternalSemaphoresAsync
4013
- cuWaitExternalSemaphoresAsync.restype = CUresult
4014
- cuWaitExternalSemaphoresAsync.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUextSemaphore_st)), ctypes.POINTER(struct_CUDA_EXTERNAL_SEMAPHORE_WAIT_PARAMS_st), ctypes.c_uint32, CUstream]
4608
+ cuWaitExternalSemaphoresAsync_ptsz = _libraries['libcuda.so'].cuWaitExternalSemaphoresAsync_ptsz
4609
+ cuWaitExternalSemaphoresAsync_ptsz.restype = CUresult
4610
+ cuWaitExternalSemaphoresAsync_ptsz.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUextSemaphore_st)), ctypes.POINTER(struct_CUDA_EXTERNAL_SEMAPHORE_WAIT_PARAMS_st), ctypes.c_uint32, CUstream]
4015
4611
  except AttributeError:
4016
4612
  pass
4017
4613
  try:
@@ -4021,33 +4617,33 @@ try:
4021
4617
  except AttributeError:
4022
4618
  pass
4023
4619
  try:
4024
- cuStreamWaitValue32 = _libraries['libcuda.so'].cuStreamWaitValue32
4025
- cuStreamWaitValue32.restype = CUresult
4026
- cuStreamWaitValue32.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
4620
+ cuStreamWaitValue32_v2_ptsz = _libraries['libcuda.so'].cuStreamWaitValue32_v2_ptsz
4621
+ cuStreamWaitValue32_v2_ptsz.restype = CUresult
4622
+ cuStreamWaitValue32_v2_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
4027
4623
  except AttributeError:
4028
4624
  pass
4029
4625
  try:
4030
- cuStreamWaitValue64 = _libraries['libcuda.so'].cuStreamWaitValue64
4031
- cuStreamWaitValue64.restype = CUresult
4032
- cuStreamWaitValue64.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
4626
+ cuStreamWaitValue64_v2_ptsz = _libraries['libcuda.so'].cuStreamWaitValue64_v2_ptsz
4627
+ cuStreamWaitValue64_v2_ptsz.restype = CUresult
4628
+ cuStreamWaitValue64_v2_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
4033
4629
  except AttributeError:
4034
4630
  pass
4035
4631
  try:
4036
- cuStreamWriteValue32 = _libraries['libcuda.so'].cuStreamWriteValue32
4037
- cuStreamWriteValue32.restype = CUresult
4038
- cuStreamWriteValue32.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
4632
+ cuStreamWriteValue32_v2_ptsz = _libraries['libcuda.so'].cuStreamWriteValue32_v2_ptsz
4633
+ cuStreamWriteValue32_v2_ptsz.restype = CUresult
4634
+ cuStreamWriteValue32_v2_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
4039
4635
  except AttributeError:
4040
4636
  pass
4041
4637
  try:
4042
- cuStreamWriteValue64 = _libraries['libcuda.so'].cuStreamWriteValue64
4043
- cuStreamWriteValue64.restype = CUresult
4044
- cuStreamWriteValue64.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
4638
+ cuStreamWriteValue64_v2_ptsz = _libraries['libcuda.so'].cuStreamWriteValue64_v2_ptsz
4639
+ cuStreamWriteValue64_v2_ptsz.restype = CUresult
4640
+ cuStreamWriteValue64_v2_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
4045
4641
  except AttributeError:
4046
4642
  pass
4047
4643
  try:
4048
- cuStreamBatchMemOp = _libraries['libcuda.so'].cuStreamBatchMemOp
4049
- cuStreamBatchMemOp.restype = CUresult
4050
- cuStreamBatchMemOp.argtypes = [CUstream, ctypes.c_uint32, ctypes.POINTER(union_CUstreamBatchMemOpParams_union), ctypes.c_uint32]
4644
+ cuStreamBatchMemOp_v2_ptsz = _libraries['libcuda.so'].cuStreamBatchMemOp_v2_ptsz
4645
+ cuStreamBatchMemOp_v2_ptsz.restype = CUresult
4646
+ cuStreamBatchMemOp_v2_ptsz.argtypes = [CUstream, ctypes.c_uint32, ctypes.POINTER(union_CUstreamBatchMemOpParams_union), ctypes.c_uint32]
4051
4647
  except AttributeError:
4052
4648
  pass
4053
4649
  try:
@@ -4081,15 +4677,21 @@ try:
4081
4677
  except AttributeError:
4082
4678
  pass
4083
4679
  try:
4084
- cuLaunchKernel = _libraries['libcuda.so'].cuLaunchKernel
4085
- cuLaunchKernel.restype = CUresult
4086
- cuLaunchKernel.argtypes = [CUfunction, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, CUstream, ctypes.POINTER(ctypes.POINTER(None)), ctypes.POINTER(ctypes.POINTER(None))]
4680
+ cuLaunchKernel_ptsz = _libraries['libcuda.so'].cuLaunchKernel_ptsz
4681
+ cuLaunchKernel_ptsz.restype = CUresult
4682
+ cuLaunchKernel_ptsz.argtypes = [CUfunction, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, CUstream, ctypes.POINTER(ctypes.POINTER(None)), ctypes.POINTER(ctypes.POINTER(None))]
4087
4683
  except AttributeError:
4088
4684
  pass
4089
4685
  try:
4090
- cuLaunchCooperativeKernel = _libraries['libcuda.so'].cuLaunchCooperativeKernel
4091
- cuLaunchCooperativeKernel.restype = CUresult
4092
- cuLaunchCooperativeKernel.argtypes = [CUfunction, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, CUstream, ctypes.POINTER(ctypes.POINTER(None))]
4686
+ cuLaunchKernelEx_ptsz = _libraries['libcuda.so'].cuLaunchKernelEx_ptsz
4687
+ cuLaunchKernelEx_ptsz.restype = CUresult
4688
+ cuLaunchKernelEx_ptsz.argtypes = [ctypes.POINTER(struct_CUlaunchConfig_st), CUfunction, ctypes.POINTER(ctypes.POINTER(None)), ctypes.POINTER(ctypes.POINTER(None))]
4689
+ except AttributeError:
4690
+ pass
4691
+ try:
4692
+ cuLaunchCooperativeKernel_ptsz = _libraries['libcuda.so'].cuLaunchCooperativeKernel_ptsz
4693
+ cuLaunchCooperativeKernel_ptsz.restype = CUresult
4694
+ cuLaunchCooperativeKernel_ptsz.argtypes = [CUfunction, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, CUstream, ctypes.POINTER(ctypes.POINTER(None))]
4093
4695
  except AttributeError:
4094
4696
  pass
4095
4697
  try:
@@ -4099,9 +4701,9 @@ try:
4099
4701
  except AttributeError:
4100
4702
  pass
4101
4703
  try:
4102
- cuLaunchHostFunc = _libraries['libcuda.so'].cuLaunchHostFunc
4103
- cuLaunchHostFunc.restype = CUresult
4104
- cuLaunchHostFunc.argtypes = [CUstream, CUhostFn, ctypes.POINTER(None)]
4704
+ cuLaunchHostFunc_ptsz = _libraries['libcuda.so'].cuLaunchHostFunc_ptsz
4705
+ cuLaunchHostFunc_ptsz.restype = CUresult
4706
+ cuLaunchHostFunc_ptsz.argtypes = [CUstream, CUhostFn, ctypes.POINTER(None)]
4105
4707
  except AttributeError:
4106
4708
  pass
4107
4709
  try:
@@ -4171,21 +4773,21 @@ try:
4171
4773
  except AttributeError:
4172
4774
  pass
4173
4775
  try:
4174
- cuGraphAddKernelNode = _libraries['libcuda.so'].cuGraphAddKernelNode
4175
- cuGraphAddKernelNode.restype = CUresult
4176
- cuGraphAddKernelNode.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), size_t, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
4776
+ cuGraphAddKernelNode_v2 = _libraries['libcuda.so'].cuGraphAddKernelNode_v2
4777
+ cuGraphAddKernelNode_v2.restype = CUresult
4778
+ cuGraphAddKernelNode_v2.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), size_t, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_v2_st)]
4177
4779
  except AttributeError:
4178
4780
  pass
4179
4781
  try:
4180
- cuGraphKernelNodeGetParams = _libraries['libcuda.so'].cuGraphKernelNodeGetParams
4181
- cuGraphKernelNodeGetParams.restype = CUresult
4182
- cuGraphKernelNodeGetParams.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
4782
+ cuGraphKernelNodeGetParams_v2 = _libraries['libcuda.so'].cuGraphKernelNodeGetParams_v2
4783
+ cuGraphKernelNodeGetParams_v2.restype = CUresult
4784
+ cuGraphKernelNodeGetParams_v2.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_v2_st)]
4183
4785
  except AttributeError:
4184
4786
  pass
4185
4787
  try:
4186
- cuGraphKernelNodeSetParams = _libraries['libcuda.so'].cuGraphKernelNodeSetParams
4187
- cuGraphKernelNodeSetParams.restype = CUresult
4188
- cuGraphKernelNodeSetParams.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
4788
+ cuGraphKernelNodeSetParams_v2 = _libraries['libcuda.so'].cuGraphKernelNodeSetParams_v2
4789
+ cuGraphKernelNodeSetParams_v2.restype = CUresult
4790
+ cuGraphKernelNodeSetParams_v2.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_v2_st)]
4189
4791
  except AttributeError:
4190
4792
  pass
4191
4793
  try:
@@ -4332,6 +4934,30 @@ try:
4332
4934
  cuGraphExternalSemaphoresWaitNodeSetParams.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_EXT_SEM_WAIT_NODE_PARAMS_st)]
4333
4935
  except AttributeError:
4334
4936
  pass
4937
+ try:
4938
+ cuGraphAddBatchMemOpNode = _libraries['libcuda.so'].cuGraphAddBatchMemOpNode
4939
+ cuGraphAddBatchMemOpNode.restype = CUresult
4940
+ cuGraphAddBatchMemOpNode.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), size_t, ctypes.POINTER(struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st)]
4941
+ except AttributeError:
4942
+ pass
4943
+ try:
4944
+ cuGraphBatchMemOpNodeGetParams = _libraries['libcuda.so'].cuGraphBatchMemOpNodeGetParams
4945
+ cuGraphBatchMemOpNodeGetParams.restype = CUresult
4946
+ cuGraphBatchMemOpNodeGetParams.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st)]
4947
+ except AttributeError:
4948
+ pass
4949
+ try:
4950
+ cuGraphBatchMemOpNodeSetParams = _libraries['libcuda.so'].cuGraphBatchMemOpNodeSetParams
4951
+ cuGraphBatchMemOpNodeSetParams.restype = CUresult
4952
+ cuGraphBatchMemOpNodeSetParams.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st)]
4953
+ except AttributeError:
4954
+ pass
4955
+ try:
4956
+ cuGraphExecBatchMemOpNodeSetParams = _libraries['libcuda.so'].cuGraphExecBatchMemOpNodeSetParams
4957
+ cuGraphExecBatchMemOpNodeSetParams.restype = CUresult
4958
+ cuGraphExecBatchMemOpNodeSetParams.argtypes = [CUgraphExec, CUgraphNode, ctypes.POINTER(struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st)]
4959
+ except AttributeError:
4960
+ pass
4335
4961
  try:
4336
4962
  cuGraphAddMemAllocNode = _libraries['libcuda.so'].cuGraphAddMemAllocNode
4337
4963
  cuGraphAddMemAllocNode.restype = CUresult
@@ -4440,12 +5066,6 @@ try:
4440
5066
  cuGraphDestroyNode.argtypes = [CUgraphNode]
4441
5067
  except AttributeError:
4442
5068
  pass
4443
- try:
4444
- cuGraphInstantiate_v2 = _libraries['libcuda.so'].cuGraphInstantiate_v2
4445
- cuGraphInstantiate_v2.restype = CUresult
4446
- cuGraphInstantiate_v2.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphExec_st)), CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), ctypes.POINTER(ctypes.c_char), size_t]
4447
- except AttributeError:
4448
- pass
4449
5069
  try:
4450
5070
  cuGraphInstantiateWithFlags = _libraries['libcuda.so'].cuGraphInstantiateWithFlags
4451
5071
  cuGraphInstantiateWithFlags.restype = CUresult
@@ -4453,9 +5073,21 @@ try:
4453
5073
  except AttributeError:
4454
5074
  pass
4455
5075
  try:
4456
- cuGraphExecKernelNodeSetParams = _libraries['libcuda.so'].cuGraphExecKernelNodeSetParams
4457
- cuGraphExecKernelNodeSetParams.restype = CUresult
4458
- cuGraphExecKernelNodeSetParams.argtypes = [CUgraphExec, CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
5076
+ cuGraphInstantiateWithParams_ptsz = _libraries['libcuda.so'].cuGraphInstantiateWithParams_ptsz
5077
+ cuGraphInstantiateWithParams_ptsz.restype = CUresult
5078
+ cuGraphInstantiateWithParams_ptsz.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphExec_st)), CUgraph, ctypes.POINTER(struct_CUDA_GRAPH_INSTANTIATE_PARAMS_st)]
5079
+ except AttributeError:
5080
+ pass
5081
+ try:
5082
+ cuGraphExecGetFlags = _libraries['libcuda.so'].cuGraphExecGetFlags
5083
+ cuGraphExecGetFlags.restype = CUresult
5084
+ cuGraphExecGetFlags.argtypes = [CUgraphExec, ctypes.POINTER(ctypes.c_uint64)]
5085
+ except AttributeError:
5086
+ pass
5087
+ try:
5088
+ cuGraphExecKernelNodeSetParams_v2 = _libraries['libcuda.so'].cuGraphExecKernelNodeSetParams_v2
5089
+ cuGraphExecKernelNodeSetParams_v2.restype = CUresult
5090
+ cuGraphExecKernelNodeSetParams_v2.argtypes = [CUgraphExec, CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_v2_st)]
4459
5091
  except AttributeError:
4460
5092
  pass
4461
5093
  try:
@@ -4507,15 +5139,27 @@ try:
4507
5139
  except AttributeError:
4508
5140
  pass
4509
5141
  try:
4510
- cuGraphUpload = _libraries['libcuda.so'].cuGraphUpload
4511
- cuGraphUpload.restype = CUresult
4512
- cuGraphUpload.argtypes = [CUgraphExec, CUstream]
5142
+ cuGraphNodeSetEnabled = _libraries['libcuda.so'].cuGraphNodeSetEnabled
5143
+ cuGraphNodeSetEnabled.restype = CUresult
5144
+ cuGraphNodeSetEnabled.argtypes = [CUgraphExec, CUgraphNode, ctypes.c_uint32]
4513
5145
  except AttributeError:
4514
5146
  pass
4515
5147
  try:
4516
- cuGraphLaunch = _libraries['libcuda.so'].cuGraphLaunch
4517
- cuGraphLaunch.restype = CUresult
4518
- cuGraphLaunch.argtypes = [CUgraphExec, CUstream]
5148
+ cuGraphNodeGetEnabled = _libraries['libcuda.so'].cuGraphNodeGetEnabled
5149
+ cuGraphNodeGetEnabled.restype = CUresult
5150
+ cuGraphNodeGetEnabled.argtypes = [CUgraphExec, CUgraphNode, ctypes.POINTER(ctypes.c_uint32)]
5151
+ except AttributeError:
5152
+ pass
5153
+ try:
5154
+ cuGraphUpload_ptsz = _libraries['libcuda.so'].cuGraphUpload_ptsz
5155
+ cuGraphUpload_ptsz.restype = CUresult
5156
+ cuGraphUpload_ptsz.argtypes = [CUgraphExec, CUstream]
5157
+ except AttributeError:
5158
+ pass
5159
+ try:
5160
+ cuGraphLaunch_ptsz = _libraries['libcuda.so'].cuGraphLaunch_ptsz
5161
+ cuGraphLaunch_ptsz.restype = CUresult
5162
+ cuGraphLaunch_ptsz.argtypes = [CUgraphExec, CUstream]
4519
5163
  except AttributeError:
4520
5164
  pass
4521
5165
  try:
@@ -4531,9 +5175,9 @@ try:
4531
5175
  except AttributeError:
4532
5176
  pass
4533
5177
  try:
4534
- cuGraphExecUpdate = _libraries['libcuda.so'].cuGraphExecUpdate
4535
- cuGraphExecUpdate.restype = CUresult
4536
- cuGraphExecUpdate.argtypes = [CUgraphExec, CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), ctypes.POINTER(CUgraphExecUpdateResult_enum)]
5178
+ cuGraphExecUpdate_v2 = _libraries['libcuda.so'].cuGraphExecUpdate_v2
5179
+ cuGraphExecUpdate_v2.restype = CUresult
5180
+ cuGraphExecUpdate_v2.argtypes = [CUgraphExec, CUgraph, ctypes.POINTER(struct_CUgraphExecUpdateResultInfo_st)]
4537
5181
  except AttributeError:
4538
5182
  pass
4539
5183
  try:
@@ -4545,13 +5189,13 @@ except AttributeError:
4545
5189
  try:
4546
5190
  cuGraphKernelNodeGetAttribute = _libraries['libcuda.so'].cuGraphKernelNodeGetAttribute
4547
5191
  cuGraphKernelNodeGetAttribute.restype = CUresult
4548
- cuGraphKernelNodeGetAttribute.argtypes = [CUgraphNode, CUkernelNodeAttrID, ctypes.POINTER(union_CUkernelNodeAttrValue_union)]
5192
+ cuGraphKernelNodeGetAttribute.argtypes = [CUgraphNode, CUkernelNodeAttrID, ctypes.POINTER(union_CUlaunchAttributeValue_union)]
4549
5193
  except AttributeError:
4550
5194
  pass
4551
5195
  try:
4552
5196
  cuGraphKernelNodeSetAttribute = _libraries['libcuda.so'].cuGraphKernelNodeSetAttribute
4553
5197
  cuGraphKernelNodeSetAttribute.restype = CUresult
4554
- cuGraphKernelNodeSetAttribute.argtypes = [CUgraphNode, CUkernelNodeAttrID, ctypes.POINTER(union_CUkernelNodeAttrValue_union)]
5198
+ cuGraphKernelNodeSetAttribute.argtypes = [CUgraphNode, CUkernelNodeAttrID, ctypes.POINTER(union_CUlaunchAttributeValue_union)]
4555
5199
  except AttributeError:
4556
5200
  pass
4557
5201
  try:
@@ -4620,6 +5264,18 @@ try:
4620
5264
  cuOccupancyAvailableDynamicSMemPerBlock.argtypes = [ctypes.POINTER(ctypes.c_uint64), CUfunction, ctypes.c_int32, ctypes.c_int32]
4621
5265
  except AttributeError:
4622
5266
  pass
5267
+ try:
5268
+ cuOccupancyMaxPotentialClusterSize = _libraries['libcuda.so'].cuOccupancyMaxPotentialClusterSize
5269
+ cuOccupancyMaxPotentialClusterSize.restype = CUresult
5270
+ cuOccupancyMaxPotentialClusterSize.argtypes = [ctypes.POINTER(ctypes.c_int32), CUfunction, ctypes.POINTER(struct_CUlaunchConfig_st)]
5271
+ except AttributeError:
5272
+ pass
5273
+ try:
5274
+ cuOccupancyMaxActiveClusters = _libraries['libcuda.so'].cuOccupancyMaxActiveClusters
5275
+ cuOccupancyMaxActiveClusters.restype = CUresult
5276
+ cuOccupancyMaxActiveClusters.argtypes = [ctypes.POINTER(ctypes.c_int32), CUfunction, ctypes.POINTER(struct_CUlaunchConfig_st)]
5277
+ except AttributeError:
5278
+ pass
4623
5279
  try:
4624
5280
  cuTexRefSetArray = _libraries['libcuda.so'].cuTexRefSetArray
4625
5281
  cuTexRefSetArray.restype = CUresult
@@ -4842,6 +5498,24 @@ try:
4842
5498
  cuSurfObjectGetResourceDesc.argtypes = [ctypes.POINTER(struct_CUDA_RESOURCE_DESC_st), CUsurfObject]
4843
5499
  except AttributeError:
4844
5500
  pass
5501
+ try:
5502
+ cuTensorMapEncodeTiled = _libraries['libcuda.so'].cuTensorMapEncodeTiled
5503
+ cuTensorMapEncodeTiled.restype = CUresult
5504
+ cuTensorMapEncodeTiled.argtypes = [ctypes.POINTER(struct_CUtensorMap_st), CUtensorMapDataType, cuuint32_t, ctypes.POINTER(None), ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.c_uint32), ctypes.POINTER(ctypes.c_uint32), CUtensorMapInterleave, CUtensorMapSwizzle, CUtensorMapL2promotion, CUtensorMapFloatOOBfill]
5505
+ except AttributeError:
5506
+ pass
5507
+ try:
5508
+ cuTensorMapEncodeIm2col = _libraries['libcuda.so'].cuTensorMapEncodeIm2col
5509
+ cuTensorMapEncodeIm2col.restype = CUresult
5510
+ cuTensorMapEncodeIm2col.argtypes = [ctypes.POINTER(struct_CUtensorMap_st), CUtensorMapDataType, cuuint32_t, ctypes.POINTER(None), ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.c_int32), ctypes.POINTER(ctypes.c_int32), cuuint32_t, cuuint32_t, ctypes.POINTER(ctypes.c_uint32), CUtensorMapInterleave, CUtensorMapSwizzle, CUtensorMapL2promotion, CUtensorMapFloatOOBfill]
5511
+ except AttributeError:
5512
+ pass
5513
+ try:
5514
+ cuTensorMapReplaceAddress = _libraries['libcuda.so'].cuTensorMapReplaceAddress
5515
+ cuTensorMapReplaceAddress.restype = CUresult
5516
+ cuTensorMapReplaceAddress.argtypes = [ctypes.POINTER(struct_CUtensorMap_st), ctypes.POINTER(None)]
5517
+ except AttributeError:
5518
+ pass
4845
5519
  try:
4846
5520
  cuDeviceCanAccessPeer = _libraries['libcuda.so'].cuDeviceCanAccessPeer
4847
5521
  cuDeviceCanAccessPeer.restype = CUresult
@@ -4897,21 +5571,21 @@ try:
4897
5571
  except AttributeError:
4898
5572
  pass
4899
5573
  try:
4900
- cuGraphicsMapResources = _libraries['libcuda.so'].cuGraphicsMapResources
4901
- cuGraphicsMapResources.restype = CUresult
4902
- cuGraphicsMapResources.argtypes = [ctypes.c_uint32, ctypes.POINTER(ctypes.POINTER(struct_CUgraphicsResource_st)), CUstream]
5574
+ cuGraphicsMapResources_ptsz = _libraries['libcuda.so'].cuGraphicsMapResources_ptsz
5575
+ cuGraphicsMapResources_ptsz.restype = CUresult
5576
+ cuGraphicsMapResources_ptsz.argtypes = [ctypes.c_uint32, ctypes.POINTER(ctypes.POINTER(struct_CUgraphicsResource_st)), CUstream]
4903
5577
  except AttributeError:
4904
5578
  pass
4905
5579
  try:
4906
- cuGraphicsUnmapResources = _libraries['libcuda.so'].cuGraphicsUnmapResources
4907
- cuGraphicsUnmapResources.restype = CUresult
4908
- cuGraphicsUnmapResources.argtypes = [ctypes.c_uint32, ctypes.POINTER(ctypes.POINTER(struct_CUgraphicsResource_st)), CUstream]
5580
+ cuGraphicsUnmapResources_ptsz = _libraries['libcuda.so'].cuGraphicsUnmapResources_ptsz
5581
+ cuGraphicsUnmapResources_ptsz.restype = CUresult
5582
+ cuGraphicsUnmapResources_ptsz.argtypes = [ctypes.c_uint32, ctypes.POINTER(ctypes.POINTER(struct_CUgraphicsResource_st)), CUstream]
4909
5583
  except AttributeError:
4910
5584
  pass
4911
5585
  try:
4912
- cuGetProcAddress = _libraries['libcuda.so'].cuGetProcAddress
4913
- cuGetProcAddress.restype = CUresult
4914
- cuGetProcAddress.argtypes = [ctypes.POINTER(ctypes.c_char), ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_int32, cuuint64_t]
5586
+ cuGetProcAddress_v2 = _libraries['libcuda.so'].cuGetProcAddress_v2
5587
+ cuGetProcAddress_v2.restype = CUresult
5588
+ cuGetProcAddress_v2.argtypes = [ctypes.POINTER(ctypes.c_char), ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_int32, cuuint64_t, ctypes.POINTER(CUdriverProcAddressQueryResult_enum)]
4915
5589
  except AttributeError:
4916
5590
  pass
4917
5591
  try:
@@ -4920,28 +5594,1056 @@ try:
4920
5594
  cuGetExportTable.argtypes = [ctypes.POINTER(ctypes.POINTER(None)), ctypes.POINTER(struct_CUuuid_st)]
4921
5595
  except AttributeError:
4922
5596
  pass
5597
+ try:
5598
+ cuMemHostRegister = _libraries['libcuda.so'].cuMemHostRegister
5599
+ cuMemHostRegister.restype = CUresult
5600
+ cuMemHostRegister.argtypes = [ctypes.POINTER(None), size_t, ctypes.c_uint32]
5601
+ except AttributeError:
5602
+ pass
5603
+ try:
5604
+ cuGraphicsResourceSetMapFlags = _libraries['libcuda.so'].cuGraphicsResourceSetMapFlags
5605
+ cuGraphicsResourceSetMapFlags.restype = CUresult
5606
+ cuGraphicsResourceSetMapFlags.argtypes = [CUgraphicsResource, ctypes.c_uint32]
5607
+ except AttributeError:
5608
+ pass
5609
+ try:
5610
+ cuLinkCreate = _libraries['libcuda.so'].cuLinkCreate
5611
+ cuLinkCreate.restype = CUresult
5612
+ cuLinkCreate.argtypes = [ctypes.c_uint32, ctypes.POINTER(CUjit_option_enum), ctypes.POINTER(ctypes.POINTER(None)), ctypes.POINTER(ctypes.POINTER(struct_CUlinkState_st))]
5613
+ except AttributeError:
5614
+ pass
5615
+ try:
5616
+ cuLinkAddData = _libraries['libcuda.so'].cuLinkAddData
5617
+ cuLinkAddData.restype = CUresult
5618
+ cuLinkAddData.argtypes = [CUlinkState, CUjitInputType, ctypes.POINTER(None), size_t, ctypes.POINTER(ctypes.c_char), ctypes.c_uint32, ctypes.POINTER(CUjit_option_enum), ctypes.POINTER(ctypes.POINTER(None))]
5619
+ except AttributeError:
5620
+ pass
5621
+ try:
5622
+ cuLinkAddFile = _libraries['libcuda.so'].cuLinkAddFile
5623
+ cuLinkAddFile.restype = CUresult
5624
+ cuLinkAddFile.argtypes = [CUlinkState, CUjitInputType, ctypes.POINTER(ctypes.c_char), ctypes.c_uint32, ctypes.POINTER(CUjit_option_enum), ctypes.POINTER(ctypes.POINTER(None))]
5625
+ except AttributeError:
5626
+ pass
5627
+ try:
5628
+ cuTexRefSetAddress2D_v2 = _libraries['libcuda.so'].cuTexRefSetAddress2D_v2
5629
+ cuTexRefSetAddress2D_v2.restype = CUresult
5630
+ cuTexRefSetAddress2D_v2.argtypes = [CUtexref, ctypes.POINTER(struct_CUDA_ARRAY_DESCRIPTOR_st), CUdeviceptr, size_t]
5631
+ except AttributeError:
5632
+ pass
5633
+ CUdeviceptr_v1 = ctypes.c_uint32
5634
+ class struct_CUDA_MEMCPY2D_v1_st(Structure):
5635
+ pass
5636
+
5637
+ struct_CUDA_MEMCPY2D_v1_st._pack_ = 1 # source:False
5638
+ struct_CUDA_MEMCPY2D_v1_st._fields_ = [
5639
+ ('srcXInBytes', ctypes.c_uint32),
5640
+ ('srcY', ctypes.c_uint32),
5641
+ ('srcMemoryType', CUmemorytype),
5642
+ ('PADDING_0', ctypes.c_ubyte * 4),
5643
+ ('srcHost', ctypes.POINTER(None)),
5644
+ ('srcDevice', ctypes.c_uint32),
5645
+ ('PADDING_1', ctypes.c_ubyte * 4),
5646
+ ('srcArray', ctypes.POINTER(struct_CUarray_st)),
5647
+ ('srcPitch', ctypes.c_uint32),
5648
+ ('dstXInBytes', ctypes.c_uint32),
5649
+ ('dstY', ctypes.c_uint32),
5650
+ ('dstMemoryType', CUmemorytype),
5651
+ ('dstHost', ctypes.POINTER(None)),
5652
+ ('dstDevice', ctypes.c_uint32),
5653
+ ('PADDING_2', ctypes.c_ubyte * 4),
5654
+ ('dstArray', ctypes.POINTER(struct_CUarray_st)),
5655
+ ('dstPitch', ctypes.c_uint32),
5656
+ ('WidthInBytes', ctypes.c_uint32),
5657
+ ('Height', ctypes.c_uint32),
5658
+ ('PADDING_3', ctypes.c_ubyte * 4),
5659
+ ]
5660
+
5661
+ CUDA_MEMCPY2D_v1 = struct_CUDA_MEMCPY2D_v1_st
5662
+ class struct_CUDA_MEMCPY3D_v1_st(Structure):
5663
+ pass
5664
+
5665
+ struct_CUDA_MEMCPY3D_v1_st._pack_ = 1 # source:False
5666
+ struct_CUDA_MEMCPY3D_v1_st._fields_ = [
5667
+ ('srcXInBytes', ctypes.c_uint32),
5668
+ ('srcY', ctypes.c_uint32),
5669
+ ('srcZ', ctypes.c_uint32),
5670
+ ('srcLOD', ctypes.c_uint32),
5671
+ ('srcMemoryType', CUmemorytype),
5672
+ ('PADDING_0', ctypes.c_ubyte * 4),
5673
+ ('srcHost', ctypes.POINTER(None)),
5674
+ ('srcDevice', ctypes.c_uint32),
5675
+ ('PADDING_1', ctypes.c_ubyte * 4),
5676
+ ('srcArray', ctypes.POINTER(struct_CUarray_st)),
5677
+ ('reserved0', ctypes.POINTER(None)),
5678
+ ('srcPitch', ctypes.c_uint32),
5679
+ ('srcHeight', ctypes.c_uint32),
5680
+ ('dstXInBytes', ctypes.c_uint32),
5681
+ ('dstY', ctypes.c_uint32),
5682
+ ('dstZ', ctypes.c_uint32),
5683
+ ('dstLOD', ctypes.c_uint32),
5684
+ ('dstMemoryType', CUmemorytype),
5685
+ ('PADDING_2', ctypes.c_ubyte * 4),
5686
+ ('dstHost', ctypes.POINTER(None)),
5687
+ ('dstDevice', ctypes.c_uint32),
5688
+ ('PADDING_3', ctypes.c_ubyte * 4),
5689
+ ('dstArray', ctypes.POINTER(struct_CUarray_st)),
5690
+ ('reserved1', ctypes.POINTER(None)),
5691
+ ('dstPitch', ctypes.c_uint32),
5692
+ ('dstHeight', ctypes.c_uint32),
5693
+ ('WidthInBytes', ctypes.c_uint32),
5694
+ ('Height', ctypes.c_uint32),
5695
+ ('Depth', ctypes.c_uint32),
5696
+ ('PADDING_4', ctypes.c_ubyte * 4),
5697
+ ]
5698
+
5699
+ CUDA_MEMCPY3D_v1 = struct_CUDA_MEMCPY3D_v1_st
5700
+ class struct_CUDA_ARRAY_DESCRIPTOR_v1_st(Structure):
5701
+ pass
5702
+
5703
+ struct_CUDA_ARRAY_DESCRIPTOR_v1_st._pack_ = 1 # source:False
5704
+ struct_CUDA_ARRAY_DESCRIPTOR_v1_st._fields_ = [
5705
+ ('Width', ctypes.c_uint32),
5706
+ ('Height', ctypes.c_uint32),
5707
+ ('Format', CUarray_format),
5708
+ ('NumChannels', ctypes.c_uint32),
5709
+ ]
5710
+
5711
+ CUDA_ARRAY_DESCRIPTOR_v1 = struct_CUDA_ARRAY_DESCRIPTOR_v1_st
5712
+ class struct_CUDA_ARRAY3D_DESCRIPTOR_v1_st(Structure):
5713
+ pass
5714
+
5715
+ struct_CUDA_ARRAY3D_DESCRIPTOR_v1_st._pack_ = 1 # source:False
5716
+ struct_CUDA_ARRAY3D_DESCRIPTOR_v1_st._fields_ = [
5717
+ ('Width', ctypes.c_uint32),
5718
+ ('Height', ctypes.c_uint32),
5719
+ ('Depth', ctypes.c_uint32),
5720
+ ('Format', CUarray_format),
5721
+ ('NumChannels', ctypes.c_uint32),
5722
+ ('Flags', ctypes.c_uint32),
5723
+ ]
5724
+
5725
+ CUDA_ARRAY3D_DESCRIPTOR_v1 = struct_CUDA_ARRAY3D_DESCRIPTOR_v1_st
5726
+ try:
5727
+ cuDeviceTotalMem = _libraries['libcuda.so'].cuDeviceTotalMem
5728
+ cuDeviceTotalMem.restype = CUresult
5729
+ cuDeviceTotalMem.argtypes = [ctypes.POINTER(ctypes.c_uint32), CUdevice]
5730
+ except AttributeError:
5731
+ pass
5732
+ try:
5733
+ cuCtxCreate = _libraries['libcuda.so'].cuCtxCreate
5734
+ cuCtxCreate.restype = CUresult
5735
+ cuCtxCreate.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUctx_st)), ctypes.c_uint32, CUdevice]
5736
+ except AttributeError:
5737
+ pass
5738
+ try:
5739
+ cuModuleGetGlobal = _libraries['libcuda.so'].cuModuleGetGlobal
5740
+ cuModuleGetGlobal.restype = CUresult
5741
+ cuModuleGetGlobal.argtypes = [ctypes.POINTER(ctypes.c_uint32), ctypes.POINTER(ctypes.c_uint32), CUmodule, ctypes.POINTER(ctypes.c_char)]
5742
+ except AttributeError:
5743
+ pass
5744
+ try:
5745
+ cuMemGetInfo = _libraries['libcuda.so'].cuMemGetInfo
5746
+ cuMemGetInfo.restype = CUresult
5747
+ cuMemGetInfo.argtypes = [ctypes.POINTER(ctypes.c_uint32), ctypes.POINTER(ctypes.c_uint32)]
5748
+ except AttributeError:
5749
+ pass
5750
+ try:
5751
+ cuMemAlloc = _libraries['libcuda.so'].cuMemAlloc
5752
+ cuMemAlloc.restype = CUresult
5753
+ cuMemAlloc.argtypes = [ctypes.POINTER(ctypes.c_uint32), ctypes.c_uint32]
5754
+ except AttributeError:
5755
+ pass
5756
+ try:
5757
+ cuMemAllocPitch = _libraries['libcuda.so'].cuMemAllocPitch
5758
+ cuMemAllocPitch.restype = CUresult
5759
+ cuMemAllocPitch.argtypes = [ctypes.POINTER(ctypes.c_uint32), ctypes.POINTER(ctypes.c_uint32), ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32]
5760
+ except AttributeError:
5761
+ pass
5762
+ try:
5763
+ cuMemFree = _libraries['libcuda.so'].cuMemFree
5764
+ cuMemFree.restype = CUresult
5765
+ cuMemFree.argtypes = [CUdeviceptr_v1]
5766
+ except AttributeError:
5767
+ pass
5768
+ try:
5769
+ cuMemGetAddressRange = _libraries['libcuda.so'].cuMemGetAddressRange
5770
+ cuMemGetAddressRange.restype = CUresult
5771
+ cuMemGetAddressRange.argtypes = [ctypes.POINTER(ctypes.c_uint32), ctypes.POINTER(ctypes.c_uint32), CUdeviceptr_v1]
5772
+ except AttributeError:
5773
+ pass
5774
+ try:
5775
+ cuMemAllocHost = _libraries['libcuda.so'].cuMemAllocHost
5776
+ cuMemAllocHost.restype = CUresult
5777
+ cuMemAllocHost.argtypes = [ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_uint32]
5778
+ except AttributeError:
5779
+ pass
5780
+ try:
5781
+ cuMemHostGetDevicePointer = _libraries['libcuda.so'].cuMemHostGetDevicePointer
5782
+ cuMemHostGetDevicePointer.restype = CUresult
5783
+ cuMemHostGetDevicePointer.argtypes = [ctypes.POINTER(ctypes.c_uint32), ctypes.POINTER(None), ctypes.c_uint32]
5784
+ except AttributeError:
5785
+ pass
5786
+ try:
5787
+ cuMemcpyHtoD = _libraries['libcuda.so'].cuMemcpyHtoD
5788
+ cuMemcpyHtoD.restype = CUresult
5789
+ cuMemcpyHtoD.argtypes = [CUdeviceptr_v1, ctypes.POINTER(None), ctypes.c_uint32]
5790
+ except AttributeError:
5791
+ pass
5792
+ try:
5793
+ cuMemcpyDtoH = _libraries['libcuda.so'].cuMemcpyDtoH
5794
+ cuMemcpyDtoH.restype = CUresult
5795
+ cuMemcpyDtoH.argtypes = [ctypes.POINTER(None), CUdeviceptr_v1, ctypes.c_uint32]
5796
+ except AttributeError:
5797
+ pass
5798
+ try:
5799
+ cuMemcpyDtoD = _libraries['libcuda.so'].cuMemcpyDtoD
5800
+ cuMemcpyDtoD.restype = CUresult
5801
+ cuMemcpyDtoD.argtypes = [CUdeviceptr_v1, CUdeviceptr_v1, ctypes.c_uint32]
5802
+ except AttributeError:
5803
+ pass
5804
+ try:
5805
+ cuMemcpyDtoA = _libraries['libcuda.so'].cuMemcpyDtoA
5806
+ cuMemcpyDtoA.restype = CUresult
5807
+ cuMemcpyDtoA.argtypes = [CUarray, ctypes.c_uint32, CUdeviceptr_v1, ctypes.c_uint32]
5808
+ except AttributeError:
5809
+ pass
5810
+ try:
5811
+ cuMemcpyAtoD = _libraries['libcuda.so'].cuMemcpyAtoD
5812
+ cuMemcpyAtoD.restype = CUresult
5813
+ cuMemcpyAtoD.argtypes = [CUdeviceptr_v1, CUarray, ctypes.c_uint32, ctypes.c_uint32]
5814
+ except AttributeError:
5815
+ pass
5816
+ try:
5817
+ cuMemcpyHtoA = _libraries['libcuda.so'].cuMemcpyHtoA
5818
+ cuMemcpyHtoA.restype = CUresult
5819
+ cuMemcpyHtoA.argtypes = [CUarray, ctypes.c_uint32, ctypes.POINTER(None), ctypes.c_uint32]
5820
+ except AttributeError:
5821
+ pass
5822
+ try:
5823
+ cuMemcpyAtoH = _libraries['libcuda.so'].cuMemcpyAtoH
5824
+ cuMemcpyAtoH.restype = CUresult
5825
+ cuMemcpyAtoH.argtypes = [ctypes.POINTER(None), CUarray, ctypes.c_uint32, ctypes.c_uint32]
5826
+ except AttributeError:
5827
+ pass
5828
+ try:
5829
+ cuMemcpyAtoA = _libraries['libcuda.so'].cuMemcpyAtoA
5830
+ cuMemcpyAtoA.restype = CUresult
5831
+ cuMemcpyAtoA.argtypes = [CUarray, ctypes.c_uint32, CUarray, ctypes.c_uint32, ctypes.c_uint32]
5832
+ except AttributeError:
5833
+ pass
5834
+ try:
5835
+ cuMemcpyHtoAAsync = _libraries['libcuda.so'].cuMemcpyHtoAAsync
5836
+ cuMemcpyHtoAAsync.restype = CUresult
5837
+ cuMemcpyHtoAAsync.argtypes = [CUarray, ctypes.c_uint32, ctypes.POINTER(None), ctypes.c_uint32, CUstream]
5838
+ except AttributeError:
5839
+ pass
5840
+ try:
5841
+ cuMemcpyAtoHAsync = _libraries['libcuda.so'].cuMemcpyAtoHAsync
5842
+ cuMemcpyAtoHAsync.restype = CUresult
5843
+ cuMemcpyAtoHAsync.argtypes = [ctypes.POINTER(None), CUarray, ctypes.c_uint32, ctypes.c_uint32, CUstream]
5844
+ except AttributeError:
5845
+ pass
5846
+ try:
5847
+ cuMemcpy2D = _libraries['libcuda.so'].cuMemcpy2D
5848
+ cuMemcpy2D.restype = CUresult
5849
+ cuMemcpy2D.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_v1_st)]
5850
+ except AttributeError:
5851
+ pass
5852
+ try:
5853
+ cuMemcpy2DUnaligned = _libraries['libcuda.so'].cuMemcpy2DUnaligned
5854
+ cuMemcpy2DUnaligned.restype = CUresult
5855
+ cuMemcpy2DUnaligned.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_v1_st)]
5856
+ except AttributeError:
5857
+ pass
5858
+ try:
5859
+ cuMemcpy3D = _libraries['libcuda.so'].cuMemcpy3D
5860
+ cuMemcpy3D.restype = CUresult
5861
+ cuMemcpy3D.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_v1_st)]
5862
+ except AttributeError:
5863
+ pass
5864
+ try:
5865
+ cuMemcpyHtoDAsync = _libraries['libcuda.so'].cuMemcpyHtoDAsync
5866
+ cuMemcpyHtoDAsync.restype = CUresult
5867
+ cuMemcpyHtoDAsync.argtypes = [CUdeviceptr_v1, ctypes.POINTER(None), ctypes.c_uint32, CUstream]
5868
+ except AttributeError:
5869
+ pass
5870
+ try:
5871
+ cuMemcpyDtoHAsync = _libraries['libcuda.so'].cuMemcpyDtoHAsync
5872
+ cuMemcpyDtoHAsync.restype = CUresult
5873
+ cuMemcpyDtoHAsync.argtypes = [ctypes.POINTER(None), CUdeviceptr_v1, ctypes.c_uint32, CUstream]
5874
+ except AttributeError:
5875
+ pass
5876
+ try:
5877
+ cuMemcpyDtoDAsync = _libraries['libcuda.so'].cuMemcpyDtoDAsync
5878
+ cuMemcpyDtoDAsync.restype = CUresult
5879
+ cuMemcpyDtoDAsync.argtypes = [CUdeviceptr_v1, CUdeviceptr_v1, ctypes.c_uint32, CUstream]
5880
+ except AttributeError:
5881
+ pass
5882
+ try:
5883
+ cuMemcpy2DAsync = _libraries['libcuda.so'].cuMemcpy2DAsync
5884
+ cuMemcpy2DAsync.restype = CUresult
5885
+ cuMemcpy2DAsync.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_v1_st), CUstream]
5886
+ except AttributeError:
5887
+ pass
5888
+ try:
5889
+ cuMemcpy3DAsync = _libraries['libcuda.so'].cuMemcpy3DAsync
5890
+ cuMemcpy3DAsync.restype = CUresult
5891
+ cuMemcpy3DAsync.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_v1_st), CUstream]
5892
+ except AttributeError:
5893
+ pass
5894
+ try:
5895
+ cuMemsetD8 = _libraries['libcuda.so'].cuMemsetD8
5896
+ cuMemsetD8.restype = CUresult
5897
+ cuMemsetD8.argtypes = [CUdeviceptr_v1, ctypes.c_ubyte, ctypes.c_uint32]
5898
+ except AttributeError:
5899
+ pass
5900
+ try:
5901
+ cuMemsetD16 = _libraries['libcuda.so'].cuMemsetD16
5902
+ cuMemsetD16.restype = CUresult
5903
+ cuMemsetD16.argtypes = [CUdeviceptr_v1, ctypes.c_uint16, ctypes.c_uint32]
5904
+ except AttributeError:
5905
+ pass
5906
+ try:
5907
+ cuMemsetD32 = _libraries['libcuda.so'].cuMemsetD32
5908
+ cuMemsetD32.restype = CUresult
5909
+ cuMemsetD32.argtypes = [CUdeviceptr_v1, ctypes.c_uint32, ctypes.c_uint32]
5910
+ except AttributeError:
5911
+ pass
5912
+ try:
5913
+ cuMemsetD2D8 = _libraries['libcuda.so'].cuMemsetD2D8
5914
+ cuMemsetD2D8.restype = CUresult
5915
+ cuMemsetD2D8.argtypes = [CUdeviceptr_v1, ctypes.c_uint32, ctypes.c_ubyte, ctypes.c_uint32, ctypes.c_uint32]
5916
+ except AttributeError:
5917
+ pass
5918
+ try:
5919
+ cuMemsetD2D16 = _libraries['libcuda.so'].cuMemsetD2D16
5920
+ cuMemsetD2D16.restype = CUresult
5921
+ cuMemsetD2D16.argtypes = [CUdeviceptr_v1, ctypes.c_uint32, ctypes.c_uint16, ctypes.c_uint32, ctypes.c_uint32]
5922
+ except AttributeError:
5923
+ pass
5924
+ try:
5925
+ cuMemsetD2D32 = _libraries['libcuda.so'].cuMemsetD2D32
5926
+ cuMemsetD2D32.restype = CUresult
5927
+ cuMemsetD2D32.argtypes = [CUdeviceptr_v1, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32]
5928
+ except AttributeError:
5929
+ pass
5930
+ try:
5931
+ cuArrayCreate = _libraries['libcuda.so'].cuArrayCreate
5932
+ cuArrayCreate.restype = CUresult
5933
+ cuArrayCreate.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUarray_st)), ctypes.POINTER(struct_CUDA_ARRAY_DESCRIPTOR_v1_st)]
5934
+ except AttributeError:
5935
+ pass
5936
+ try:
5937
+ cuArrayGetDescriptor = _libraries['libcuda.so'].cuArrayGetDescriptor
5938
+ cuArrayGetDescriptor.restype = CUresult
5939
+ cuArrayGetDescriptor.argtypes = [ctypes.POINTER(struct_CUDA_ARRAY_DESCRIPTOR_v1_st), CUarray]
5940
+ except AttributeError:
5941
+ pass
5942
+ try:
5943
+ cuArray3DCreate = _libraries['libcuda.so'].cuArray3DCreate
5944
+ cuArray3DCreate.restype = CUresult
5945
+ cuArray3DCreate.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUarray_st)), ctypes.POINTER(struct_CUDA_ARRAY3D_DESCRIPTOR_v1_st)]
5946
+ except AttributeError:
5947
+ pass
5948
+ try:
5949
+ cuArray3DGetDescriptor = _libraries['libcuda.so'].cuArray3DGetDescriptor
5950
+ cuArray3DGetDescriptor.restype = CUresult
5951
+ cuArray3DGetDescriptor.argtypes = [ctypes.POINTER(struct_CUDA_ARRAY3D_DESCRIPTOR_v1_st), CUarray]
5952
+ except AttributeError:
5953
+ pass
5954
+ try:
5955
+ cuTexRefSetAddress = _libraries['libcuda.so'].cuTexRefSetAddress
5956
+ cuTexRefSetAddress.restype = CUresult
5957
+ cuTexRefSetAddress.argtypes = [ctypes.POINTER(ctypes.c_uint32), CUtexref, CUdeviceptr_v1, ctypes.c_uint32]
5958
+ except AttributeError:
5959
+ pass
5960
+ try:
5961
+ cuTexRefSetAddress2D = _libraries['libcuda.so'].cuTexRefSetAddress2D
5962
+ cuTexRefSetAddress2D.restype = CUresult
5963
+ cuTexRefSetAddress2D.argtypes = [CUtexref, ctypes.POINTER(struct_CUDA_ARRAY_DESCRIPTOR_v1_st), CUdeviceptr_v1, ctypes.c_uint32]
5964
+ except AttributeError:
5965
+ pass
5966
+ try:
5967
+ cuTexRefGetAddress = _libraries['libcuda.so'].cuTexRefGetAddress
5968
+ cuTexRefGetAddress.restype = CUresult
5969
+ cuTexRefGetAddress.argtypes = [ctypes.POINTER(ctypes.c_uint32), CUtexref]
5970
+ except AttributeError:
5971
+ pass
5972
+ try:
5973
+ cuGraphicsResourceGetMappedPointer = _libraries['libcuda.so'].cuGraphicsResourceGetMappedPointer
5974
+ cuGraphicsResourceGetMappedPointer.restype = CUresult
5975
+ cuGraphicsResourceGetMappedPointer.argtypes = [ctypes.POINTER(ctypes.c_uint32), ctypes.POINTER(ctypes.c_uint32), CUgraphicsResource]
5976
+ except AttributeError:
5977
+ pass
5978
+ try:
5979
+ cuCtxDestroy = _libraries['libcuda.so'].cuCtxDestroy
5980
+ cuCtxDestroy.restype = CUresult
5981
+ cuCtxDestroy.argtypes = [CUcontext]
5982
+ except AttributeError:
5983
+ pass
5984
+ try:
5985
+ cuCtxPopCurrent = _libraries['libcuda.so'].cuCtxPopCurrent
5986
+ cuCtxPopCurrent.restype = CUresult
5987
+ cuCtxPopCurrent.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUctx_st))]
5988
+ except AttributeError:
5989
+ pass
5990
+ try:
5991
+ cuCtxPushCurrent = _libraries['libcuda.so'].cuCtxPushCurrent
5992
+ cuCtxPushCurrent.restype = CUresult
5993
+ cuCtxPushCurrent.argtypes = [CUcontext]
5994
+ except AttributeError:
5995
+ pass
5996
+ try:
5997
+ cuStreamDestroy = _libraries['libcuda.so'].cuStreamDestroy
5998
+ cuStreamDestroy.restype = CUresult
5999
+ cuStreamDestroy.argtypes = [CUstream]
6000
+ except AttributeError:
6001
+ pass
6002
+ try:
6003
+ cuEventDestroy = _libraries['libcuda.so'].cuEventDestroy
6004
+ cuEventDestroy.restype = CUresult
6005
+ cuEventDestroy.argtypes = [CUevent]
6006
+ except AttributeError:
6007
+ pass
6008
+ try:
6009
+ cuDevicePrimaryCtxRelease = _libraries['libcuda.so'].cuDevicePrimaryCtxRelease
6010
+ cuDevicePrimaryCtxRelease.restype = CUresult
6011
+ cuDevicePrimaryCtxRelease.argtypes = [CUdevice]
6012
+ except AttributeError:
6013
+ pass
6014
+ try:
6015
+ cuDevicePrimaryCtxReset = _libraries['libcuda.so'].cuDevicePrimaryCtxReset
6016
+ cuDevicePrimaryCtxReset.restype = CUresult
6017
+ cuDevicePrimaryCtxReset.argtypes = [CUdevice]
6018
+ except AttributeError:
6019
+ pass
6020
+ try:
6021
+ cuDevicePrimaryCtxSetFlags = _libraries['libcuda.so'].cuDevicePrimaryCtxSetFlags
6022
+ cuDevicePrimaryCtxSetFlags.restype = CUresult
6023
+ cuDevicePrimaryCtxSetFlags.argtypes = [CUdevice, ctypes.c_uint32]
6024
+ except AttributeError:
6025
+ pass
6026
+ try:
6027
+ cuMemcpyHtoD_v2 = _libraries['libcuda.so'].cuMemcpyHtoD_v2
6028
+ cuMemcpyHtoD_v2.restype = CUresult
6029
+ cuMemcpyHtoD_v2.argtypes = [CUdeviceptr, ctypes.POINTER(None), size_t]
6030
+ except AttributeError:
6031
+ pass
6032
+ try:
6033
+ cuMemcpyDtoH_v2 = _libraries['libcuda.so'].cuMemcpyDtoH_v2
6034
+ cuMemcpyDtoH_v2.restype = CUresult
6035
+ cuMemcpyDtoH_v2.argtypes = [ctypes.POINTER(None), CUdeviceptr, size_t]
6036
+ except AttributeError:
6037
+ pass
6038
+ try:
6039
+ cuMemcpyDtoD_v2 = _libraries['libcuda.so'].cuMemcpyDtoD_v2
6040
+ cuMemcpyDtoD_v2.restype = CUresult
6041
+ cuMemcpyDtoD_v2.argtypes = [CUdeviceptr, CUdeviceptr, size_t]
6042
+ except AttributeError:
6043
+ pass
6044
+ try:
6045
+ cuMemcpyDtoA_v2 = _libraries['libcuda.so'].cuMemcpyDtoA_v2
6046
+ cuMemcpyDtoA_v2.restype = CUresult
6047
+ cuMemcpyDtoA_v2.argtypes = [CUarray, size_t, CUdeviceptr, size_t]
6048
+ except AttributeError:
6049
+ pass
6050
+ try:
6051
+ cuMemcpyAtoD_v2 = _libraries['libcuda.so'].cuMemcpyAtoD_v2
6052
+ cuMemcpyAtoD_v2.restype = CUresult
6053
+ cuMemcpyAtoD_v2.argtypes = [CUdeviceptr, CUarray, size_t, size_t]
6054
+ except AttributeError:
6055
+ pass
6056
+ try:
6057
+ cuMemcpyHtoA_v2 = _libraries['libcuda.so'].cuMemcpyHtoA_v2
6058
+ cuMemcpyHtoA_v2.restype = CUresult
6059
+ cuMemcpyHtoA_v2.argtypes = [CUarray, size_t, ctypes.POINTER(None), size_t]
6060
+ except AttributeError:
6061
+ pass
6062
+ try:
6063
+ cuMemcpyAtoH_v2 = _libraries['libcuda.so'].cuMemcpyAtoH_v2
6064
+ cuMemcpyAtoH_v2.restype = CUresult
6065
+ cuMemcpyAtoH_v2.argtypes = [ctypes.POINTER(None), CUarray, size_t, size_t]
6066
+ except AttributeError:
6067
+ pass
6068
+ try:
6069
+ cuMemcpyAtoA_v2 = _libraries['libcuda.so'].cuMemcpyAtoA_v2
6070
+ cuMemcpyAtoA_v2.restype = CUresult
6071
+ cuMemcpyAtoA_v2.argtypes = [CUarray, size_t, CUarray, size_t, size_t]
6072
+ except AttributeError:
6073
+ pass
6074
+ try:
6075
+ cuMemcpyHtoAAsync_v2 = _libraries['libcuda.so'].cuMemcpyHtoAAsync_v2
6076
+ cuMemcpyHtoAAsync_v2.restype = CUresult
6077
+ cuMemcpyHtoAAsync_v2.argtypes = [CUarray, size_t, ctypes.POINTER(None), size_t, CUstream]
6078
+ except AttributeError:
6079
+ pass
6080
+ try:
6081
+ cuMemcpyAtoHAsync_v2 = _libraries['libcuda.so'].cuMemcpyAtoHAsync_v2
6082
+ cuMemcpyAtoHAsync_v2.restype = CUresult
6083
+ cuMemcpyAtoHAsync_v2.argtypes = [ctypes.POINTER(None), CUarray, size_t, size_t, CUstream]
6084
+ except AttributeError:
6085
+ pass
6086
+ try:
6087
+ cuMemcpy2D_v2 = _libraries['libcuda.so'].cuMemcpy2D_v2
6088
+ cuMemcpy2D_v2.restype = CUresult
6089
+ cuMemcpy2D_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st)]
6090
+ except AttributeError:
6091
+ pass
6092
+ try:
6093
+ cuMemcpy2DUnaligned_v2 = _libraries['libcuda.so'].cuMemcpy2DUnaligned_v2
6094
+ cuMemcpy2DUnaligned_v2.restype = CUresult
6095
+ cuMemcpy2DUnaligned_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st)]
6096
+ except AttributeError:
6097
+ pass
6098
+ try:
6099
+ cuMemcpy3D_v2 = _libraries['libcuda.so'].cuMemcpy3D_v2
6100
+ cuMemcpy3D_v2.restype = CUresult
6101
+ cuMemcpy3D_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_st)]
6102
+ except AttributeError:
6103
+ pass
6104
+ try:
6105
+ cuMemcpyHtoDAsync_v2 = _libraries['libcuda.so'].cuMemcpyHtoDAsync_v2
6106
+ cuMemcpyHtoDAsync_v2.restype = CUresult
6107
+ cuMemcpyHtoDAsync_v2.argtypes = [CUdeviceptr, ctypes.POINTER(None), size_t, CUstream]
6108
+ except AttributeError:
6109
+ pass
6110
+ try:
6111
+ cuMemcpyDtoHAsync_v2 = _libraries['libcuda.so'].cuMemcpyDtoHAsync_v2
6112
+ cuMemcpyDtoHAsync_v2.restype = CUresult
6113
+ cuMemcpyDtoHAsync_v2.argtypes = [ctypes.POINTER(None), CUdeviceptr, size_t, CUstream]
6114
+ except AttributeError:
6115
+ pass
6116
+ try:
6117
+ cuMemcpyDtoDAsync_v2 = _libraries['libcuda.so'].cuMemcpyDtoDAsync_v2
6118
+ cuMemcpyDtoDAsync_v2.restype = CUresult
6119
+ cuMemcpyDtoDAsync_v2.argtypes = [CUdeviceptr, CUdeviceptr, size_t, CUstream]
6120
+ except AttributeError:
6121
+ pass
6122
+ try:
6123
+ cuMemcpy2DAsync_v2 = _libraries['libcuda.so'].cuMemcpy2DAsync_v2
6124
+ cuMemcpy2DAsync_v2.restype = CUresult
6125
+ cuMemcpy2DAsync_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY2D_st), CUstream]
6126
+ except AttributeError:
6127
+ pass
6128
+ try:
6129
+ cuMemcpy3DAsync_v2 = _libraries['libcuda.so'].cuMemcpy3DAsync_v2
6130
+ cuMemcpy3DAsync_v2.restype = CUresult
6131
+ cuMemcpy3DAsync_v2.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_st), CUstream]
6132
+ except AttributeError:
6133
+ pass
6134
+ try:
6135
+ cuMemsetD8_v2 = _libraries['libcuda.so'].cuMemsetD8_v2
6136
+ cuMemsetD8_v2.restype = CUresult
6137
+ cuMemsetD8_v2.argtypes = [CUdeviceptr, ctypes.c_ubyte, size_t]
6138
+ except AttributeError:
6139
+ pass
6140
+ try:
6141
+ cuMemsetD16_v2 = _libraries['libcuda.so'].cuMemsetD16_v2
6142
+ cuMemsetD16_v2.restype = CUresult
6143
+ cuMemsetD16_v2.argtypes = [CUdeviceptr, ctypes.c_uint16, size_t]
6144
+ except AttributeError:
6145
+ pass
6146
+ try:
6147
+ cuMemsetD32_v2 = _libraries['libcuda.so'].cuMemsetD32_v2
6148
+ cuMemsetD32_v2.restype = CUresult
6149
+ cuMemsetD32_v2.argtypes = [CUdeviceptr, ctypes.c_uint32, size_t]
6150
+ except AttributeError:
6151
+ pass
6152
+ try:
6153
+ cuMemsetD2D8_v2 = _libraries['libcuda.so'].cuMemsetD2D8_v2
6154
+ cuMemsetD2D8_v2.restype = CUresult
6155
+ cuMemsetD2D8_v2.argtypes = [CUdeviceptr, size_t, ctypes.c_ubyte, size_t, size_t]
6156
+ except AttributeError:
6157
+ pass
6158
+ try:
6159
+ cuMemsetD2D16_v2 = _libraries['libcuda.so'].cuMemsetD2D16_v2
6160
+ cuMemsetD2D16_v2.restype = CUresult
6161
+ cuMemsetD2D16_v2.argtypes = [CUdeviceptr, size_t, ctypes.c_uint16, size_t, size_t]
6162
+ except AttributeError:
6163
+ pass
6164
+ try:
6165
+ cuMemsetD2D32_v2 = _libraries['libcuda.so'].cuMemsetD2D32_v2
6166
+ cuMemsetD2D32_v2.restype = CUresult
6167
+ cuMemsetD2D32_v2.argtypes = [CUdeviceptr, size_t, ctypes.c_uint32, size_t, size_t]
6168
+ except AttributeError:
6169
+ pass
6170
+ try:
6171
+ cuMemcpy = _libraries['libcuda.so'].cuMemcpy
6172
+ cuMemcpy.restype = CUresult
6173
+ cuMemcpy.argtypes = [CUdeviceptr, CUdeviceptr, size_t]
6174
+ except AttributeError:
6175
+ pass
6176
+ try:
6177
+ cuMemcpyAsync = _libraries['libcuda.so'].cuMemcpyAsync
6178
+ cuMemcpyAsync.restype = CUresult
6179
+ cuMemcpyAsync.argtypes = [CUdeviceptr, CUdeviceptr, size_t, CUstream]
6180
+ except AttributeError:
6181
+ pass
6182
+ try:
6183
+ cuMemcpyPeer = _libraries['libcuda.so'].cuMemcpyPeer
6184
+ cuMemcpyPeer.restype = CUresult
6185
+ cuMemcpyPeer.argtypes = [CUdeviceptr, CUcontext, CUdeviceptr, CUcontext, size_t]
6186
+ except AttributeError:
6187
+ pass
6188
+ try:
6189
+ cuMemcpyPeerAsync = _libraries['libcuda.so'].cuMemcpyPeerAsync
6190
+ cuMemcpyPeerAsync.restype = CUresult
6191
+ cuMemcpyPeerAsync.argtypes = [CUdeviceptr, CUcontext, CUdeviceptr, CUcontext, size_t, CUstream]
6192
+ except AttributeError:
6193
+ pass
6194
+ try:
6195
+ cuMemcpy3DPeer = _libraries['libcuda.so'].cuMemcpy3DPeer
6196
+ cuMemcpy3DPeer.restype = CUresult
6197
+ cuMemcpy3DPeer.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_PEER_st)]
6198
+ except AttributeError:
6199
+ pass
6200
+ try:
6201
+ cuMemcpy3DPeerAsync = _libraries['libcuda.so'].cuMemcpy3DPeerAsync
6202
+ cuMemcpy3DPeerAsync.restype = CUresult
6203
+ cuMemcpy3DPeerAsync.argtypes = [ctypes.POINTER(struct_CUDA_MEMCPY3D_PEER_st), CUstream]
6204
+ except AttributeError:
6205
+ pass
6206
+ try:
6207
+ cuMemsetD8Async = _libraries['libcuda.so'].cuMemsetD8Async
6208
+ cuMemsetD8Async.restype = CUresult
6209
+ cuMemsetD8Async.argtypes = [CUdeviceptr, ctypes.c_ubyte, size_t, CUstream]
6210
+ except AttributeError:
6211
+ pass
6212
+ try:
6213
+ cuMemsetD16Async = _libraries['libcuda.so'].cuMemsetD16Async
6214
+ cuMemsetD16Async.restype = CUresult
6215
+ cuMemsetD16Async.argtypes = [CUdeviceptr, ctypes.c_uint16, size_t, CUstream]
6216
+ except AttributeError:
6217
+ pass
6218
+ try:
6219
+ cuMemsetD32Async = _libraries['libcuda.so'].cuMemsetD32Async
6220
+ cuMemsetD32Async.restype = CUresult
6221
+ cuMemsetD32Async.argtypes = [CUdeviceptr, ctypes.c_uint32, size_t, CUstream]
6222
+ except AttributeError:
6223
+ pass
6224
+ try:
6225
+ cuMemsetD2D8Async = _libraries['libcuda.so'].cuMemsetD2D8Async
6226
+ cuMemsetD2D8Async.restype = CUresult
6227
+ cuMemsetD2D8Async.argtypes = [CUdeviceptr, size_t, ctypes.c_ubyte, size_t, size_t, CUstream]
6228
+ except AttributeError:
6229
+ pass
6230
+ try:
6231
+ cuMemsetD2D16Async = _libraries['libcuda.so'].cuMemsetD2D16Async
6232
+ cuMemsetD2D16Async.restype = CUresult
6233
+ cuMemsetD2D16Async.argtypes = [CUdeviceptr, size_t, ctypes.c_uint16, size_t, size_t, CUstream]
6234
+ except AttributeError:
6235
+ pass
6236
+ try:
6237
+ cuMemsetD2D32Async = _libraries['libcuda.so'].cuMemsetD2D32Async
6238
+ cuMemsetD2D32Async.restype = CUresult
6239
+ cuMemsetD2D32Async.argtypes = [CUdeviceptr, size_t, ctypes.c_uint32, size_t, size_t, CUstream]
6240
+ except AttributeError:
6241
+ pass
6242
+ try:
6243
+ cuStreamGetPriority = _libraries['libcuda.so'].cuStreamGetPriority
6244
+ cuStreamGetPriority.restype = CUresult
6245
+ cuStreamGetPriority.argtypes = [CUstream, ctypes.POINTER(ctypes.c_int32)]
6246
+ except AttributeError:
6247
+ pass
6248
+ try:
6249
+ cuStreamGetId = _libraries['libcuda.so'].cuStreamGetId
6250
+ cuStreamGetId.restype = CUresult
6251
+ cuStreamGetId.argtypes = [CUstream, ctypes.POINTER(ctypes.c_uint64)]
6252
+ except AttributeError:
6253
+ pass
6254
+ try:
6255
+ cuStreamGetFlags = _libraries['libcuda.so'].cuStreamGetFlags
6256
+ cuStreamGetFlags.restype = CUresult
6257
+ cuStreamGetFlags.argtypes = [CUstream, ctypes.POINTER(ctypes.c_uint32)]
6258
+ except AttributeError:
6259
+ pass
6260
+ try:
6261
+ cuStreamGetCtx = _libraries['libcuda.so'].cuStreamGetCtx
6262
+ cuStreamGetCtx.restype = CUresult
6263
+ cuStreamGetCtx.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUctx_st))]
6264
+ except AttributeError:
6265
+ pass
6266
+ try:
6267
+ cuStreamWaitEvent = _libraries['libcuda.so'].cuStreamWaitEvent
6268
+ cuStreamWaitEvent.restype = CUresult
6269
+ cuStreamWaitEvent.argtypes = [CUstream, CUevent, ctypes.c_uint32]
6270
+ except AttributeError:
6271
+ pass
6272
+ try:
6273
+ cuStreamAddCallback = _libraries['libcuda.so'].cuStreamAddCallback
6274
+ cuStreamAddCallback.restype = CUresult
6275
+ cuStreamAddCallback.argtypes = [CUstream, CUstreamCallback, ctypes.POINTER(None), ctypes.c_uint32]
6276
+ except AttributeError:
6277
+ pass
6278
+ try:
6279
+ cuStreamAttachMemAsync = _libraries['libcuda.so'].cuStreamAttachMemAsync
6280
+ cuStreamAttachMemAsync.restype = CUresult
6281
+ cuStreamAttachMemAsync.argtypes = [CUstream, CUdeviceptr, size_t, ctypes.c_uint32]
6282
+ except AttributeError:
6283
+ pass
6284
+ try:
6285
+ cuStreamQuery = _libraries['libcuda.so'].cuStreamQuery
6286
+ cuStreamQuery.restype = CUresult
6287
+ cuStreamQuery.argtypes = [CUstream]
6288
+ except AttributeError:
6289
+ pass
6290
+ try:
6291
+ cuStreamSynchronize = _libraries['libcuda.so'].cuStreamSynchronize
6292
+ cuStreamSynchronize.restype = CUresult
6293
+ cuStreamSynchronize.argtypes = [CUstream]
6294
+ except AttributeError:
6295
+ pass
6296
+ try:
6297
+ cuEventRecord = _libraries['libcuda.so'].cuEventRecord
6298
+ cuEventRecord.restype = CUresult
6299
+ cuEventRecord.argtypes = [CUevent, CUstream]
6300
+ except AttributeError:
6301
+ pass
6302
+ try:
6303
+ cuEventRecordWithFlags = _libraries['libcuda.so'].cuEventRecordWithFlags
6304
+ cuEventRecordWithFlags.restype = CUresult
6305
+ cuEventRecordWithFlags.argtypes = [CUevent, CUstream, ctypes.c_uint32]
6306
+ except AttributeError:
6307
+ pass
6308
+ try:
6309
+ cuLaunchKernel = _libraries['libcuda.so'].cuLaunchKernel
6310
+ cuLaunchKernel.restype = CUresult
6311
+ cuLaunchKernel.argtypes = [CUfunction, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, CUstream, ctypes.POINTER(ctypes.POINTER(None)), ctypes.POINTER(ctypes.POINTER(None))]
6312
+ except AttributeError:
6313
+ pass
6314
+ try:
6315
+ cuLaunchKernelEx = _libraries['libcuda.so'].cuLaunchKernelEx
6316
+ cuLaunchKernelEx.restype = CUresult
6317
+ cuLaunchKernelEx.argtypes = [ctypes.POINTER(struct_CUlaunchConfig_st), CUfunction, ctypes.POINTER(ctypes.POINTER(None)), ctypes.POINTER(ctypes.POINTER(None))]
6318
+ except AttributeError:
6319
+ pass
6320
+ try:
6321
+ cuLaunchHostFunc = _libraries['libcuda.so'].cuLaunchHostFunc
6322
+ cuLaunchHostFunc.restype = CUresult
6323
+ cuLaunchHostFunc.argtypes = [CUstream, CUhostFn, ctypes.POINTER(None)]
6324
+ except AttributeError:
6325
+ pass
6326
+ try:
6327
+ cuGraphicsMapResources = _libraries['libcuda.so'].cuGraphicsMapResources
6328
+ cuGraphicsMapResources.restype = CUresult
6329
+ cuGraphicsMapResources.argtypes = [ctypes.c_uint32, ctypes.POINTER(ctypes.POINTER(struct_CUgraphicsResource_st)), CUstream]
6330
+ except AttributeError:
6331
+ pass
6332
+ try:
6333
+ cuGraphicsUnmapResources = _libraries['libcuda.so'].cuGraphicsUnmapResources
6334
+ cuGraphicsUnmapResources.restype = CUresult
6335
+ cuGraphicsUnmapResources.argtypes = [ctypes.c_uint32, ctypes.POINTER(ctypes.POINTER(struct_CUgraphicsResource_st)), CUstream]
6336
+ except AttributeError:
6337
+ pass
6338
+ try:
6339
+ cuStreamWriteValue32 = _libraries['libcuda.so'].cuStreamWriteValue32
6340
+ cuStreamWriteValue32.restype = CUresult
6341
+ cuStreamWriteValue32.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
6342
+ except AttributeError:
6343
+ pass
6344
+ try:
6345
+ cuStreamWaitValue32 = _libraries['libcuda.so'].cuStreamWaitValue32
6346
+ cuStreamWaitValue32.restype = CUresult
6347
+ cuStreamWaitValue32.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
6348
+ except AttributeError:
6349
+ pass
6350
+ try:
6351
+ cuStreamWriteValue64 = _libraries['libcuda.so'].cuStreamWriteValue64
6352
+ cuStreamWriteValue64.restype = CUresult
6353
+ cuStreamWriteValue64.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
6354
+ except AttributeError:
6355
+ pass
6356
+ try:
6357
+ cuStreamWaitValue64 = _libraries['libcuda.so'].cuStreamWaitValue64
6358
+ cuStreamWaitValue64.restype = CUresult
6359
+ cuStreamWaitValue64.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
6360
+ except AttributeError:
6361
+ pass
6362
+ try:
6363
+ cuStreamBatchMemOp = _libraries['libcuda.so'].cuStreamBatchMemOp
6364
+ cuStreamBatchMemOp.restype = CUresult
6365
+ cuStreamBatchMemOp.argtypes = [CUstream, ctypes.c_uint32, ctypes.POINTER(union_CUstreamBatchMemOpParams_union), ctypes.c_uint32]
6366
+ except AttributeError:
6367
+ pass
6368
+ try:
6369
+ cuStreamWriteValue32_ptsz = _libraries['libcuda.so'].cuStreamWriteValue32_ptsz
6370
+ cuStreamWriteValue32_ptsz.restype = CUresult
6371
+ cuStreamWriteValue32_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
6372
+ except AttributeError:
6373
+ pass
6374
+ try:
6375
+ cuStreamWaitValue32_ptsz = _libraries['libcuda.so'].cuStreamWaitValue32_ptsz
6376
+ cuStreamWaitValue32_ptsz.restype = CUresult
6377
+ cuStreamWaitValue32_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
6378
+ except AttributeError:
6379
+ pass
6380
+ try:
6381
+ cuStreamWriteValue64_ptsz = _libraries['libcuda.so'].cuStreamWriteValue64_ptsz
6382
+ cuStreamWriteValue64_ptsz.restype = CUresult
6383
+ cuStreamWriteValue64_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
6384
+ except AttributeError:
6385
+ pass
6386
+ try:
6387
+ cuStreamWaitValue64_ptsz = _libraries['libcuda.so'].cuStreamWaitValue64_ptsz
6388
+ cuStreamWaitValue64_ptsz.restype = CUresult
6389
+ cuStreamWaitValue64_ptsz.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
6390
+ except AttributeError:
6391
+ pass
6392
+ try:
6393
+ cuStreamBatchMemOp_ptsz = _libraries['libcuda.so'].cuStreamBatchMemOp_ptsz
6394
+ cuStreamBatchMemOp_ptsz.restype = CUresult
6395
+ cuStreamBatchMemOp_ptsz.argtypes = [CUstream, ctypes.c_uint32, ctypes.POINTER(union_CUstreamBatchMemOpParams_union), ctypes.c_uint32]
6396
+ except AttributeError:
6397
+ pass
6398
+ try:
6399
+ cuStreamWriteValue32_v2 = _libraries['libcuda.so'].cuStreamWriteValue32_v2
6400
+ cuStreamWriteValue32_v2.restype = CUresult
6401
+ cuStreamWriteValue32_v2.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
6402
+ except AttributeError:
6403
+ pass
6404
+ try:
6405
+ cuStreamWaitValue32_v2 = _libraries['libcuda.so'].cuStreamWaitValue32_v2
6406
+ cuStreamWaitValue32_v2.restype = CUresult
6407
+ cuStreamWaitValue32_v2.argtypes = [CUstream, CUdeviceptr, cuuint32_t, ctypes.c_uint32]
6408
+ except AttributeError:
6409
+ pass
6410
+ try:
6411
+ cuStreamWriteValue64_v2 = _libraries['libcuda.so'].cuStreamWriteValue64_v2
6412
+ cuStreamWriteValue64_v2.restype = CUresult
6413
+ cuStreamWriteValue64_v2.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
6414
+ except AttributeError:
6415
+ pass
6416
+ try:
6417
+ cuStreamWaitValue64_v2 = _libraries['libcuda.so'].cuStreamWaitValue64_v2
6418
+ cuStreamWaitValue64_v2.restype = CUresult
6419
+ cuStreamWaitValue64_v2.argtypes = [CUstream, CUdeviceptr, cuuint64_t, ctypes.c_uint32]
6420
+ except AttributeError:
6421
+ pass
6422
+ try:
6423
+ cuStreamBatchMemOp_v2 = _libraries['libcuda.so'].cuStreamBatchMemOp_v2
6424
+ cuStreamBatchMemOp_v2.restype = CUresult
6425
+ cuStreamBatchMemOp_v2.argtypes = [CUstream, ctypes.c_uint32, ctypes.POINTER(union_CUstreamBatchMemOpParams_union), ctypes.c_uint32]
6426
+ except AttributeError:
6427
+ pass
6428
+ try:
6429
+ cuMemPrefetchAsync = _libraries['libcuda.so'].cuMemPrefetchAsync
6430
+ cuMemPrefetchAsync.restype = CUresult
6431
+ cuMemPrefetchAsync.argtypes = [CUdeviceptr, size_t, CUdevice, CUstream]
6432
+ except AttributeError:
6433
+ pass
6434
+ try:
6435
+ cuLaunchCooperativeKernel = _libraries['libcuda.so'].cuLaunchCooperativeKernel
6436
+ cuLaunchCooperativeKernel.restype = CUresult
6437
+ cuLaunchCooperativeKernel.argtypes = [CUfunction, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, ctypes.c_uint32, CUstream, ctypes.POINTER(ctypes.POINTER(None))]
6438
+ except AttributeError:
6439
+ pass
6440
+ try:
6441
+ cuSignalExternalSemaphoresAsync = _libraries['libcuda.so'].cuSignalExternalSemaphoresAsync
6442
+ cuSignalExternalSemaphoresAsync.restype = CUresult
6443
+ cuSignalExternalSemaphoresAsync.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUextSemaphore_st)), ctypes.POINTER(struct_CUDA_EXTERNAL_SEMAPHORE_SIGNAL_PARAMS_st), ctypes.c_uint32, CUstream]
6444
+ except AttributeError:
6445
+ pass
6446
+ try:
6447
+ cuWaitExternalSemaphoresAsync = _libraries['libcuda.so'].cuWaitExternalSemaphoresAsync
6448
+ cuWaitExternalSemaphoresAsync.restype = CUresult
6449
+ cuWaitExternalSemaphoresAsync.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUextSemaphore_st)), ctypes.POINTER(struct_CUDA_EXTERNAL_SEMAPHORE_WAIT_PARAMS_st), ctypes.c_uint32, CUstream]
6450
+ except AttributeError:
6451
+ pass
6452
+ try:
6453
+ cuStreamBeginCapture = _libraries['libcuda.so'].cuStreamBeginCapture
6454
+ cuStreamBeginCapture.restype = CUresult
6455
+ cuStreamBeginCapture.argtypes = [CUstream]
6456
+ except AttributeError:
6457
+ pass
6458
+ try:
6459
+ cuStreamBeginCapture_ptsz = _libraries['libcuda.so'].cuStreamBeginCapture_ptsz
6460
+ cuStreamBeginCapture_ptsz.restype = CUresult
6461
+ cuStreamBeginCapture_ptsz.argtypes = [CUstream]
6462
+ except AttributeError:
6463
+ pass
6464
+ try:
6465
+ cuStreamBeginCapture_v2 = _libraries['libcuda.so'].cuStreamBeginCapture_v2
6466
+ cuStreamBeginCapture_v2.restype = CUresult
6467
+ cuStreamBeginCapture_v2.argtypes = [CUstream, CUstreamCaptureMode]
6468
+ except AttributeError:
6469
+ pass
6470
+ try:
6471
+ cuStreamEndCapture = _libraries['libcuda.so'].cuStreamEndCapture
6472
+ cuStreamEndCapture.restype = CUresult
6473
+ cuStreamEndCapture.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUgraph_st))]
6474
+ except AttributeError:
6475
+ pass
6476
+ try:
6477
+ cuStreamIsCapturing = _libraries['libcuda.so'].cuStreamIsCapturing
6478
+ cuStreamIsCapturing.restype = CUresult
6479
+ cuStreamIsCapturing.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum)]
6480
+ except AttributeError:
6481
+ pass
6482
+ try:
6483
+ cuStreamGetCaptureInfo = _libraries['libcuda.so'].cuStreamGetCaptureInfo
6484
+ cuStreamGetCaptureInfo.restype = CUresult
6485
+ cuStreamGetCaptureInfo.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum), ctypes.POINTER(ctypes.c_uint64)]
6486
+ except AttributeError:
6487
+ pass
6488
+ try:
6489
+ cuStreamGetCaptureInfo_ptsz = _libraries['libcuda.so'].cuStreamGetCaptureInfo_ptsz
6490
+ cuStreamGetCaptureInfo_ptsz.restype = CUresult
6491
+ cuStreamGetCaptureInfo_ptsz.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum), ctypes.POINTER(ctypes.c_uint64)]
6492
+ except AttributeError:
6493
+ pass
6494
+ try:
6495
+ cuStreamGetCaptureInfo_v2 = _libraries['libcuda.so'].cuStreamGetCaptureInfo_v2
6496
+ cuStreamGetCaptureInfo_v2.restype = CUresult
6497
+ cuStreamGetCaptureInfo_v2.argtypes = [CUstream, ctypes.POINTER(CUstreamCaptureStatus_enum), ctypes.POINTER(ctypes.c_uint64), ctypes.POINTER(ctypes.POINTER(struct_CUgraph_st)), ctypes.POINTER(ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st))), ctypes.POINTER(ctypes.c_uint64)]
6498
+ except AttributeError:
6499
+ pass
6500
+ try:
6501
+ cuGraphAddKernelNode = _libraries['libcuda.so'].cuGraphAddKernelNode
6502
+ cuGraphAddKernelNode.restype = CUresult
6503
+ cuGraphAddKernelNode.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), size_t, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
6504
+ except AttributeError:
6505
+ pass
6506
+ try:
6507
+ cuGraphKernelNodeGetParams = _libraries['libcuda.so'].cuGraphKernelNodeGetParams
6508
+ cuGraphKernelNodeGetParams.restype = CUresult
6509
+ cuGraphKernelNodeGetParams.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
6510
+ except AttributeError:
6511
+ pass
6512
+ try:
6513
+ cuGraphKernelNodeSetParams = _libraries['libcuda.so'].cuGraphKernelNodeSetParams
6514
+ cuGraphKernelNodeSetParams.restype = CUresult
6515
+ cuGraphKernelNodeSetParams.argtypes = [CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
6516
+ except AttributeError:
6517
+ pass
6518
+ try:
6519
+ cuGraphExecKernelNodeSetParams = _libraries['libcuda.so'].cuGraphExecKernelNodeSetParams
6520
+ cuGraphExecKernelNodeSetParams.restype = CUresult
6521
+ cuGraphExecKernelNodeSetParams.argtypes = [CUgraphExec, CUgraphNode, ctypes.POINTER(struct_CUDA_KERNEL_NODE_PARAMS_st)]
6522
+ except AttributeError:
6523
+ pass
6524
+ try:
6525
+ cuGraphInstantiateWithParams = _libraries['libcuda.so'].cuGraphInstantiateWithParams
6526
+ cuGraphInstantiateWithParams.restype = CUresult
6527
+ cuGraphInstantiateWithParams.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphExec_st)), CUgraph, ctypes.POINTER(struct_CUDA_GRAPH_INSTANTIATE_PARAMS_st)]
6528
+ except AttributeError:
6529
+ pass
6530
+ try:
6531
+ cuGraphExecUpdate = _libraries['libcuda.so'].cuGraphExecUpdate
6532
+ cuGraphExecUpdate.restype = CUresult
6533
+ cuGraphExecUpdate.argtypes = [CUgraphExec, CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), ctypes.POINTER(CUgraphExecUpdateResult_enum)]
6534
+ except AttributeError:
6535
+ pass
6536
+ try:
6537
+ cuGraphUpload = _libraries['libcuda.so'].cuGraphUpload
6538
+ cuGraphUpload.restype = CUresult
6539
+ cuGraphUpload.argtypes = [CUgraphExec, CUstream]
6540
+ except AttributeError:
6541
+ pass
6542
+ try:
6543
+ cuGraphLaunch = _libraries['libcuda.so'].cuGraphLaunch
6544
+ cuGraphLaunch.restype = CUresult
6545
+ cuGraphLaunch.argtypes = [CUgraphExec, CUstream]
6546
+ except AttributeError:
6547
+ pass
6548
+ try:
6549
+ cuStreamCopyAttributes = _libraries['libcuda.so'].cuStreamCopyAttributes
6550
+ cuStreamCopyAttributes.restype = CUresult
6551
+ cuStreamCopyAttributes.argtypes = [CUstream, CUstream]
6552
+ except AttributeError:
6553
+ pass
6554
+ try:
6555
+ cuStreamGetAttribute = _libraries['libcuda.so'].cuStreamGetAttribute
6556
+ cuStreamGetAttribute.restype = CUresult
6557
+ cuStreamGetAttribute.argtypes = [CUstream, CUstreamAttrID, ctypes.POINTER(union_CUlaunchAttributeValue_union)]
6558
+ except AttributeError:
6559
+ pass
6560
+ try:
6561
+ cuStreamSetAttribute = _libraries['libcuda.so'].cuStreamSetAttribute
6562
+ cuStreamSetAttribute.restype = CUresult
6563
+ cuStreamSetAttribute.argtypes = [CUstream, CUstreamAttrID, ctypes.POINTER(union_CUlaunchAttributeValue_union)]
6564
+ except AttributeError:
6565
+ pass
6566
+ try:
6567
+ cuIpcOpenMemHandle = _libraries['libcuda.so'].cuIpcOpenMemHandle
6568
+ cuIpcOpenMemHandle.restype = CUresult
6569
+ cuIpcOpenMemHandle.argtypes = [ctypes.POINTER(ctypes.c_uint64), CUipcMemHandle, ctypes.c_uint32]
6570
+ except AttributeError:
6571
+ pass
6572
+ try:
6573
+ cuGraphInstantiate = _libraries['libcuda.so'].cuGraphInstantiate
6574
+ cuGraphInstantiate.restype = CUresult
6575
+ cuGraphInstantiate.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphExec_st)), CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), ctypes.POINTER(ctypes.c_char), size_t]
6576
+ except AttributeError:
6577
+ pass
6578
+ try:
6579
+ cuGraphInstantiate_v2 = _libraries['libcuda.so'].cuGraphInstantiate_v2
6580
+ cuGraphInstantiate_v2.restype = CUresult
6581
+ cuGraphInstantiate_v2.argtypes = [ctypes.POINTER(ctypes.POINTER(struct_CUgraphExec_st)), CUgraph, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), ctypes.POINTER(ctypes.c_char), size_t]
6582
+ except AttributeError:
6583
+ pass
6584
+ try:
6585
+ cuMemMapArrayAsync = _libraries['libcuda.so'].cuMemMapArrayAsync
6586
+ cuMemMapArrayAsync.restype = CUresult
6587
+ cuMemMapArrayAsync.argtypes = [ctypes.POINTER(struct_CUarrayMapInfo_st), ctypes.c_uint32, CUstream]
6588
+ except AttributeError:
6589
+ pass
6590
+ try:
6591
+ cuMemFreeAsync = _libraries['libcuda.so'].cuMemFreeAsync
6592
+ cuMemFreeAsync.restype = CUresult
6593
+ cuMemFreeAsync.argtypes = [CUdeviceptr, CUstream]
6594
+ except AttributeError:
6595
+ pass
6596
+ try:
6597
+ cuMemAllocAsync = _libraries['libcuda.so'].cuMemAllocAsync
6598
+ cuMemAllocAsync.restype = CUresult
6599
+ cuMemAllocAsync.argtypes = [ctypes.POINTER(ctypes.c_uint64), size_t, CUstream]
6600
+ except AttributeError:
6601
+ pass
6602
+ try:
6603
+ cuMemAllocFromPoolAsync = _libraries['libcuda.so'].cuMemAllocFromPoolAsync
6604
+ cuMemAllocFromPoolAsync.restype = CUresult
6605
+ cuMemAllocFromPoolAsync.argtypes = [ctypes.POINTER(ctypes.c_uint64), size_t, CUmemoryPool, CUstream]
6606
+ except AttributeError:
6607
+ pass
6608
+ try:
6609
+ cuStreamUpdateCaptureDependencies = _libraries['libcuda.so'].cuStreamUpdateCaptureDependencies
6610
+ cuStreamUpdateCaptureDependencies.restype = CUresult
6611
+ cuStreamUpdateCaptureDependencies.argtypes = [CUstream, ctypes.POINTER(ctypes.POINTER(struct_CUgraphNode_st)), size_t, ctypes.c_uint32]
6612
+ except AttributeError:
6613
+ pass
6614
+ try:
6615
+ cuGetProcAddress = _libraries['libcuda.so'].cuGetProcAddress
6616
+ cuGetProcAddress.restype = CUresult
6617
+ cuGetProcAddress.argtypes = [ctypes.POINTER(ctypes.c_char), ctypes.POINTER(ctypes.POINTER(None)), ctypes.c_int32, cuuint64_t]
6618
+ except AttributeError:
6619
+ pass
4923
6620
  __all__ = \
4924
- ['CUDA_ARRAY3D_DESCRIPTOR', 'CUDA_ARRAY3D_DESCRIPTOR_v2',
4925
- 'CUDA_ARRAY_DESCRIPTOR', 'CUDA_ARRAY_DESCRIPTOR_v2',
6621
+ ['CUDA_ARRAY3D_DESCRIPTOR', 'CUDA_ARRAY3D_DESCRIPTOR_v1',
6622
+ 'CUDA_ARRAY3D_DESCRIPTOR_v2', 'CUDA_ARRAY_DESCRIPTOR',
6623
+ 'CUDA_ARRAY_DESCRIPTOR_v1', 'CUDA_ARRAY_DESCRIPTOR_v2',
6624
+ 'CUDA_ARRAY_MEMORY_REQUIREMENTS',
6625
+ 'CUDA_ARRAY_MEMORY_REQUIREMENTS_v1',
4926
6626
  'CUDA_ARRAY_SPARSE_PROPERTIES', 'CUDA_ARRAY_SPARSE_PROPERTIES_v1',
4927
- 'CUDA_ERROR_ALREADY_ACQUIRED', 'CUDA_ERROR_ALREADY_MAPPED',
4928
- 'CUDA_ERROR_ARRAY_IS_MAPPED', 'CUDA_ERROR_ASSERT',
4929
- 'CUDA_ERROR_CAPTURED_EVENT',
6627
+ 'CUDA_BATCH_MEM_OP_NODE_PARAMS', 'CUDA_ERROR_ALREADY_ACQUIRED',
6628
+ 'CUDA_ERROR_ALREADY_MAPPED', 'CUDA_ERROR_ARRAY_IS_MAPPED',
6629
+ 'CUDA_ERROR_ASSERT', 'CUDA_ERROR_CAPTURED_EVENT',
6630
+ 'CUDA_ERROR_CDP_NOT_SUPPORTED', 'CUDA_ERROR_CDP_VERSION_MISMATCH',
4930
6631
  'CUDA_ERROR_COMPAT_NOT_SUPPORTED_ON_DEVICE',
4931
6632
  'CUDA_ERROR_CONTEXT_ALREADY_CURRENT',
4932
6633
  'CUDA_ERROR_CONTEXT_ALREADY_IN_USE',
4933
6634
  'CUDA_ERROR_CONTEXT_IS_DESTROYED',
4934
6635
  'CUDA_ERROR_COOPERATIVE_LAUNCH_TOO_LARGE',
4935
6636
  'CUDA_ERROR_DEINITIALIZED', 'CUDA_ERROR_DEVICE_NOT_LICENSED',
4936
- 'CUDA_ERROR_ECC_UNCORRECTABLE', 'CUDA_ERROR_EXTERNAL_DEVICE',
4937
- 'CUDA_ERROR_FILE_NOT_FOUND',
6637
+ 'CUDA_ERROR_DEVICE_UNAVAILABLE', 'CUDA_ERROR_ECC_UNCORRECTABLE',
6638
+ 'CUDA_ERROR_EXTERNAL_DEVICE', 'CUDA_ERROR_FILE_NOT_FOUND',
4938
6639
  'CUDA_ERROR_GRAPH_EXEC_UPDATE_FAILURE',
4939
6640
  'CUDA_ERROR_HARDWARE_STACK_ERROR',
4940
6641
  'CUDA_ERROR_HOST_MEMORY_ALREADY_REGISTERED',
4941
6642
  'CUDA_ERROR_HOST_MEMORY_NOT_REGISTERED',
4942
6643
  'CUDA_ERROR_ILLEGAL_ADDRESS', 'CUDA_ERROR_ILLEGAL_INSTRUCTION',
4943
6644
  'CUDA_ERROR_ILLEGAL_STATE', 'CUDA_ERROR_INVALID_ADDRESS_SPACE',
4944
- 'CUDA_ERROR_INVALID_CONTEXT', 'CUDA_ERROR_INVALID_DEVICE',
6645
+ 'CUDA_ERROR_INVALID_CLUSTER_SIZE', 'CUDA_ERROR_INVALID_CONTEXT',
6646
+ 'CUDA_ERROR_INVALID_DEVICE',
4945
6647
  'CUDA_ERROR_INVALID_GRAPHICS_CONTEXT',
4946
6648
  'CUDA_ERROR_INVALID_HANDLE', 'CUDA_ERROR_INVALID_IMAGE',
4947
6649
  'CUDA_ERROR_INVALID_PC', 'CUDA_ERROR_INVALID_PTX',
@@ -4951,6 +6653,7 @@ __all__ = \
4951
6653
  'CUDA_ERROR_LAUNCH_INCOMPATIBLE_TEXTURING',
4952
6654
  'CUDA_ERROR_LAUNCH_OUT_OF_RESOURCES', 'CUDA_ERROR_LAUNCH_TIMEOUT',
4953
6655
  'CUDA_ERROR_MAP_FAILED', 'CUDA_ERROR_MISALIGNED_ADDRESS',
6656
+ 'CUDA_ERROR_MPS_CLIENT_TERMINATED',
4954
6657
  'CUDA_ERROR_MPS_CONNECTION_FAILED',
4955
6658
  'CUDA_ERROR_MPS_MAX_CLIENTS_REACHED',
4956
6659
  'CUDA_ERROR_MPS_MAX_CONNECTIONS_REACHED',
@@ -5002,12 +6705,21 @@ __all__ = \
5002
6705
  'CUDA_EXT_SEM_SIGNAL_NODE_PARAMS_v1',
5003
6706
  'CUDA_EXT_SEM_WAIT_NODE_PARAMS',
5004
6707
  'CUDA_EXT_SEM_WAIT_NODE_PARAMS_v1',
6708
+ 'CUDA_GRAPH_INSTANTIATE_ERROR',
5005
6709
  'CUDA_GRAPH_INSTANTIATE_FLAG_AUTO_FREE_ON_LAUNCH',
6710
+ 'CUDA_GRAPH_INSTANTIATE_FLAG_DEVICE_LAUNCH',
6711
+ 'CUDA_GRAPH_INSTANTIATE_FLAG_UPLOAD',
6712
+ 'CUDA_GRAPH_INSTANTIATE_FLAG_USE_NODE_PRIORITY',
6713
+ 'CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE',
6714
+ 'CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED',
6715
+ 'CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED',
6716
+ 'CUDA_GRAPH_INSTANTIATE_PARAMS', 'CUDA_GRAPH_INSTANTIATE_SUCCESS',
5006
6717
  'CUDA_HOST_NODE_PARAMS', 'CUDA_HOST_NODE_PARAMS_v1',
5007
6718
  'CUDA_KERNEL_NODE_PARAMS', 'CUDA_KERNEL_NODE_PARAMS_v1',
5008
- 'CUDA_LAUNCH_PARAMS', 'CUDA_LAUNCH_PARAMS_v1', 'CUDA_MEMCPY2D',
6719
+ 'CUDA_KERNEL_NODE_PARAMS_v2', 'CUDA_LAUNCH_PARAMS',
6720
+ 'CUDA_LAUNCH_PARAMS_v1', 'CUDA_MEMCPY2D', 'CUDA_MEMCPY2D_v1',
5009
6721
  'CUDA_MEMCPY2D_v2', 'CUDA_MEMCPY3D', 'CUDA_MEMCPY3D_PEER',
5010
- 'CUDA_MEMCPY3D_PEER_v1', 'CUDA_MEMCPY3D_v2',
6722
+ 'CUDA_MEMCPY3D_PEER_v1', 'CUDA_MEMCPY3D_v1', 'CUDA_MEMCPY3D_v2',
5011
6723
  'CUDA_MEMSET_NODE_PARAMS', 'CUDA_MEMSET_NODE_PARAMS_v1',
5012
6724
  'CUDA_MEM_ALLOC_NODE_PARAMS',
5013
6725
  'CUDA_POINTER_ATTRIBUTE_ACCESS_FLAGS',
@@ -5040,12 +6752,14 @@ __all__ = \
5040
6752
  'CU_AD_FORMAT_UNSIGNED_INT32', 'CU_AD_FORMAT_UNSIGNED_INT8',
5041
6753
  'CU_ARRAY_SPARSE_SUBRESOURCE_TYPE_MIPTAIL',
5042
6754
  'CU_ARRAY_SPARSE_SUBRESOURCE_TYPE_SPARSE_LEVEL',
5043
- 'CU_COMPUTEMODE_DEFAULT', 'CU_COMPUTEMODE_EXCLUSIVE_PROCESS',
5044
- 'CU_COMPUTEMODE_PROHIBITED', 'CU_CTX_BLOCKING_SYNC',
5045
- 'CU_CTX_FLAGS_MASK', 'CU_CTX_LMEM_RESIZE_TO_MAX',
5046
- 'CU_CTX_MAP_HOST', 'CU_CTX_SCHED_AUTO',
5047
- 'CU_CTX_SCHED_BLOCKING_SYNC', 'CU_CTX_SCHED_MASK',
5048
- 'CU_CTX_SCHED_SPIN', 'CU_CTX_SCHED_YIELD',
6755
+ 'CU_CLUSTER_SCHEDULING_POLICY_DEFAULT',
6756
+ 'CU_CLUSTER_SCHEDULING_POLICY_LOAD_BALANCING',
6757
+ 'CU_CLUSTER_SCHEDULING_POLICY_SPREAD', 'CU_COMPUTEMODE_DEFAULT',
6758
+ 'CU_COMPUTEMODE_EXCLUSIVE_PROCESS', 'CU_COMPUTEMODE_PROHIBITED',
6759
+ 'CU_CTX_BLOCKING_SYNC', 'CU_CTX_FLAGS_MASK',
6760
+ 'CU_CTX_LMEM_RESIZE_TO_MAX', 'CU_CTX_MAP_HOST',
6761
+ 'CU_CTX_SCHED_AUTO', 'CU_CTX_SCHED_BLOCKING_SYNC',
6762
+ 'CU_CTX_SCHED_MASK', 'CU_CTX_SCHED_SPIN', 'CU_CTX_SCHED_YIELD',
5049
6763
  'CU_CUBEMAP_FACE_NEGATIVE_X', 'CU_CUBEMAP_FACE_NEGATIVE_Y',
5050
6764
  'CU_CUBEMAP_FACE_NEGATIVE_Z', 'CU_CUBEMAP_FACE_POSITIVE_X',
5051
6765
  'CU_CUBEMAP_FACE_POSITIVE_Y', 'CU_CUBEMAP_FACE_POSITIVE_Z',
@@ -5054,10 +6768,13 @@ __all__ = \
5054
6768
  'CU_DEVICE_ATTRIBUTE_CAN_MAP_HOST_MEMORY',
5055
6769
  'CU_DEVICE_ATTRIBUTE_CAN_TEX2D_GATHER',
5056
6770
  'CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS',
6771
+ 'CU_DEVICE_ATTRIBUTE_CAN_USE_64_BIT_STREAM_MEM_OPS_V1',
5057
6772
  'CU_DEVICE_ATTRIBUTE_CAN_USE_HOST_POINTER_FOR_REGISTERED_MEM',
5058
- 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_MEM_OPS',
6773
+ 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_MEM_OPS_V1',
5059
6774
  'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR',
6775
+ 'CU_DEVICE_ATTRIBUTE_CAN_USE_STREAM_WAIT_VALUE_NOR_V1',
5060
6776
  'CU_DEVICE_ATTRIBUTE_CLOCK_RATE',
6777
+ 'CU_DEVICE_ATTRIBUTE_CLUSTER_LAUNCH',
5061
6778
  'CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MAJOR',
5062
6779
  'CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MINOR',
5063
6780
  'CU_DEVICE_ATTRIBUTE_COMPUTE_MODE',
@@ -5066,7 +6783,9 @@ __all__ = \
5066
6783
  'CU_DEVICE_ATTRIBUTE_CONCURRENT_MANAGED_ACCESS',
5067
6784
  'CU_DEVICE_ATTRIBUTE_COOPERATIVE_LAUNCH',
5068
6785
  'CU_DEVICE_ATTRIBUTE_COOPERATIVE_MULTI_DEVICE_LAUNCH',
6786
+ 'CU_DEVICE_ATTRIBUTE_DEFERRED_MAPPING_CUDA_ARRAY_SUPPORTED',
5069
6787
  'CU_DEVICE_ATTRIBUTE_DIRECT_MANAGED_MEM_ACCESS_FROM_HOST',
6788
+ 'CU_DEVICE_ATTRIBUTE_DMA_BUF_SUPPORTED',
5070
6789
  'CU_DEVICE_ATTRIBUTE_ECC_ENABLED',
5071
6790
  'CU_DEVICE_ATTRIBUTE_GENERIC_COMPRESSION_SUPPORTED',
5072
6791
  'CU_DEVICE_ATTRIBUTE_GLOBAL_L1_CACHE_SUPPORTED',
@@ -5082,6 +6801,7 @@ __all__ = \
5082
6801
  'CU_DEVICE_ATTRIBUTE_HOST_NATIVE_ATOMIC_SUPPORTED',
5083
6802
  'CU_DEVICE_ATTRIBUTE_HOST_REGISTER_SUPPORTED',
5084
6803
  'CU_DEVICE_ATTRIBUTE_INTEGRATED',
6804
+ 'CU_DEVICE_ATTRIBUTE_IPC_EVENT_SUPPORTED',
5085
6805
  'CU_DEVICE_ATTRIBUTE_KERNEL_EXEC_TIMEOUT',
5086
6806
  'CU_DEVICE_ATTRIBUTE_L2_CACHE_SIZE',
5087
6807
  'CU_DEVICE_ATTRIBUTE_LOCAL_L1_CACHE_SUPPORTED',
@@ -5149,6 +6869,7 @@ __all__ = \
5149
6869
  'CU_DEVICE_ATTRIBUTE_MEMORY_CLOCK_RATE',
5150
6870
  'CU_DEVICE_ATTRIBUTE_MEMORY_POOLS_SUPPORTED',
5151
6871
  'CU_DEVICE_ATTRIBUTE_MEMPOOL_SUPPORTED_HANDLE_TYPES',
6872
+ 'CU_DEVICE_ATTRIBUTE_MEM_SYNC_DOMAIN_COUNT',
5152
6873
  'CU_DEVICE_ATTRIBUTE_MULTIPROCESSOR_COUNT',
5153
6874
  'CU_DEVICE_ATTRIBUTE_MULTI_GPU_BOARD',
5154
6875
  'CU_DEVICE_ATTRIBUTE_MULTI_GPU_BOARD_GROUP_ID',
@@ -5166,11 +6887,13 @@ __all__ = \
5166
6887
  'CU_DEVICE_ATTRIBUTE_STREAM_PRIORITIES_SUPPORTED',
5167
6888
  'CU_DEVICE_ATTRIBUTE_SURFACE_ALIGNMENT',
5168
6889
  'CU_DEVICE_ATTRIBUTE_TCC_DRIVER',
6890
+ 'CU_DEVICE_ATTRIBUTE_TENSOR_MAP_ACCESS_SUPPORTED',
5169
6891
  'CU_DEVICE_ATTRIBUTE_TEXTURE_ALIGNMENT',
5170
6892
  'CU_DEVICE_ATTRIBUTE_TEXTURE_PITCH_ALIGNMENT',
5171
6893
  'CU_DEVICE_ATTRIBUTE_TIMELINE_SEMAPHORE_INTEROP_SUPPORTED',
5172
6894
  'CU_DEVICE_ATTRIBUTE_TOTAL_CONSTANT_MEMORY',
5173
6895
  'CU_DEVICE_ATTRIBUTE_UNIFIED_ADDRESSING',
6896
+ 'CU_DEVICE_ATTRIBUTE_UNIFIED_FUNCTION_POINTERS',
5174
6897
  'CU_DEVICE_ATTRIBUTE_VIRTUAL_ADDRESS_MANAGEMENT_SUPPORTED',
5175
6898
  'CU_DEVICE_ATTRIBUTE_VIRTUAL_MEMORY_MANAGEMENT_SUPPORTED',
5176
6899
  'CU_DEVICE_ATTRIBUTE_WARP_SIZE',
@@ -5182,6 +6905,8 @@ __all__ = \
5182
6905
  'CU_EVENT_BLOCKING_SYNC', 'CU_EVENT_DEFAULT',
5183
6906
  'CU_EVENT_DISABLE_TIMING', 'CU_EVENT_INTERPROCESS',
5184
6907
  'CU_EVENT_RECORD_DEFAULT', 'CU_EVENT_RECORD_EXTERNAL',
6908
+ 'CU_EVENT_SCHED_AUTO', 'CU_EVENT_SCHED_BLOCKING_SYNC',
6909
+ 'CU_EVENT_SCHED_SPIN', 'CU_EVENT_SCHED_YIELD',
5185
6910
  'CU_EVENT_WAIT_DEFAULT', 'CU_EVENT_WAIT_EXTERNAL',
5186
6911
  'CU_EXEC_AFFINITY_TYPE_MAX', 'CU_EXEC_AFFINITY_TYPE_SM_COUNT',
5187
6912
  'CU_EXTERNAL_MEMORY_HANDLE_TYPE_D3D11_RESOURCE',
@@ -5209,19 +6934,28 @@ __all__ = \
5209
6934
  'CU_FLUSH_GPU_DIRECT_RDMA_WRITES_TO_OWNER',
5210
6935
  'CU_FUNC_ATTRIBUTE_BINARY_VERSION',
5211
6936
  'CU_FUNC_ATTRIBUTE_CACHE_MODE_CA',
6937
+ 'CU_FUNC_ATTRIBUTE_CLUSTER_SCHEDULING_POLICY_PREFERENCE',
6938
+ 'CU_FUNC_ATTRIBUTE_CLUSTER_SIZE_MUST_BE_SET',
5212
6939
  'CU_FUNC_ATTRIBUTE_CONST_SIZE_BYTES',
5213
6940
  'CU_FUNC_ATTRIBUTE_LOCAL_SIZE_BYTES', 'CU_FUNC_ATTRIBUTE_MAX',
5214
6941
  'CU_FUNC_ATTRIBUTE_MAX_DYNAMIC_SHARED_SIZE_BYTES',
5215
6942
  'CU_FUNC_ATTRIBUTE_MAX_THREADS_PER_BLOCK',
6943
+ 'CU_FUNC_ATTRIBUTE_NON_PORTABLE_CLUSTER_SIZE_ALLOWED',
5216
6944
  'CU_FUNC_ATTRIBUTE_NUM_REGS',
5217
6945
  'CU_FUNC_ATTRIBUTE_PREFERRED_SHARED_MEMORY_CARVEOUT',
5218
6946
  'CU_FUNC_ATTRIBUTE_PTX_VERSION',
6947
+ 'CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_DEPTH',
6948
+ 'CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_HEIGHT',
6949
+ 'CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_WIDTH',
5219
6950
  'CU_FUNC_ATTRIBUTE_SHARED_SIZE_BYTES',
5220
6951
  'CU_FUNC_CACHE_PREFER_EQUAL', 'CU_FUNC_CACHE_PREFER_L1',
5221
6952
  'CU_FUNC_CACHE_PREFER_NONE', 'CU_FUNC_CACHE_PREFER_SHARED',
5222
6953
  'CU_GET_PROC_ADDRESS_DEFAULT',
5223
6954
  'CU_GET_PROC_ADDRESS_LEGACY_STREAM',
5224
6955
  'CU_GET_PROC_ADDRESS_PER_THREAD_DEFAULT_STREAM',
6956
+ 'CU_GET_PROC_ADDRESS_SUCCESS',
6957
+ 'CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND',
6958
+ 'CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT',
5225
6959
  'CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES',
5226
6960
  'CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE',
5227
6961
  'CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER',
@@ -5233,7 +6967,9 @@ __all__ = \
5233
6967
  'CU_GRAPHICS_REGISTER_FLAGS_SURFACE_LDST',
5234
6968
  'CU_GRAPHICS_REGISTER_FLAGS_TEXTURE_GATHER',
5235
6969
  'CU_GRAPHICS_REGISTER_FLAGS_WRITE_DISCARD',
6970
+ 'CU_GRAPH_DEBUG_DOT_FLAGS_BATCH_MEM_OP_NODE_PARAMS',
5236
6971
  'CU_GRAPH_DEBUG_DOT_FLAGS_EVENT_NODE_PARAMS',
6972
+ 'CU_GRAPH_DEBUG_DOT_FLAGS_EXTRA_TOPO_INFO',
5237
6973
  'CU_GRAPH_DEBUG_DOT_FLAGS_EXT_SEMAS_SIGNAL_NODE_PARAMS',
5238
6974
  'CU_GRAPH_DEBUG_DOT_FLAGS_EXT_SEMAS_WAIT_NODE_PARAMS',
5239
6975
  'CU_GRAPH_DEBUG_DOT_FLAGS_HANDLES',
@@ -5246,6 +6982,7 @@ __all__ = \
5246
6982
  'CU_GRAPH_DEBUG_DOT_FLAGS_MEM_FREE_NODE_PARAMS',
5247
6983
  'CU_GRAPH_DEBUG_DOT_FLAGS_RUNTIME_TYPES',
5248
6984
  'CU_GRAPH_DEBUG_DOT_FLAGS_VERBOSE', 'CU_GRAPH_EXEC_UPDATE_ERROR',
6985
+ 'CU_GRAPH_EXEC_UPDATE_ERROR_ATTRIBUTES_CHANGED',
5249
6986
  'CU_GRAPH_EXEC_UPDATE_ERROR_FUNCTION_CHANGED',
5250
6987
  'CU_GRAPH_EXEC_UPDATE_ERROR_NODE_TYPE_CHANGED',
5251
6988
  'CU_GRAPH_EXEC_UPDATE_ERROR_NOT_SUPPORTED',
@@ -5256,7 +6993,8 @@ __all__ = \
5256
6993
  'CU_GRAPH_MEM_ATTR_RESERVED_MEM_CURRENT',
5257
6994
  'CU_GRAPH_MEM_ATTR_RESERVED_MEM_HIGH',
5258
6995
  'CU_GRAPH_MEM_ATTR_USED_MEM_CURRENT',
5259
- 'CU_GRAPH_MEM_ATTR_USED_MEM_HIGH', 'CU_GRAPH_NODE_TYPE_EMPTY',
6996
+ 'CU_GRAPH_MEM_ATTR_USED_MEM_HIGH',
6997
+ 'CU_GRAPH_NODE_TYPE_BATCH_MEM_OP', 'CU_GRAPH_NODE_TYPE_EMPTY',
5260
6998
  'CU_GRAPH_NODE_TYPE_EVENT_RECORD',
5261
6999
  'CU_GRAPH_NODE_TYPE_EXT_SEMAS_SIGNAL',
5262
7000
  'CU_GRAPH_NODE_TYPE_EXT_SEMAS_WAIT', 'CU_GRAPH_NODE_TYPE_GRAPH',
@@ -5278,11 +7016,28 @@ __all__ = \
5278
7016
  'CU_JIT_LOG_VERBOSE', 'CU_JIT_LTO', 'CU_JIT_MAX_REGISTERS',
5279
7017
  'CU_JIT_NEW_SM3X_OPT', 'CU_JIT_NUM_INPUT_TYPES',
5280
7018
  'CU_JIT_NUM_OPTIONS', 'CU_JIT_OPTIMIZATION_LEVEL',
5281
- 'CU_JIT_PREC_DIV', 'CU_JIT_PREC_SQRT', 'CU_JIT_TARGET',
7019
+ 'CU_JIT_OPTIMIZE_UNUSED_DEVICE_VARIABLES',
7020
+ 'CU_JIT_POSITION_INDEPENDENT_CODE', 'CU_JIT_PREC_DIV',
7021
+ 'CU_JIT_PREC_SQRT', 'CU_JIT_REFERENCED_KERNEL_COUNT',
7022
+ 'CU_JIT_REFERENCED_KERNEL_NAMES',
7023
+ 'CU_JIT_REFERENCED_VARIABLE_COUNT',
7024
+ 'CU_JIT_REFERENCED_VARIABLE_NAMES', 'CU_JIT_TARGET',
5282
7025
  'CU_JIT_TARGET_FROM_CUCONTEXT', 'CU_JIT_THREADS_PER_BLOCK',
5283
- 'CU_JIT_WALL_TIME',
5284
- 'CU_KERNEL_NODE_ATTRIBUTE_ACCESS_POLICY_WINDOW',
5285
- 'CU_KERNEL_NODE_ATTRIBUTE_COOPERATIVE',
7026
+ 'CU_JIT_WALL_TIME', 'CU_LAUNCH_ATTRIBUTE_ACCESS_POLICY_WINDOW',
7027
+ 'CU_LAUNCH_ATTRIBUTE_CLUSTER_DIMENSION',
7028
+ 'CU_LAUNCH_ATTRIBUTE_CLUSTER_SCHEDULING_POLICY_PREFERENCE',
7029
+ 'CU_LAUNCH_ATTRIBUTE_COOPERATIVE', 'CU_LAUNCH_ATTRIBUTE_IGNORE',
7030
+ 'CU_LAUNCH_ATTRIBUTE_MEM_SYNC_DOMAIN',
7031
+ 'CU_LAUNCH_ATTRIBUTE_MEM_SYNC_DOMAIN_MAP',
7032
+ 'CU_LAUNCH_ATTRIBUTE_PRIORITY',
7033
+ 'CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_EVENT',
7034
+ 'CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_STREAM_SERIALIZATION',
7035
+ 'CU_LAUNCH_ATTRIBUTE_SYNCHRONIZATION_POLICY',
7036
+ 'CU_LAUNCH_MEM_SYNC_DOMAIN_DEFAULT',
7037
+ 'CU_LAUNCH_MEM_SYNC_DOMAIN_REMOTE',
7038
+ 'CU_LIBRARY_BINARY_IS_PRESERVED',
7039
+ 'CU_LIBRARY_HOST_UNIVERSAL_FUNCTION_AND_DATA_TABLE',
7040
+ 'CU_LIBRARY_NUM_OPTIONS',
5286
7041
  'CU_LIMIT_DEV_RUNTIME_PENDING_LAUNCH_COUNT',
5287
7042
  'CU_LIMIT_DEV_RUNTIME_SYNC_DEPTH', 'CU_LIMIT_MALLOC_HEAP_SIZE',
5288
7043
  'CU_LIMIT_MAX', 'CU_LIMIT_MAX_L2_FETCH_GRANULARITY',
@@ -5321,7 +7076,10 @@ __all__ = \
5321
7076
  'CU_MEM_RANGE_ATTRIBUTE_ACCESSED_BY',
5322
7077
  'CU_MEM_RANGE_ATTRIBUTE_LAST_PREFETCH_LOCATION',
5323
7078
  'CU_MEM_RANGE_ATTRIBUTE_PREFERRED_LOCATION',
5324
- 'CU_MEM_RANGE_ATTRIBUTE_READ_MOSTLY', 'CU_OCCUPANCY_DEFAULT',
7079
+ 'CU_MEM_RANGE_ATTRIBUTE_READ_MOSTLY',
7080
+ 'CU_MEM_RANGE_HANDLE_TYPE_DMA_BUF_FD',
7081
+ 'CU_MEM_RANGE_HANDLE_TYPE_MAX', 'CU_MODULE_EAGER_LOADING',
7082
+ 'CU_MODULE_LAZY_LOADING', 'CU_OCCUPANCY_DEFAULT',
5325
7083
  'CU_OCCUPANCY_DISABLE_CACHING_OVERRIDE',
5326
7084
  'CU_POINTER_ATTRIBUTE_ACCESS_FLAGS',
5327
7085
  'CU_POINTER_ATTRIBUTE_ACCESS_FLAG_NONE',
@@ -5335,6 +7093,9 @@ __all__ = \
5335
7093
  'CU_POINTER_ATTRIBUTE_IS_GPU_DIRECT_RDMA_CAPABLE',
5336
7094
  'CU_POINTER_ATTRIBUTE_IS_LEGACY_CUDA_IPC_CAPABLE',
5337
7095
  'CU_POINTER_ATTRIBUTE_IS_MANAGED', 'CU_POINTER_ATTRIBUTE_MAPPED',
7096
+ 'CU_POINTER_ATTRIBUTE_MAPPING_BASE_ADDR',
7097
+ 'CU_POINTER_ATTRIBUTE_MAPPING_SIZE',
7098
+ 'CU_POINTER_ATTRIBUTE_MEMORY_BLOCK_ID',
5338
7099
  'CU_POINTER_ATTRIBUTE_MEMORY_TYPE',
5339
7100
  'CU_POINTER_ATTRIBUTE_MEMPOOL_HANDLE',
5340
7101
  'CU_POINTER_ATTRIBUTE_P2P_TOKENS',
@@ -5370,13 +7131,13 @@ __all__ = \
5370
7131
  'CU_SHARED_MEM_CONFIG_EIGHT_BYTE_BANK_SIZE',
5371
7132
  'CU_SHARED_MEM_CONFIG_FOUR_BYTE_BANK_SIZE',
5372
7133
  'CU_STREAM_ADD_CAPTURE_DEPENDENCIES',
5373
- 'CU_STREAM_ATTRIBUTE_ACCESS_POLICY_WINDOW',
5374
- 'CU_STREAM_ATTRIBUTE_SYNCHRONIZATION_POLICY',
5375
7134
  'CU_STREAM_CAPTURE_MODE_GLOBAL', 'CU_STREAM_CAPTURE_MODE_RELAXED',
5376
7135
  'CU_STREAM_CAPTURE_MODE_THREAD_LOCAL',
5377
7136
  'CU_STREAM_CAPTURE_STATUS_ACTIVE',
5378
7137
  'CU_STREAM_CAPTURE_STATUS_INVALIDATED',
5379
7138
  'CU_STREAM_CAPTURE_STATUS_NONE', 'CU_STREAM_DEFAULT',
7139
+ 'CU_STREAM_MEMORY_BARRIER_TYPE_GPU',
7140
+ 'CU_STREAM_MEMORY_BARRIER_TYPE_SYS', 'CU_STREAM_MEM_OP_BARRIER',
5380
7141
  'CU_STREAM_MEM_OP_FLUSH_REMOTE_WRITES',
5381
7142
  'CU_STREAM_MEM_OP_WAIT_VALUE_32',
5382
7143
  'CU_STREAM_MEM_OP_WAIT_VALUE_64',
@@ -5388,8 +7149,7 @@ __all__ = \
5388
7149
  'CU_STREAM_WRITE_VALUE_DEFAULT',
5389
7150
  'CU_STREAM_WRITE_VALUE_NO_MEMORY_BARRIER', 'CU_SYNC_POLICY_AUTO',
5390
7151
  'CU_SYNC_POLICY_BLOCKING_SYNC', 'CU_SYNC_POLICY_SPIN',
5391
- 'CU_SYNC_POLICY_YIELD', 'CU_TARGET_COMPUTE_20',
5392
- 'CU_TARGET_COMPUTE_21', 'CU_TARGET_COMPUTE_30',
7152
+ 'CU_SYNC_POLICY_YIELD', 'CU_TARGET_COMPUTE_30',
5393
7153
  'CU_TARGET_COMPUTE_32', 'CU_TARGET_COMPUTE_35',
5394
7154
  'CU_TARGET_COMPUTE_37', 'CU_TARGET_COMPUTE_50',
5395
7155
  'CU_TARGET_COMPUTE_52', 'CU_TARGET_COMPUTE_53',
@@ -5397,39 +7157,68 @@ __all__ = \
5397
7157
  'CU_TARGET_COMPUTE_62', 'CU_TARGET_COMPUTE_70',
5398
7158
  'CU_TARGET_COMPUTE_72', 'CU_TARGET_COMPUTE_75',
5399
7159
  'CU_TARGET_COMPUTE_80', 'CU_TARGET_COMPUTE_86',
5400
- 'CU_TR_ADDRESS_MODE_BORDER', 'CU_TR_ADDRESS_MODE_CLAMP',
5401
- 'CU_TR_ADDRESS_MODE_MIRROR', 'CU_TR_ADDRESS_MODE_WRAP',
5402
- 'CU_TR_FILTER_MODE_LINEAR', 'CU_TR_FILTER_MODE_POINT',
5403
- 'CU_USER_OBJECT_NO_DESTRUCTOR_SYNC', 'CUaccessPolicyWindow',
5404
- 'CUaccessPolicyWindow_v1', 'CUaccessProperty',
5405
- 'CUaccessProperty__enumvalues', 'CUaccessProperty_enum',
5406
- 'CUaddress_mode', 'CUaddress_mode__enumvalues',
5407
- 'CUaddress_mode_enum', 'CUarray', 'CUarrayMapInfo',
5408
- 'CUarrayMapInfo_v1', 'CUarraySparseSubresourceType',
7160
+ 'CU_TARGET_COMPUTE_87', 'CU_TARGET_COMPUTE_89',
7161
+ 'CU_TARGET_COMPUTE_90', 'CU_TARGET_COMPUTE_90A',
7162
+ 'CU_TENSOR_MAP_DATA_TYPE_BFLOAT16',
7163
+ 'CU_TENSOR_MAP_DATA_TYPE_FLOAT16',
7164
+ 'CU_TENSOR_MAP_DATA_TYPE_FLOAT32',
7165
+ 'CU_TENSOR_MAP_DATA_TYPE_FLOAT32_FTZ',
7166
+ 'CU_TENSOR_MAP_DATA_TYPE_FLOAT64',
7167
+ 'CU_TENSOR_MAP_DATA_TYPE_INT32', 'CU_TENSOR_MAP_DATA_TYPE_INT64',
7168
+ 'CU_TENSOR_MAP_DATA_TYPE_TFLOAT32',
7169
+ 'CU_TENSOR_MAP_DATA_TYPE_TFLOAT32_FTZ',
7170
+ 'CU_TENSOR_MAP_DATA_TYPE_UINT16',
7171
+ 'CU_TENSOR_MAP_DATA_TYPE_UINT32',
7172
+ 'CU_TENSOR_MAP_DATA_TYPE_UINT64', 'CU_TENSOR_MAP_DATA_TYPE_UINT8',
7173
+ 'CU_TENSOR_MAP_FLOAT_OOB_FILL_NAN_REQUEST_ZERO_FMA',
7174
+ 'CU_TENSOR_MAP_FLOAT_OOB_FILL_NONE',
7175
+ 'CU_TENSOR_MAP_INTERLEAVE_16B', 'CU_TENSOR_MAP_INTERLEAVE_32B',
7176
+ 'CU_TENSOR_MAP_INTERLEAVE_NONE',
7177
+ 'CU_TENSOR_MAP_L2_PROMOTION_L2_128B',
7178
+ 'CU_TENSOR_MAP_L2_PROMOTION_L2_256B',
7179
+ 'CU_TENSOR_MAP_L2_PROMOTION_L2_64B',
7180
+ 'CU_TENSOR_MAP_L2_PROMOTION_NONE', 'CU_TENSOR_MAP_SWIZZLE_128B',
7181
+ 'CU_TENSOR_MAP_SWIZZLE_32B', 'CU_TENSOR_MAP_SWIZZLE_64B',
7182
+ 'CU_TENSOR_MAP_SWIZZLE_NONE', 'CU_TR_ADDRESS_MODE_BORDER',
7183
+ 'CU_TR_ADDRESS_MODE_CLAMP', 'CU_TR_ADDRESS_MODE_MIRROR',
7184
+ 'CU_TR_ADDRESS_MODE_WRAP', 'CU_TR_FILTER_MODE_LINEAR',
7185
+ 'CU_TR_FILTER_MODE_POINT', 'CU_USER_OBJECT_NO_DESTRUCTOR_SYNC',
7186
+ 'CUaccessPolicyWindow', 'CUaccessPolicyWindow_v1',
7187
+ 'CUaccessProperty', 'CUaccessProperty__enumvalues',
7188
+ 'CUaccessProperty_enum', 'CUaddress_mode',
7189
+ 'CUaddress_mode__enumvalues', 'CUaddress_mode_enum', 'CUarray',
7190
+ 'CUarrayMapInfo', 'CUarrayMapInfo_v1',
7191
+ 'CUarraySparseSubresourceType',
5409
7192
  'CUarraySparseSubresourceType__enumvalues',
5410
7193
  'CUarraySparseSubresourceType_enum', 'CUarray_cubemap_face',
5411
7194
  'CUarray_cubemap_face__enumvalues', 'CUarray_cubemap_face_enum',
5412
7195
  'CUarray_format', 'CUarray_format__enumvalues',
5413
- 'CUarray_format_enum', 'CUcomputemode',
7196
+ 'CUarray_format_enum', 'CUclusterSchedulingPolicy',
7197
+ 'CUclusterSchedulingPolicy__enumvalues',
7198
+ 'CUclusterSchedulingPolicy_enum', 'CUcomputemode',
5414
7199
  'CUcomputemode__enumvalues', 'CUcomputemode_enum', 'CUcontext',
5415
7200
  'CUctx_flags', 'CUctx_flags__enumvalues', 'CUctx_flags_enum',
5416
7201
  'CUdevice', 'CUdevice_P2PAttribute',
5417
7202
  'CUdevice_P2PAttribute__enumvalues', 'CUdevice_P2PAttribute_enum',
5418
7203
  'CUdevice_attribute', 'CUdevice_attribute__enumvalues',
5419
7204
  'CUdevice_attribute_enum', 'CUdevice_v1', 'CUdeviceptr',
5420
- 'CUdeviceptr_v2', 'CUdevprop', 'CUdevprop_v1',
7205
+ 'CUdeviceptr_v1', 'CUdeviceptr_v2', 'CUdevprop', 'CUdevprop_v1',
7206
+ 'CUdriverProcAddressQueryResult',
7207
+ 'CUdriverProcAddressQueryResult__enumvalues',
7208
+ 'CUdriverProcAddressQueryResult_enum',
5421
7209
  'CUdriverProcAddress_flags',
5422
7210
  'CUdriverProcAddress_flags__enumvalues',
5423
7211
  'CUdriverProcAddress_flags_enum', 'CUevent', 'CUevent_flags',
5424
7212
  'CUevent_flags__enumvalues', 'CUevent_flags_enum',
5425
7213
  'CUevent_record_flags', 'CUevent_record_flags__enumvalues',
5426
- 'CUevent_record_flags_enum', 'CUevent_wait_flags',
5427
- 'CUevent_wait_flags__enumvalues', 'CUevent_wait_flags_enum',
5428
- 'CUexecAffinityParam', 'CUexecAffinityParam_v1',
5429
- 'CUexecAffinitySmCount', 'CUexecAffinitySmCount_v1',
5430
- 'CUexecAffinityType', 'CUexecAffinityType__enumvalues',
5431
- 'CUexecAffinityType_enum', 'CUexternalMemory',
5432
- 'CUexternalMemoryHandleType',
7214
+ 'CUevent_record_flags_enum', 'CUevent_sched_flags',
7215
+ 'CUevent_sched_flags__enumvalues', 'CUevent_sched_flags_enum',
7216
+ 'CUevent_wait_flags', 'CUevent_wait_flags__enumvalues',
7217
+ 'CUevent_wait_flags_enum', 'CUexecAffinityParam',
7218
+ 'CUexecAffinityParam_v1', 'CUexecAffinitySmCount',
7219
+ 'CUexecAffinitySmCount_v1', 'CUexecAffinityType',
7220
+ 'CUexecAffinityType__enumvalues', 'CUexecAffinityType_enum',
7221
+ 'CUexternalMemory', 'CUexternalMemoryHandleType',
5433
7222
  'CUexternalMemoryHandleType__enumvalues',
5434
7223
  'CUexternalMemoryHandleType_enum', 'CUexternalSemaphore',
5435
7224
  'CUexternalSemaphoreHandleType',
@@ -5450,8 +7239,11 @@ __all__ = \
5450
7239
  'CUfunction_attribute_enum', 'CUgraph', 'CUgraphDebugDot_flags',
5451
7240
  'CUgraphDebugDot_flags__enumvalues', 'CUgraphDebugDot_flags_enum',
5452
7241
  'CUgraphExec', 'CUgraphExecUpdateResult',
7242
+ 'CUgraphExecUpdateResultInfo', 'CUgraphExecUpdateResultInfo_v1',
5453
7243
  'CUgraphExecUpdateResult__enumvalues',
5454
- 'CUgraphExecUpdateResult_enum', 'CUgraphInstantiate_flags',
7244
+ 'CUgraphExecUpdateResult_enum', 'CUgraphInstantiateResult',
7245
+ 'CUgraphInstantiateResult__enumvalues',
7246
+ 'CUgraphInstantiateResult_enum', 'CUgraphInstantiate_flags',
5455
7247
  'CUgraphInstantiate_flags__enumvalues',
5456
7248
  'CUgraphInstantiate_flags_enum', 'CUgraphMem_attribute',
5457
7249
  'CUgraphMem_attribute__enumvalues', 'CUgraphMem_attribute_enum',
@@ -5470,9 +7262,16 @@ __all__ = \
5470
7262
  'CUjit_fallback', 'CUjit_fallback__enumvalues',
5471
7263
  'CUjit_fallback_enum', 'CUjit_option', 'CUjit_option__enumvalues',
5472
7264
  'CUjit_option_enum', 'CUjit_target', 'CUjit_target__enumvalues',
5473
- 'CUjit_target_enum', 'CUkernelNodeAttrID',
5474
- 'CUkernelNodeAttrID__enumvalues', 'CUkernelNodeAttrID_enum',
5475
- 'CUkernelNodeAttrValue', 'CUkernelNodeAttrValue_v1', 'CUlimit',
7265
+ 'CUjit_target_enum', 'CUkernel', 'CUkernelNodeAttrID',
7266
+ 'CUkernelNodeAttrID__enumvalues', 'CUkernelNodeAttrValue',
7267
+ 'CUkernelNodeAttrValue_v1', 'CUlaunchAttribute',
7268
+ 'CUlaunchAttributeID', 'CUlaunchAttributeID__enumvalues',
7269
+ 'CUlaunchAttributeID_enum', 'CUlaunchAttributeValue',
7270
+ 'CUlaunchConfig', 'CUlaunchMemSyncDomain',
7271
+ 'CUlaunchMemSyncDomainMap', 'CUlaunchMemSyncDomain__enumvalues',
7272
+ 'CUlaunchMemSyncDomain_enum', 'CUlibrary',
7273
+ 'CUlibraryHostUniversalFunctionAndDataTable', 'CUlibraryOption',
7274
+ 'CUlibraryOption__enumvalues', 'CUlibraryOption_enum', 'CUlimit',
5476
7275
  'CUlimit__enumvalues', 'CUlimit_enum', 'CUlinkState',
5477
7276
  'CUmemAccessDesc', 'CUmemAccessDesc_v1', 'CUmemAccess_flags',
5478
7277
  'CUmemAccess_flags__enumvalues', 'CUmemAccess_flags_enum',
@@ -5497,22 +7296,25 @@ __all__ = \
5497
7296
  'CUmemPoolProps', 'CUmemPoolProps_v1', 'CUmemPoolPtrExportData',
5498
7297
  'CUmemPoolPtrExportData_v1', 'CUmemPool_attribute',
5499
7298
  'CUmemPool_attribute__enumvalues', 'CUmemPool_attribute_enum',
5500
- 'CUmem_advise', 'CUmem_advise__enumvalues', 'CUmem_advise_enum',
7299
+ 'CUmemRangeHandleType', 'CUmemRangeHandleType__enumvalues',
7300
+ 'CUmemRangeHandleType_enum', 'CUmem_advise',
7301
+ 'CUmem_advise__enumvalues', 'CUmem_advise_enum',
5501
7302
  'CUmem_range_attribute', 'CUmem_range_attribute__enumvalues',
5502
7303
  'CUmem_range_attribute_enum', 'CUmemoryPool', 'CUmemorytype',
5503
7304
  'CUmemorytype__enumvalues', 'CUmemorytype_enum',
5504
- 'CUmipmappedArray', 'CUmodule', 'CUoccupancyB2DSize',
5505
- 'CUoccupancy_flags', 'CUoccupancy_flags__enumvalues',
5506
- 'CUoccupancy_flags_enum', 'CUpointer_attribute',
5507
- 'CUpointer_attribute__enumvalues', 'CUpointer_attribute_enum',
5508
- 'CUresourceViewFormat', 'CUresourceViewFormat__enumvalues',
5509
- 'CUresourceViewFormat_enum', 'CUresourcetype',
5510
- 'CUresourcetype__enumvalues', 'CUresourcetype_enum', 'CUresult',
5511
- 'CUresult__enumvalues', 'CUshared_carveout',
5512
- 'CUshared_carveout__enumvalues', 'CUshared_carveout_enum',
5513
- 'CUsharedconfig', 'CUsharedconfig__enumvalues',
5514
- 'CUsharedconfig_enum', 'CUstream', 'CUstreamAttrID',
5515
- 'CUstreamAttrID__enumvalues', 'CUstreamAttrID_enum',
7305
+ 'CUmipmappedArray', 'CUmodule', 'CUmoduleLoadingMode',
7306
+ 'CUmoduleLoadingMode__enumvalues', 'CUmoduleLoadingMode_enum',
7307
+ 'CUoccupancyB2DSize', 'CUoccupancy_flags',
7308
+ 'CUoccupancy_flags__enumvalues', 'CUoccupancy_flags_enum',
7309
+ 'CUpointer_attribute', 'CUpointer_attribute__enumvalues',
7310
+ 'CUpointer_attribute_enum', 'CUresourceViewFormat',
7311
+ 'CUresourceViewFormat__enumvalues', 'CUresourceViewFormat_enum',
7312
+ 'CUresourcetype', 'CUresourcetype__enumvalues',
7313
+ 'CUresourcetype_enum', 'CUresult', 'CUresult__enumvalues',
7314
+ 'CUshared_carveout', 'CUshared_carveout__enumvalues',
7315
+ 'CUshared_carveout_enum', 'CUsharedconfig',
7316
+ 'CUsharedconfig__enumvalues', 'CUsharedconfig_enum', 'CUstream',
7317
+ 'CUstreamAttrID', 'CUstreamAttrID__enumvalues',
5516
7318
  'CUstreamAttrValue', 'CUstreamAttrValue_v1',
5517
7319
  'CUstreamBatchMemOpParams', 'CUstreamBatchMemOpParams_v1',
5518
7320
  'CUstreamBatchMemOpType', 'CUstreamBatchMemOpType__enumvalues',
@@ -5520,6 +7322,9 @@ __all__ = \
5520
7322
  'CUstreamCaptureMode', 'CUstreamCaptureMode__enumvalues',
5521
7323
  'CUstreamCaptureMode_enum', 'CUstreamCaptureStatus',
5522
7324
  'CUstreamCaptureStatus__enumvalues', 'CUstreamCaptureStatus_enum',
7325
+ 'CUstreamMemoryBarrier_flags',
7326
+ 'CUstreamMemoryBarrier_flags__enumvalues',
7327
+ 'CUstreamMemoryBarrier_flags_enum',
5523
7328
  'CUstreamUpdateCaptureDependencies_flags',
5524
7329
  'CUstreamUpdateCaptureDependencies_flags__enumvalues',
5525
7330
  'CUstreamUpdateCaptureDependencies_flags_enum',
@@ -5530,26 +7335,46 @@ __all__ = \
5530
7335
  'CUstream_flags__enumvalues', 'CUstream_flags_enum',
5531
7336
  'CUsurfObject', 'CUsurfObject_v1', 'CUsurfref',
5532
7337
  'CUsynchronizationPolicy', 'CUsynchronizationPolicy__enumvalues',
5533
- 'CUsynchronizationPolicy_enum', 'CUtexObject', 'CUtexObject_v1',
5534
- 'CUtexref', 'CUuserObject', 'CUuserObjectRetain_flags',
7338
+ 'CUsynchronizationPolicy_enum', 'CUtensorMap',
7339
+ 'CUtensorMapDataType', 'CUtensorMapDataType__enumvalues',
7340
+ 'CUtensorMapDataType_enum', 'CUtensorMapFloatOOBfill',
7341
+ 'CUtensorMapFloatOOBfill__enumvalues',
7342
+ 'CUtensorMapFloatOOBfill_enum', 'CUtensorMapInterleave',
7343
+ 'CUtensorMapInterleave__enumvalues', 'CUtensorMapInterleave_enum',
7344
+ 'CUtensorMapL2promotion', 'CUtensorMapL2promotion__enumvalues',
7345
+ 'CUtensorMapL2promotion_enum', 'CUtensorMapSwizzle',
7346
+ 'CUtensorMapSwizzle__enumvalues', 'CUtensorMapSwizzle_enum',
7347
+ 'CUtexObject', 'CUtexObject_v1', 'CUtexref', 'CUuserObject',
7348
+ 'CUuserObjectRetain_flags',
5535
7349
  'CUuserObjectRetain_flags__enumvalues',
5536
7350
  'CUuserObjectRetain_flags_enum', 'CUuserObject_flags',
5537
7351
  'CUuserObject_flags__enumvalues', 'CUuserObject_flags_enum',
5538
- 'CUuuid', 'cuArray3DCreate_v2', 'cuArray3DGetDescriptor_v2',
5539
- 'cuArrayCreate_v2', 'cuArrayDestroy', 'cuArrayGetDescriptor_v2',
7352
+ 'CUuuid', 'NVCL_CTX_SCHED_AUTO', 'NVCL_CTX_SCHED_BLOCKING_SYNC',
7353
+ 'NVCL_CTX_SCHED_SPIN', 'NVCL_CTX_SCHED_YIELD',
7354
+ 'NVCL_EVENT_SCHED_AUTO', 'NVCL_EVENT_SCHED_BLOCKING_SYNC',
7355
+ 'NVCL_EVENT_SCHED_SPIN', 'NVCL_EVENT_SCHED_YIELD',
7356
+ 'cl_context_flags', 'cl_context_flags__enumvalues',
7357
+ 'cl_context_flags_enum', 'cl_event_flags',
7358
+ 'cl_event_flags__enumvalues', 'cl_event_flags_enum',
7359
+ 'cuArray3DCreate', 'cuArray3DCreate_v2', 'cuArray3DGetDescriptor',
7360
+ 'cuArray3DGetDescriptor_v2', 'cuArrayCreate', 'cuArrayCreate_v2',
7361
+ 'cuArrayDestroy', 'cuArrayGetDescriptor',
7362
+ 'cuArrayGetDescriptor_v2', 'cuArrayGetMemoryRequirements',
5540
7363
  'cuArrayGetPlane', 'cuArrayGetSparseProperties', 'cuCtxAttach',
5541
- 'cuCtxCreate_v2', 'cuCtxCreate_v3', 'cuCtxDestroy_v2',
5542
- 'cuCtxDetach', 'cuCtxDisablePeerAccess', 'cuCtxEnablePeerAccess',
5543
- 'cuCtxGetApiVersion', 'cuCtxGetCacheConfig', 'cuCtxGetCurrent',
5544
- 'cuCtxGetDevice', 'cuCtxGetExecAffinity', 'cuCtxGetFlags',
7364
+ 'cuCtxCreate', 'cuCtxCreate_v2', 'cuCtxCreate_v3', 'cuCtxDestroy',
7365
+ 'cuCtxDestroy_v2', 'cuCtxDetach', 'cuCtxDisablePeerAccess',
7366
+ 'cuCtxEnablePeerAccess', 'cuCtxGetApiVersion',
7367
+ 'cuCtxGetCacheConfig', 'cuCtxGetCurrent', 'cuCtxGetDevice',
7368
+ 'cuCtxGetExecAffinity', 'cuCtxGetFlags', 'cuCtxGetId',
5545
7369
  'cuCtxGetLimit', 'cuCtxGetSharedMemConfig',
5546
- 'cuCtxGetStreamPriorityRange', 'cuCtxPopCurrent_v2',
5547
- 'cuCtxPushCurrent_v2', 'cuCtxResetPersistingL2Cache',
5548
- 'cuCtxSetCacheConfig', 'cuCtxSetCurrent', 'cuCtxSetLimit',
5549
- 'cuCtxSetSharedMemConfig', 'cuCtxSynchronize',
5550
- 'cuDestroyExternalMemory', 'cuDestroyExternalSemaphore',
5551
- 'cuDeviceCanAccessPeer', 'cuDeviceComputeCapability',
5552
- 'cuDeviceGet', 'cuDeviceGetAttribute', 'cuDeviceGetByPCIBusId',
7370
+ 'cuCtxGetStreamPriorityRange', 'cuCtxPopCurrent',
7371
+ 'cuCtxPopCurrent_v2', 'cuCtxPushCurrent', 'cuCtxPushCurrent_v2',
7372
+ 'cuCtxResetPersistingL2Cache', 'cuCtxSetCacheConfig',
7373
+ 'cuCtxSetCurrent', 'cuCtxSetLimit', 'cuCtxSetSharedMemConfig',
7374
+ 'cuCtxSynchronize', 'cuDestroyExternalMemory',
7375
+ 'cuDestroyExternalSemaphore', 'cuDeviceCanAccessPeer',
7376
+ 'cuDeviceComputeCapability', 'cuDeviceGet',
7377
+ 'cuDeviceGetAttribute', 'cuDeviceGetByPCIBusId',
5553
7378
  'cuDeviceGetCount', 'cuDeviceGetDefaultMemPool',
5554
7379
  'cuDeviceGetExecAffinitySupport', 'cuDeviceGetGraphMemAttribute',
5555
7380
  'cuDeviceGetLuid', 'cuDeviceGetMemPool', 'cuDeviceGetName',
@@ -5557,149 +7382,239 @@ __all__ = \
5557
7382
  'cuDeviceGetPCIBusId', 'cuDeviceGetProperties',
5558
7383
  'cuDeviceGetTexture1DLinearMaxWidth', 'cuDeviceGetUuid',
5559
7384
  'cuDeviceGetUuid_v2', 'cuDeviceGraphMemTrim',
5560
- 'cuDevicePrimaryCtxGetState', 'cuDevicePrimaryCtxRelease_v2',
7385
+ 'cuDevicePrimaryCtxGetState', 'cuDevicePrimaryCtxRelease',
7386
+ 'cuDevicePrimaryCtxRelease_v2', 'cuDevicePrimaryCtxReset',
5561
7387
  'cuDevicePrimaryCtxReset_v2', 'cuDevicePrimaryCtxRetain',
5562
- 'cuDevicePrimaryCtxSetFlags_v2', 'cuDeviceSetGraphMemAttribute',
5563
- 'cuDeviceSetMemPool', 'cuDeviceTotalMem_v2', 'cuDriverGetVersion',
5564
- 'cuEventCreate', 'cuEventDestroy_v2', 'cuEventElapsedTime',
5565
- 'cuEventQuery', 'cuEventRecord', 'cuEventRecordWithFlags',
5566
- 'cuEventSynchronize', 'cuExternalMemoryGetMappedBuffer',
7388
+ 'cuDevicePrimaryCtxSetFlags', 'cuDevicePrimaryCtxSetFlags_v2',
7389
+ 'cuDeviceSetGraphMemAttribute', 'cuDeviceSetMemPool',
7390
+ 'cuDeviceTotalMem', 'cuDeviceTotalMem_v2', 'cuDriverGetVersion',
7391
+ 'cuEventCreate', 'cuEventDestroy', 'cuEventDestroy_v2',
7392
+ 'cuEventElapsedTime', 'cuEventQuery', 'cuEventRecord',
7393
+ 'cuEventRecordWithFlags', 'cuEventRecordWithFlags_ptsz',
7394
+ 'cuEventRecord_ptsz', 'cuEventSynchronize',
7395
+ 'cuExternalMemoryGetMappedBuffer',
5567
7396
  'cuExternalMemoryGetMappedMipmappedArray',
5568
7397
  'cuFlushGPUDirectRDMAWrites', 'cuFuncGetAttribute',
5569
7398
  'cuFuncGetModule', 'cuFuncSetAttribute', 'cuFuncSetBlockShape',
5570
7399
  'cuFuncSetCacheConfig', 'cuFuncSetSharedMemConfig',
5571
7400
  'cuFuncSetSharedSize', 'cuGetErrorName', 'cuGetErrorString',
5572
- 'cuGetExportTable', 'cuGetProcAddress',
5573
- 'cuGraphAddChildGraphNode', 'cuGraphAddDependencies',
5574
- 'cuGraphAddEmptyNode', 'cuGraphAddEventRecordNode',
5575
- 'cuGraphAddEventWaitNode',
7401
+ 'cuGetExportTable', 'cuGetProcAddress', 'cuGetProcAddress_v2',
7402
+ 'cuGraphAddBatchMemOpNode', 'cuGraphAddChildGraphNode',
7403
+ 'cuGraphAddDependencies', 'cuGraphAddEmptyNode',
7404
+ 'cuGraphAddEventRecordNode', 'cuGraphAddEventWaitNode',
5576
7405
  'cuGraphAddExternalSemaphoresSignalNode',
5577
7406
  'cuGraphAddExternalSemaphoresWaitNode', 'cuGraphAddHostNode',
5578
- 'cuGraphAddKernelNode', 'cuGraphAddMemAllocNode',
5579
- 'cuGraphAddMemFreeNode', 'cuGraphAddMemcpyNode',
5580
- 'cuGraphAddMemsetNode', 'cuGraphChildGraphNodeGetGraph',
7407
+ 'cuGraphAddKernelNode', 'cuGraphAddKernelNode_v2',
7408
+ 'cuGraphAddMemAllocNode', 'cuGraphAddMemFreeNode',
7409
+ 'cuGraphAddMemcpyNode', 'cuGraphAddMemsetNode',
7410
+ 'cuGraphBatchMemOpNodeGetParams',
7411
+ 'cuGraphBatchMemOpNodeSetParams', 'cuGraphChildGraphNodeGetGraph',
5581
7412
  'cuGraphClone', 'cuGraphCreate', 'cuGraphDebugDotPrint',
5582
7413
  'cuGraphDestroy', 'cuGraphDestroyNode',
5583
7414
  'cuGraphEventRecordNodeGetEvent',
5584
7415
  'cuGraphEventRecordNodeSetEvent', 'cuGraphEventWaitNodeGetEvent',
5585
7416
  'cuGraphEventWaitNodeSetEvent',
7417
+ 'cuGraphExecBatchMemOpNodeSetParams',
5586
7418
  'cuGraphExecChildGraphNodeSetParams', 'cuGraphExecDestroy',
5587
7419
  'cuGraphExecEventRecordNodeSetEvent',
5588
7420
  'cuGraphExecEventWaitNodeSetEvent',
5589
7421
  'cuGraphExecExternalSemaphoresSignalNodeSetParams',
5590
7422
  'cuGraphExecExternalSemaphoresWaitNodeSetParams',
5591
- 'cuGraphExecHostNodeSetParams', 'cuGraphExecKernelNodeSetParams',
7423
+ 'cuGraphExecGetFlags', 'cuGraphExecHostNodeSetParams',
7424
+ 'cuGraphExecKernelNodeSetParams',
7425
+ 'cuGraphExecKernelNodeSetParams_v2',
5592
7426
  'cuGraphExecMemcpyNodeSetParams',
5593
7427
  'cuGraphExecMemsetNodeSetParams', 'cuGraphExecUpdate',
7428
+ 'cuGraphExecUpdate_v2',
5594
7429
  'cuGraphExternalSemaphoresSignalNodeGetParams',
5595
7430
  'cuGraphExternalSemaphoresSignalNodeSetParams',
5596
7431
  'cuGraphExternalSemaphoresWaitNodeGetParams',
5597
7432
  'cuGraphExternalSemaphoresWaitNodeSetParams', 'cuGraphGetEdges',
5598
7433
  'cuGraphGetNodes', 'cuGraphGetRootNodes',
5599
7434
  'cuGraphHostNodeGetParams', 'cuGraphHostNodeSetParams',
5600
- 'cuGraphInstantiateWithFlags', 'cuGraphInstantiate_v2',
7435
+ 'cuGraphInstantiate', 'cuGraphInstantiateWithFlags',
7436
+ 'cuGraphInstantiateWithParams',
7437
+ 'cuGraphInstantiateWithParams_ptsz', 'cuGraphInstantiate_v2',
5601
7438
  'cuGraphKernelNodeCopyAttributes',
5602
7439
  'cuGraphKernelNodeGetAttribute', 'cuGraphKernelNodeGetParams',
5603
- 'cuGraphKernelNodeSetAttribute', 'cuGraphKernelNodeSetParams',
5604
- 'cuGraphLaunch', 'cuGraphMemAllocNodeGetParams',
5605
- 'cuGraphMemFreeNodeGetParams', 'cuGraphMemcpyNodeGetParams',
5606
- 'cuGraphMemcpyNodeSetParams', 'cuGraphMemsetNodeGetParams',
5607
- 'cuGraphMemsetNodeSetParams', 'cuGraphNodeFindInClone',
5608
- 'cuGraphNodeGetDependencies', 'cuGraphNodeGetDependentNodes',
5609
- 'cuGraphNodeGetType', 'cuGraphReleaseUserObject',
5610
- 'cuGraphRemoveDependencies', 'cuGraphRetainUserObject',
5611
- 'cuGraphUpload', 'cuGraphicsMapResources',
7440
+ 'cuGraphKernelNodeGetParams_v2', 'cuGraphKernelNodeSetAttribute',
7441
+ 'cuGraphKernelNodeSetParams', 'cuGraphKernelNodeSetParams_v2',
7442
+ 'cuGraphLaunch', 'cuGraphLaunch_ptsz',
7443
+ 'cuGraphMemAllocNodeGetParams', 'cuGraphMemFreeNodeGetParams',
7444
+ 'cuGraphMemcpyNodeGetParams', 'cuGraphMemcpyNodeSetParams',
7445
+ 'cuGraphMemsetNodeGetParams', 'cuGraphMemsetNodeSetParams',
7446
+ 'cuGraphNodeFindInClone', 'cuGraphNodeGetDependencies',
7447
+ 'cuGraphNodeGetDependentNodes', 'cuGraphNodeGetEnabled',
7448
+ 'cuGraphNodeGetType', 'cuGraphNodeSetEnabled',
7449
+ 'cuGraphReleaseUserObject', 'cuGraphRemoveDependencies',
7450
+ 'cuGraphRetainUserObject', 'cuGraphUpload', 'cuGraphUpload_ptsz',
7451
+ 'cuGraphicsMapResources', 'cuGraphicsMapResources_ptsz',
5612
7452
  'cuGraphicsResourceGetMappedMipmappedArray',
7453
+ 'cuGraphicsResourceGetMappedPointer',
5613
7454
  'cuGraphicsResourceGetMappedPointer_v2',
7455
+ 'cuGraphicsResourceSetMapFlags',
5614
7456
  'cuGraphicsResourceSetMapFlags_v2',
5615
7457
  'cuGraphicsSubResourceGetMappedArray', 'cuGraphicsUnmapResources',
5616
- 'cuGraphicsUnregisterResource', 'cuImportExternalMemory',
5617
- 'cuImportExternalSemaphore', 'cuInit', 'cuIpcCloseMemHandle',
5618
- 'cuIpcGetEventHandle', 'cuIpcGetMemHandle',
5619
- 'cuIpcOpenEventHandle', 'cuIpcOpenMemHandle_v2', 'cuLaunch',
5620
- 'cuLaunchCooperativeKernel',
5621
- 'cuLaunchCooperativeKernelMultiDevice', 'cuLaunchGrid',
5622
- 'cuLaunchGridAsync', 'cuLaunchHostFunc', 'cuLaunchKernel',
5623
- 'cuLinkAddData_v2', 'cuLinkAddFile_v2', 'cuLinkComplete',
5624
- 'cuLinkCreate_v2', 'cuLinkDestroy', 'cuMemAddressFree',
5625
- 'cuMemAddressReserve', 'cuMemAdvise', 'cuMemAllocAsync',
5626
- 'cuMemAllocFromPoolAsync', 'cuMemAllocHost_v2',
5627
- 'cuMemAllocManaged', 'cuMemAllocPitch_v2', 'cuMemAlloc_v2',
5628
- 'cuMemCreate', 'cuMemExportToShareableHandle', 'cuMemFreeAsync',
5629
- 'cuMemFreeHost', 'cuMemFree_v2', 'cuMemGetAccess',
7458
+ 'cuGraphicsUnmapResources_ptsz', 'cuGraphicsUnregisterResource',
7459
+ 'cuImportExternalMemory', 'cuImportExternalSemaphore', 'cuInit',
7460
+ 'cuIpcCloseMemHandle', 'cuIpcGetEventHandle', 'cuIpcGetMemHandle',
7461
+ 'cuIpcOpenEventHandle', 'cuIpcOpenMemHandle',
7462
+ 'cuIpcOpenMemHandle_v2', 'cuKernelGetAttribute',
7463
+ 'cuKernelGetFunction', 'cuKernelSetAttribute',
7464
+ 'cuKernelSetCacheConfig', 'cuLaunch', 'cuLaunchCooperativeKernel',
7465
+ 'cuLaunchCooperativeKernelMultiDevice',
7466
+ 'cuLaunchCooperativeKernel_ptsz', 'cuLaunchGrid',
7467
+ 'cuLaunchGridAsync', 'cuLaunchHostFunc', 'cuLaunchHostFunc_ptsz',
7468
+ 'cuLaunchKernel', 'cuLaunchKernelEx', 'cuLaunchKernelEx_ptsz',
7469
+ 'cuLaunchKernel_ptsz', 'cuLibraryGetGlobal', 'cuLibraryGetKernel',
7470
+ 'cuLibraryGetManaged', 'cuLibraryGetModule',
7471
+ 'cuLibraryGetUnifiedFunction', 'cuLibraryLoadData',
7472
+ 'cuLibraryLoadFromFile', 'cuLibraryUnload', 'cuLinkAddData',
7473
+ 'cuLinkAddData_v2', 'cuLinkAddFile', 'cuLinkAddFile_v2',
7474
+ 'cuLinkComplete', 'cuLinkCreate', 'cuLinkCreate_v2',
7475
+ 'cuLinkDestroy', 'cuMemAddressFree', 'cuMemAddressReserve',
7476
+ 'cuMemAdvise', 'cuMemAlloc', 'cuMemAllocAsync',
7477
+ 'cuMemAllocAsync_ptsz', 'cuMemAllocFromPoolAsync',
7478
+ 'cuMemAllocFromPoolAsync_ptsz', 'cuMemAllocHost',
7479
+ 'cuMemAllocHost_v2', 'cuMemAllocManaged', 'cuMemAllocPitch',
7480
+ 'cuMemAllocPitch_v2', 'cuMemAlloc_v2', 'cuMemCreate',
7481
+ 'cuMemExportToShareableHandle', 'cuMemFree', 'cuMemFreeAsync',
7482
+ 'cuMemFreeAsync_ptsz', 'cuMemFreeHost', 'cuMemFree_v2',
7483
+ 'cuMemGetAccess', 'cuMemGetAddressRange',
5630
7484
  'cuMemGetAddressRange_v2', 'cuMemGetAllocationGranularity',
5631
- 'cuMemGetAllocationPropertiesFromHandle', 'cuMemGetInfo_v2',
5632
- 'cuMemHostAlloc', 'cuMemHostGetDevicePointer_v2',
5633
- 'cuMemHostGetFlags', 'cuMemHostRegister_v2',
7485
+ 'cuMemGetAllocationPropertiesFromHandle',
7486
+ 'cuMemGetHandleForAddressRange', 'cuMemGetInfo',
7487
+ 'cuMemGetInfo_v2', 'cuMemHostAlloc', 'cuMemHostGetDevicePointer',
7488
+ 'cuMemHostGetDevicePointer_v2', 'cuMemHostGetFlags',
7489
+ 'cuMemHostRegister', 'cuMemHostRegister_v2',
5634
7490
  'cuMemHostUnregister', 'cuMemImportFromShareableHandle',
5635
- 'cuMemMap', 'cuMemMapArrayAsync', 'cuMemPoolCreate',
5636
- 'cuMemPoolDestroy', 'cuMemPoolExportPointer',
7491
+ 'cuMemMap', 'cuMemMapArrayAsync', 'cuMemMapArrayAsync_ptsz',
7492
+ 'cuMemPoolCreate', 'cuMemPoolDestroy', 'cuMemPoolExportPointer',
5637
7493
  'cuMemPoolExportToShareableHandle', 'cuMemPoolGetAccess',
5638
7494
  'cuMemPoolGetAttribute', 'cuMemPoolImportFromShareableHandle',
5639
7495
  'cuMemPoolImportPointer', 'cuMemPoolSetAccess',
5640
7496
  'cuMemPoolSetAttribute', 'cuMemPoolTrimTo', 'cuMemPrefetchAsync',
5641
- 'cuMemRangeGetAttribute', 'cuMemRangeGetAttributes',
5642
- 'cuMemRelease', 'cuMemRetainAllocationHandle', 'cuMemSetAccess',
5643
- 'cuMemUnmap', 'cuMemcpy', 'cuMemcpy2DAsync_v2',
5644
- 'cuMemcpy2DUnaligned_v2', 'cuMemcpy2D_v2', 'cuMemcpy3DAsync_v2',
5645
- 'cuMemcpy3DPeer', 'cuMemcpy3DPeerAsync', 'cuMemcpy3D_v2',
5646
- 'cuMemcpyAsync', 'cuMemcpyAtoA_v2', 'cuMemcpyAtoD_v2',
5647
- 'cuMemcpyAtoHAsync_v2', 'cuMemcpyAtoH_v2', 'cuMemcpyDtoA_v2',
5648
- 'cuMemcpyDtoDAsync_v2', 'cuMemcpyDtoD_v2', 'cuMemcpyDtoHAsync_v2',
5649
- 'cuMemcpyDtoH_v2', 'cuMemcpyHtoAAsync_v2', 'cuMemcpyHtoA_v2',
5650
- 'cuMemcpyHtoDAsync_v2', 'cuMemcpyHtoD_v2', 'cuMemcpyPeer',
5651
- 'cuMemcpyPeerAsync', 'cuMemsetD16Async', 'cuMemsetD16_v2',
5652
- 'cuMemsetD2D16Async', 'cuMemsetD2D16_v2', 'cuMemsetD2D32Async',
5653
- 'cuMemsetD2D32_v2', 'cuMemsetD2D8Async', 'cuMemsetD2D8_v2',
5654
- 'cuMemsetD32Async', 'cuMemsetD32_v2', 'cuMemsetD8Async',
5655
- 'cuMemsetD8_v2', 'cuMipmappedArrayCreate',
7497
+ 'cuMemPrefetchAsync_ptsz', 'cuMemRangeGetAttribute',
7498
+ 'cuMemRangeGetAttributes', 'cuMemRelease',
7499
+ 'cuMemRetainAllocationHandle', 'cuMemSetAccess', 'cuMemUnmap',
7500
+ 'cuMemcpy', 'cuMemcpy2D', 'cuMemcpy2DAsync', 'cuMemcpy2DAsync_v2',
7501
+ 'cuMemcpy2DAsync_v2_ptsz', 'cuMemcpy2DUnaligned',
7502
+ 'cuMemcpy2DUnaligned_v2', 'cuMemcpy2DUnaligned_v2_ptds',
7503
+ 'cuMemcpy2D_v2', 'cuMemcpy2D_v2_ptds', 'cuMemcpy3D',
7504
+ 'cuMemcpy3DAsync', 'cuMemcpy3DAsync_v2',
7505
+ 'cuMemcpy3DAsync_v2_ptsz', 'cuMemcpy3DPeer',
7506
+ 'cuMemcpy3DPeerAsync', 'cuMemcpy3DPeerAsync_ptsz',
7507
+ 'cuMemcpy3DPeer_ptds', 'cuMemcpy3D_v2', 'cuMemcpy3D_v2_ptds',
7508
+ 'cuMemcpyAsync', 'cuMemcpyAsync_ptsz', 'cuMemcpyAtoA',
7509
+ 'cuMemcpyAtoA_v2', 'cuMemcpyAtoA_v2_ptds', 'cuMemcpyAtoD',
7510
+ 'cuMemcpyAtoD_v2', 'cuMemcpyAtoD_v2_ptds', 'cuMemcpyAtoH',
7511
+ 'cuMemcpyAtoHAsync', 'cuMemcpyAtoHAsync_v2',
7512
+ 'cuMemcpyAtoHAsync_v2_ptsz', 'cuMemcpyAtoH_v2',
7513
+ 'cuMemcpyAtoH_v2_ptds', 'cuMemcpyDtoA', 'cuMemcpyDtoA_v2',
7514
+ 'cuMemcpyDtoA_v2_ptds', 'cuMemcpyDtoD', 'cuMemcpyDtoDAsync',
7515
+ 'cuMemcpyDtoDAsync_v2', 'cuMemcpyDtoDAsync_v2_ptsz',
7516
+ 'cuMemcpyDtoD_v2', 'cuMemcpyDtoD_v2_ptds', 'cuMemcpyDtoH',
7517
+ 'cuMemcpyDtoHAsync', 'cuMemcpyDtoHAsync_v2',
7518
+ 'cuMemcpyDtoHAsync_v2_ptsz', 'cuMemcpyDtoH_v2',
7519
+ 'cuMemcpyDtoH_v2_ptds', 'cuMemcpyHtoA', 'cuMemcpyHtoAAsync',
7520
+ 'cuMemcpyHtoAAsync_v2', 'cuMemcpyHtoAAsync_v2_ptsz',
7521
+ 'cuMemcpyHtoA_v2', 'cuMemcpyHtoA_v2_ptds', 'cuMemcpyHtoD',
7522
+ 'cuMemcpyHtoDAsync', 'cuMemcpyHtoDAsync_v2',
7523
+ 'cuMemcpyHtoDAsync_v2_ptsz', 'cuMemcpyHtoD_v2',
7524
+ 'cuMemcpyHtoD_v2_ptds', 'cuMemcpyPeer', 'cuMemcpyPeerAsync',
7525
+ 'cuMemcpyPeerAsync_ptsz', 'cuMemcpyPeer_ptds', 'cuMemcpy_ptds',
7526
+ 'cuMemsetD16', 'cuMemsetD16Async', 'cuMemsetD16Async_ptsz',
7527
+ 'cuMemsetD16_v2', 'cuMemsetD16_v2_ptds', 'cuMemsetD2D16',
7528
+ 'cuMemsetD2D16Async', 'cuMemsetD2D16Async_ptsz',
7529
+ 'cuMemsetD2D16_v2', 'cuMemsetD2D16_v2_ptds', 'cuMemsetD2D32',
7530
+ 'cuMemsetD2D32Async', 'cuMemsetD2D32Async_ptsz',
7531
+ 'cuMemsetD2D32_v2', 'cuMemsetD2D32_v2_ptds', 'cuMemsetD2D8',
7532
+ 'cuMemsetD2D8Async', 'cuMemsetD2D8Async_ptsz', 'cuMemsetD2D8_v2',
7533
+ 'cuMemsetD2D8_v2_ptds', 'cuMemsetD32', 'cuMemsetD32Async',
7534
+ 'cuMemsetD32Async_ptsz', 'cuMemsetD32_v2', 'cuMemsetD32_v2_ptds',
7535
+ 'cuMemsetD8', 'cuMemsetD8Async', 'cuMemsetD8Async_ptsz',
7536
+ 'cuMemsetD8_v2', 'cuMemsetD8_v2_ptds', 'cuMipmappedArrayCreate',
5656
7537
  'cuMipmappedArrayDestroy', 'cuMipmappedArrayGetLevel',
7538
+ 'cuMipmappedArrayGetMemoryRequirements',
5657
7539
  'cuMipmappedArrayGetSparseProperties', 'cuModuleGetFunction',
5658
- 'cuModuleGetGlobal_v2', 'cuModuleGetSurfRef', 'cuModuleGetTexRef',
5659
- 'cuModuleLoad', 'cuModuleLoadData', 'cuModuleLoadDataEx',
5660
- 'cuModuleLoadFatBinary', 'cuModuleUnload',
7540
+ 'cuModuleGetGlobal', 'cuModuleGetGlobal_v2',
7541
+ 'cuModuleGetLoadingMode', 'cuModuleGetSurfRef',
7542
+ 'cuModuleGetTexRef', 'cuModuleLoad', 'cuModuleLoadData',
7543
+ 'cuModuleLoadDataEx', 'cuModuleLoadFatBinary', 'cuModuleUnload',
5661
7544
  'cuOccupancyAvailableDynamicSMemPerBlock',
5662
7545
  'cuOccupancyMaxActiveBlocksPerMultiprocessor',
5663
7546
  'cuOccupancyMaxActiveBlocksPerMultiprocessorWithFlags',
7547
+ 'cuOccupancyMaxActiveClusters',
5664
7548
  'cuOccupancyMaxPotentialBlockSize',
5665
- 'cuOccupancyMaxPotentialBlockSizeWithFlags', 'cuParamSetSize',
7549
+ 'cuOccupancyMaxPotentialBlockSizeWithFlags',
7550
+ 'cuOccupancyMaxPotentialClusterSize', 'cuParamSetSize',
5666
7551
  'cuParamSetTexRef', 'cuParamSetf', 'cuParamSeti', 'cuParamSetv',
5667
7552
  'cuPointerGetAttribute', 'cuPointerGetAttributes',
5668
7553
  'cuPointerSetAttribute', 'cuSignalExternalSemaphoresAsync',
5669
- 'cuStreamAddCallback', 'cuStreamAttachMemAsync',
5670
- 'cuStreamBatchMemOp', 'cuStreamBeginCapture_v2',
5671
- 'cuStreamCopyAttributes', 'cuStreamCreate',
5672
- 'cuStreamCreateWithPriority', 'cuStreamDestroy_v2',
5673
- 'cuStreamEndCapture', 'cuStreamGetAttribute',
5674
- 'cuStreamGetCaptureInfo', 'cuStreamGetCaptureInfo_v2',
5675
- 'cuStreamGetCtx', 'cuStreamGetFlags', 'cuStreamGetPriority',
5676
- 'cuStreamIsCapturing', 'cuStreamQuery', 'cuStreamSetAttribute',
5677
- 'cuStreamSynchronize', 'cuStreamUpdateCaptureDependencies',
5678
- 'cuStreamWaitEvent', 'cuStreamWaitValue32', 'cuStreamWaitValue64',
5679
- 'cuStreamWriteValue32', 'cuStreamWriteValue64',
5680
- 'cuSurfObjectCreate', 'cuSurfObjectDestroy',
5681
- 'cuSurfObjectGetResourceDesc', 'cuSurfRefGetArray',
5682
- 'cuSurfRefSetArray', 'cuTexObjectCreate', 'cuTexObjectDestroy',
5683
- 'cuTexObjectGetResourceDesc', 'cuTexObjectGetResourceViewDesc',
5684
- 'cuTexObjectGetTextureDesc', 'cuTexRefCreate', 'cuTexRefDestroy',
7554
+ 'cuSignalExternalSemaphoresAsync_ptsz', 'cuStreamAddCallback',
7555
+ 'cuStreamAddCallback_ptsz', 'cuStreamAttachMemAsync',
7556
+ 'cuStreamAttachMemAsync_ptsz', 'cuStreamBatchMemOp',
7557
+ 'cuStreamBatchMemOp_ptsz', 'cuStreamBatchMemOp_v2',
7558
+ 'cuStreamBatchMemOp_v2_ptsz', 'cuStreamBeginCapture',
7559
+ 'cuStreamBeginCapture_ptsz', 'cuStreamBeginCapture_v2',
7560
+ 'cuStreamBeginCapture_v2_ptsz', 'cuStreamCopyAttributes',
7561
+ 'cuStreamCopyAttributes_ptsz', 'cuStreamCreate',
7562
+ 'cuStreamCreateWithPriority', 'cuStreamDestroy',
7563
+ 'cuStreamDestroy_v2', 'cuStreamEndCapture',
7564
+ 'cuStreamEndCapture_ptsz', 'cuStreamGetAttribute',
7565
+ 'cuStreamGetAttribute_ptsz', 'cuStreamGetCaptureInfo',
7566
+ 'cuStreamGetCaptureInfo_ptsz', 'cuStreamGetCaptureInfo_v2',
7567
+ 'cuStreamGetCaptureInfo_v2_ptsz', 'cuStreamGetCtx',
7568
+ 'cuStreamGetCtx_ptsz', 'cuStreamGetFlags',
7569
+ 'cuStreamGetFlags_ptsz', 'cuStreamGetId', 'cuStreamGetId_ptsz',
7570
+ 'cuStreamGetPriority', 'cuStreamGetPriority_ptsz',
7571
+ 'cuStreamIsCapturing', 'cuStreamIsCapturing_ptsz',
7572
+ 'cuStreamQuery', 'cuStreamQuery_ptsz', 'cuStreamSetAttribute',
7573
+ 'cuStreamSetAttribute_ptsz', 'cuStreamSynchronize',
7574
+ 'cuStreamSynchronize_ptsz', 'cuStreamUpdateCaptureDependencies',
7575
+ 'cuStreamUpdateCaptureDependencies_ptsz', 'cuStreamWaitEvent',
7576
+ 'cuStreamWaitEvent_ptsz', 'cuStreamWaitValue32',
7577
+ 'cuStreamWaitValue32_ptsz', 'cuStreamWaitValue32_v2',
7578
+ 'cuStreamWaitValue32_v2_ptsz', 'cuStreamWaitValue64',
7579
+ 'cuStreamWaitValue64_ptsz', 'cuStreamWaitValue64_v2',
7580
+ 'cuStreamWaitValue64_v2_ptsz', 'cuStreamWriteValue32',
7581
+ 'cuStreamWriteValue32_ptsz', 'cuStreamWriteValue32_v2',
7582
+ 'cuStreamWriteValue32_v2_ptsz', 'cuStreamWriteValue64',
7583
+ 'cuStreamWriteValue64_ptsz', 'cuStreamWriteValue64_v2',
7584
+ 'cuStreamWriteValue64_v2_ptsz', 'cuSurfObjectCreate',
7585
+ 'cuSurfObjectDestroy', 'cuSurfObjectGetResourceDesc',
7586
+ 'cuSurfRefGetArray', 'cuSurfRefSetArray',
7587
+ 'cuTensorMapEncodeIm2col', 'cuTensorMapEncodeTiled',
7588
+ 'cuTensorMapReplaceAddress', 'cuTexObjectCreate',
7589
+ 'cuTexObjectDestroy', 'cuTexObjectGetResourceDesc',
7590
+ 'cuTexObjectGetResourceViewDesc', 'cuTexObjectGetTextureDesc',
7591
+ 'cuTexRefCreate', 'cuTexRefDestroy', 'cuTexRefGetAddress',
5685
7592
  'cuTexRefGetAddressMode', 'cuTexRefGetAddress_v2',
5686
7593
  'cuTexRefGetArray', 'cuTexRefGetBorderColor',
5687
7594
  'cuTexRefGetFilterMode', 'cuTexRefGetFlags', 'cuTexRefGetFormat',
5688
7595
  'cuTexRefGetMaxAnisotropy', 'cuTexRefGetMipmapFilterMode',
5689
7596
  'cuTexRefGetMipmapLevelBias', 'cuTexRefGetMipmapLevelClamp',
5690
- 'cuTexRefGetMipmappedArray', 'cuTexRefSetAddress2D_v3',
5691
- 'cuTexRefSetAddressMode', 'cuTexRefSetAddress_v2',
5692
- 'cuTexRefSetArray', 'cuTexRefSetBorderColor',
5693
- 'cuTexRefSetFilterMode', 'cuTexRefSetFlags', 'cuTexRefSetFormat',
7597
+ 'cuTexRefGetMipmappedArray', 'cuTexRefSetAddress',
7598
+ 'cuTexRefSetAddress2D', 'cuTexRefSetAddress2D_v2',
7599
+ 'cuTexRefSetAddress2D_v3', 'cuTexRefSetAddressMode',
7600
+ 'cuTexRefSetAddress_v2', 'cuTexRefSetArray',
7601
+ 'cuTexRefSetBorderColor', 'cuTexRefSetFilterMode',
7602
+ 'cuTexRefSetFlags', 'cuTexRefSetFormat',
5694
7603
  'cuTexRefSetMaxAnisotropy', 'cuTexRefSetMipmapFilterMode',
5695
7604
  'cuTexRefSetMipmapLevelBias', 'cuTexRefSetMipmapLevelClamp',
5696
7605
  'cuTexRefSetMipmappedArray', 'cuThreadExchangeStreamCaptureMode',
5697
7606
  'cuUserObjectCreate', 'cuUserObjectRelease', 'cuUserObjectRetain',
5698
- 'cuWaitExternalSemaphoresAsync', 'cudaError_enum', 'cuuint32_t',
5699
- 'cuuint64_t', 'size_t', 'struct_CUDA_ARRAY3D_DESCRIPTOR_st',
7607
+ 'cuWaitExternalSemaphoresAsync',
7608
+ 'cuWaitExternalSemaphoresAsync_ptsz', 'cudaError_enum',
7609
+ 'cuuint32_t', 'cuuint64_t', 'size_t',
7610
+ 'struct_CUDA_ARRAY3D_DESCRIPTOR_st',
7611
+ 'struct_CUDA_ARRAY3D_DESCRIPTOR_v1_st',
5700
7612
  'struct_CUDA_ARRAY_DESCRIPTOR_st',
7613
+ 'struct_CUDA_ARRAY_DESCRIPTOR_v1_st',
7614
+ 'struct_CUDA_ARRAY_MEMORY_REQUIREMENTS_st',
5701
7615
  'struct_CUDA_ARRAY_SPARSE_PROPERTIES_st',
5702
7616
  'struct_CUDA_ARRAY_SPARSE_PROPERTIES_st_tileExtent',
7617
+ 'struct_CUDA_BATCH_MEM_OP_NODE_PARAMS_st',
5703
7618
  'struct_CUDA_EXTERNAL_MEMORY_BUFFER_DESC_st',
5704
7619
  'struct_CUDA_EXTERNAL_MEMORY_HANDLE_DESC_st',
5705
7620
  'struct_CUDA_EXTERNAL_MEMORY_HANDLE_DESC_st_0_win32',
@@ -5716,10 +7631,13 @@ __all__ = \
5716
7631
  'struct_CUDA_EXTERNAL_SEMAPHORE_WAIT_PARAMS_st_params',
5717
7632
  'struct_CUDA_EXT_SEM_SIGNAL_NODE_PARAMS_st',
5718
7633
  'struct_CUDA_EXT_SEM_WAIT_NODE_PARAMS_st',
7634
+ 'struct_CUDA_GRAPH_INSTANTIATE_PARAMS_st',
5719
7635
  'struct_CUDA_HOST_NODE_PARAMS_st',
5720
7636
  'struct_CUDA_KERNEL_NODE_PARAMS_st',
7637
+ 'struct_CUDA_KERNEL_NODE_PARAMS_v2_st',
5721
7638
  'struct_CUDA_LAUNCH_PARAMS_st', 'struct_CUDA_MEMCPY2D_st',
5722
- 'struct_CUDA_MEMCPY3D_PEER_st', 'struct_CUDA_MEMCPY3D_st',
7639
+ 'struct_CUDA_MEMCPY2D_v1_st', 'struct_CUDA_MEMCPY3D_PEER_st',
7640
+ 'struct_CUDA_MEMCPY3D_st', 'struct_CUDA_MEMCPY3D_v1_st',
5723
7641
  'struct_CUDA_MEMSET_NODE_PARAMS_st',
5724
7642
  'struct_CUDA_MEM_ALLOC_NODE_PARAMS_st',
5725
7643
  'struct_CUDA_POINTER_ATTRIBUTE_P2P_TOKENS_st',
@@ -5737,9 +7655,15 @@ __all__ = \
5737
7655
  'struct_CUexecAffinityParam_st',
5738
7656
  'struct_CUexecAffinitySmCount_st', 'struct_CUextMemory_st',
5739
7657
  'struct_CUextSemaphore_st', 'struct_CUfunc_st',
5740
- 'struct_CUgraphExec_st', 'struct_CUgraphNode_st',
5741
- 'struct_CUgraph_st', 'struct_CUgraphicsResource_st',
5742
- 'struct_CUipcEventHandle_st', 'struct_CUipcMemHandle_st',
7658
+ 'struct_CUgraphExecUpdateResultInfo_st', 'struct_CUgraphExec_st',
7659
+ 'struct_CUgraphNode_st', 'struct_CUgraph_st',
7660
+ 'struct_CUgraphicsResource_st', 'struct_CUipcEventHandle_st',
7661
+ 'struct_CUipcMemHandle_st', 'struct_CUkern_st',
7662
+ 'struct_CUlaunchAttributeValue_union_clusterDim',
7663
+ 'struct_CUlaunchAttributeValue_union_programmaticEvent',
7664
+ 'struct_CUlaunchAttribute_st', 'struct_CUlaunchConfig_st',
7665
+ 'struct_CUlaunchMemSyncDomainMap_st', 'struct_CUlib_st',
7666
+ 'struct_CUlibraryHostUniversalFunctionAndDataTable_st',
5743
7667
  'struct_CUlinkState_st', 'struct_CUmemAccessDesc_st',
5744
7668
  'struct_CUmemAllocationProp_st',
5745
7669
  'struct_CUmemAllocationProp_st_allocFlags',
@@ -5747,10 +7671,12 @@ __all__ = \
5747
7671
  'struct_CUmemPoolProps_st', 'struct_CUmemPoolPtrExportData_st',
5748
7672
  'struct_CUmipmappedArray_st', 'struct_CUmod_st',
5749
7673
  'struct_CUstreamMemOpFlushRemoteWritesParams_st',
7674
+ 'struct_CUstreamMemOpMemoryBarrierParams_st',
5750
7675
  'struct_CUstreamMemOpWaitValueParams_st',
5751
7676
  'struct_CUstreamMemOpWriteValueParams_st', 'struct_CUstream_st',
5752
- 'struct_CUsurfref_st', 'struct_CUtexref_st',
5753
- 'struct_CUuserObject_st', 'struct_CUuuid_st',
7677
+ 'struct_CUsurfref_st', 'struct_CUtensorMap_st',
7678
+ 'struct_CUtexref_st', 'struct_CUuserObject_st',
7679
+ 'struct_CUuuid_st',
5754
7680
  'union_CUDA_EXTERNAL_MEMORY_HANDLE_DESC_st_handle',
5755
7681
  'union_CUDA_EXTERNAL_SEMAPHORE_HANDLE_DESC_st_handle',
5756
7682
  'union_CUDA_EXTERNAL_SEMAPHORE_SIGNAL_PARAMS_st_0_nvSciSync',
@@ -5760,8 +7686,7 @@ __all__ = \
5760
7686
  'union_CUarrayMapInfo_st_resource',
5761
7687
  'union_CUarrayMapInfo_st_subresource',
5762
7688
  'union_CUexecAffinityParam_st_param',
5763
- 'union_CUkernelNodeAttrValue_union',
5764
- 'union_CUstreamAttrValue_union',
7689
+ 'union_CUlaunchAttributeValue_union',
5765
7690
  'union_CUstreamBatchMemOpParams_union',
5766
7691
  'union_CUstreamMemOpWaitValueParams_st_0',
5767
7692
  'union_CUstreamMemOpWriteValueParams_st_0']