numba-cuda 0.21.1__cp313-cp313-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (488)
  1. _numba_cuda_redirector.pth +4 -0
  2. _numba_cuda_redirector.py +89 -0
  3. numba_cuda/VERSION +1 -0
  4. numba_cuda/__init__.py +6 -0
  5. numba_cuda/_version.py +11 -0
  6. numba_cuda/numba/cuda/__init__.py +70 -0
  7. numba_cuda/numba/cuda/_internal/cuda_bf16.py +16394 -0
  8. numba_cuda/numba/cuda/_internal/cuda_fp16.py +8112 -0
  9. numba_cuda/numba/cuda/api.py +577 -0
  10. numba_cuda/numba/cuda/api_util.py +76 -0
  11. numba_cuda/numba/cuda/args.py +72 -0
  12. numba_cuda/numba/cuda/bf16.py +397 -0
  13. numba_cuda/numba/cuda/cache_hints.py +287 -0
  14. numba_cuda/numba/cuda/cext/__init__.py +2 -0
  15. numba_cuda/numba/cuda/cext/_devicearray.cp313-win_amd64.pyd +0 -0
  16. numba_cuda/numba/cuda/cext/_devicearray.cpp +159 -0
  17. numba_cuda/numba/cuda/cext/_devicearray.h +29 -0
  18. numba_cuda/numba/cuda/cext/_dispatcher.cp313-win_amd64.pyd +0 -0
  19. numba_cuda/numba/cuda/cext/_dispatcher.cpp +1098 -0
  20. numba_cuda/numba/cuda/cext/_hashtable.cpp +532 -0
  21. numba_cuda/numba/cuda/cext/_hashtable.h +135 -0
  22. numba_cuda/numba/cuda/cext/_helperlib.c +71 -0
  23. numba_cuda/numba/cuda/cext/_helperlib.cp313-win_amd64.pyd +0 -0
  24. numba_cuda/numba/cuda/cext/_helpermod.c +82 -0
  25. numba_cuda/numba/cuda/cext/_pymodule.h +38 -0
  26. numba_cuda/numba/cuda/cext/_typeconv.cp313-win_amd64.pyd +0 -0
  27. numba_cuda/numba/cuda/cext/_typeconv.cpp +206 -0
  28. numba_cuda/numba/cuda/cext/_typeof.cpp +1159 -0
  29. numba_cuda/numba/cuda/cext/_typeof.h +19 -0
  30. numba_cuda/numba/cuda/cext/capsulethunk.h +111 -0
  31. numba_cuda/numba/cuda/cext/mviewbuf.c +385 -0
  32. numba_cuda/numba/cuda/cext/mviewbuf.cp313-win_amd64.pyd +0 -0
  33. numba_cuda/numba/cuda/cext/typeconv.cpp +212 -0
  34. numba_cuda/numba/cuda/cext/typeconv.hpp +101 -0
  35. numba_cuda/numba/cuda/cg.py +67 -0
  36. numba_cuda/numba/cuda/cgutils.py +1294 -0
  37. numba_cuda/numba/cuda/cloudpickle/__init__.py +21 -0
  38. numba_cuda/numba/cuda/cloudpickle/cloudpickle.py +1598 -0
  39. numba_cuda/numba/cuda/cloudpickle/cloudpickle_fast.py +17 -0
  40. numba_cuda/numba/cuda/codegen.py +541 -0
  41. numba_cuda/numba/cuda/compiler.py +1396 -0
  42. numba_cuda/numba/cuda/core/analysis.py +758 -0
  43. numba_cuda/numba/cuda/core/annotations/__init__.py +0 -0
  44. numba_cuda/numba/cuda/core/annotations/pretty_annotate.py +288 -0
  45. numba_cuda/numba/cuda/core/annotations/type_annotations.py +305 -0
  46. numba_cuda/numba/cuda/core/base.py +1332 -0
  47. numba_cuda/numba/cuda/core/boxing.py +1411 -0
  48. numba_cuda/numba/cuda/core/bytecode.py +728 -0
  49. numba_cuda/numba/cuda/core/byteflow.py +2346 -0
  50. numba_cuda/numba/cuda/core/caching.py +744 -0
  51. numba_cuda/numba/cuda/core/callconv.py +392 -0
  52. numba_cuda/numba/cuda/core/codegen.py +171 -0
  53. numba_cuda/numba/cuda/core/compiler.py +199 -0
  54. numba_cuda/numba/cuda/core/compiler_lock.py +85 -0
  55. numba_cuda/numba/cuda/core/compiler_machinery.py +497 -0
  56. numba_cuda/numba/cuda/core/config.py +650 -0
  57. numba_cuda/numba/cuda/core/consts.py +124 -0
  58. numba_cuda/numba/cuda/core/controlflow.py +989 -0
  59. numba_cuda/numba/cuda/core/entrypoints.py +57 -0
  60. numba_cuda/numba/cuda/core/environment.py +66 -0
  61. numba_cuda/numba/cuda/core/errors.py +917 -0
  62. numba_cuda/numba/cuda/core/event.py +511 -0
  63. numba_cuda/numba/cuda/core/funcdesc.py +330 -0
  64. numba_cuda/numba/cuda/core/generators.py +387 -0
  65. numba_cuda/numba/cuda/core/imputils.py +509 -0
  66. numba_cuda/numba/cuda/core/inline_closurecall.py +1787 -0
  67. numba_cuda/numba/cuda/core/interpreter.py +3617 -0
  68. numba_cuda/numba/cuda/core/ir.py +1812 -0
  69. numba_cuda/numba/cuda/core/ir_utils.py +2638 -0
  70. numba_cuda/numba/cuda/core/optional.py +129 -0
  71. numba_cuda/numba/cuda/core/options.py +262 -0
  72. numba_cuda/numba/cuda/core/postproc.py +249 -0
  73. numba_cuda/numba/cuda/core/pythonapi.py +1859 -0
  74. numba_cuda/numba/cuda/core/registry.py +46 -0
  75. numba_cuda/numba/cuda/core/removerefctpass.py +123 -0
  76. numba_cuda/numba/cuda/core/rewrites/__init__.py +26 -0
  77. numba_cuda/numba/cuda/core/rewrites/ir_print.py +91 -0
  78. numba_cuda/numba/cuda/core/rewrites/registry.py +104 -0
  79. numba_cuda/numba/cuda/core/rewrites/static_binop.py +41 -0
  80. numba_cuda/numba/cuda/core/rewrites/static_getitem.py +189 -0
  81. numba_cuda/numba/cuda/core/rewrites/static_raise.py +100 -0
  82. numba_cuda/numba/cuda/core/sigutils.py +68 -0
  83. numba_cuda/numba/cuda/core/ssa.py +498 -0
  84. numba_cuda/numba/cuda/core/targetconfig.py +330 -0
  85. numba_cuda/numba/cuda/core/tracing.py +231 -0
  86. numba_cuda/numba/cuda/core/transforms.py +956 -0
  87. numba_cuda/numba/cuda/core/typed_passes.py +867 -0
  88. numba_cuda/numba/cuda/core/typeinfer.py +1950 -0
  89. numba_cuda/numba/cuda/core/unsafe/__init__.py +0 -0
  90. numba_cuda/numba/cuda/core/unsafe/bytes.py +67 -0
  91. numba_cuda/numba/cuda/core/unsafe/eh.py +67 -0
  92. numba_cuda/numba/cuda/core/unsafe/refcount.py +98 -0
  93. numba_cuda/numba/cuda/core/untyped_passes.py +1979 -0
  94. numba_cuda/numba/cuda/cpython/builtins.py +1153 -0
  95. numba_cuda/numba/cuda/cpython/charseq.py +1218 -0
  96. numba_cuda/numba/cuda/cpython/cmathimpl.py +560 -0
  97. numba_cuda/numba/cuda/cpython/enumimpl.py +103 -0
  98. numba_cuda/numba/cuda/cpython/iterators.py +167 -0
  99. numba_cuda/numba/cuda/cpython/listobj.py +1326 -0
  100. numba_cuda/numba/cuda/cpython/mathimpl.py +499 -0
  101. numba_cuda/numba/cuda/cpython/numbers.py +1475 -0
  102. numba_cuda/numba/cuda/cpython/rangeobj.py +289 -0
  103. numba_cuda/numba/cuda/cpython/slicing.py +322 -0
  104. numba_cuda/numba/cuda/cpython/tupleobj.py +456 -0
  105. numba_cuda/numba/cuda/cpython/unicode.py +2865 -0
  106. numba_cuda/numba/cuda/cpython/unicode_support.py +1597 -0
  107. numba_cuda/numba/cuda/cpython/unsafe/__init__.py +0 -0
  108. numba_cuda/numba/cuda/cpython/unsafe/numbers.py +64 -0
  109. numba_cuda/numba/cuda/cpython/unsafe/tuple.py +92 -0
  110. numba_cuda/numba/cuda/cuda_paths.py +691 -0
  111. numba_cuda/numba/cuda/cudadecl.py +556 -0
  112. numba_cuda/numba/cuda/cudadrv/__init__.py +14 -0
  113. numba_cuda/numba/cuda/cudadrv/devicearray.py +951 -0
  114. numba_cuda/numba/cuda/cudadrv/devices.py +249 -0
  115. numba_cuda/numba/cuda/cudadrv/driver.py +3222 -0
  116. numba_cuda/numba/cuda/cudadrv/drvapi.py +435 -0
  117. numba_cuda/numba/cuda/cudadrv/dummyarray.py +558 -0
  118. numba_cuda/numba/cuda/cudadrv/enums.py +613 -0
  119. numba_cuda/numba/cuda/cudadrv/error.py +48 -0
  120. numba_cuda/numba/cuda/cudadrv/libs.py +220 -0
  121. numba_cuda/numba/cuda/cudadrv/linkable_code.py +184 -0
  122. numba_cuda/numba/cuda/cudadrv/mappings.py +14 -0
  123. numba_cuda/numba/cuda/cudadrv/ndarray.py +26 -0
  124. numba_cuda/numba/cuda/cudadrv/nvrtc.py +193 -0
  125. numba_cuda/numba/cuda/cudadrv/nvvm.py +756 -0
  126. numba_cuda/numba/cuda/cudadrv/rtapi.py +13 -0
  127. numba_cuda/numba/cuda/cudadrv/runtime.py +34 -0
  128. numba_cuda/numba/cuda/cudaimpl.py +995 -0
  129. numba_cuda/numba/cuda/cudamath.py +149 -0
  130. numba_cuda/numba/cuda/datamodel/__init__.py +7 -0
  131. numba_cuda/numba/cuda/datamodel/cuda_manager.py +66 -0
  132. numba_cuda/numba/cuda/datamodel/cuda_models.py +1446 -0
  133. numba_cuda/numba/cuda/datamodel/cuda_packer.py +224 -0
  134. numba_cuda/numba/cuda/datamodel/cuda_registry.py +22 -0
  135. numba_cuda/numba/cuda/datamodel/cuda_testing.py +153 -0
  136. numba_cuda/numba/cuda/datamodel/manager.py +11 -0
  137. numba_cuda/numba/cuda/datamodel/models.py +9 -0
  138. numba_cuda/numba/cuda/datamodel/packer.py +9 -0
  139. numba_cuda/numba/cuda/datamodel/registry.py +11 -0
  140. numba_cuda/numba/cuda/datamodel/testing.py +11 -0
  141. numba_cuda/numba/cuda/debuginfo.py +903 -0
  142. numba_cuda/numba/cuda/decorators.py +294 -0
  143. numba_cuda/numba/cuda/descriptor.py +35 -0
  144. numba_cuda/numba/cuda/device_init.py +158 -0
  145. numba_cuda/numba/cuda/deviceufunc.py +1021 -0
  146. numba_cuda/numba/cuda/dispatcher.py +2463 -0
  147. numba_cuda/numba/cuda/errors.py +72 -0
  148. numba_cuda/numba/cuda/extending.py +697 -0
  149. numba_cuda/numba/cuda/flags.py +178 -0
  150. numba_cuda/numba/cuda/fp16.py +357 -0
  151. numba_cuda/numba/cuda/include/12/cuda_bf16.h +5118 -0
  152. numba_cuda/numba/cuda/include/12/cuda_bf16.hpp +3865 -0
  153. numba_cuda/numba/cuda/include/12/cuda_fp16.h +5363 -0
  154. numba_cuda/numba/cuda/include/12/cuda_fp16.hpp +3483 -0
  155. numba_cuda/numba/cuda/include/13/cuda_bf16.h +5118 -0
  156. numba_cuda/numba/cuda/include/13/cuda_bf16.hpp +3865 -0
  157. numba_cuda/numba/cuda/include/13/cuda_fp16.h +5363 -0
  158. numba_cuda/numba/cuda/include/13/cuda_fp16.hpp +3483 -0
  159. numba_cuda/numba/cuda/initialize.py +24 -0
  160. numba_cuda/numba/cuda/intrinsic_wrapper.py +41 -0
  161. numba_cuda/numba/cuda/intrinsics.py +382 -0
  162. numba_cuda/numba/cuda/itanium_mangler.py +214 -0
  163. numba_cuda/numba/cuda/kernels/__init__.py +2 -0
  164. numba_cuda/numba/cuda/kernels/reduction.py +265 -0
  165. numba_cuda/numba/cuda/kernels/transpose.py +65 -0
  166. numba_cuda/numba/cuda/libdevice.py +3386 -0
  167. numba_cuda/numba/cuda/libdevicedecl.py +20 -0
  168. numba_cuda/numba/cuda/libdevicefuncs.py +1060 -0
  169. numba_cuda/numba/cuda/libdeviceimpl.py +88 -0
  170. numba_cuda/numba/cuda/locks.py +19 -0
  171. numba_cuda/numba/cuda/lowering.py +1951 -0
  172. numba_cuda/numba/cuda/mathimpl.py +374 -0
  173. numba_cuda/numba/cuda/memory_management/__init__.py +4 -0
  174. numba_cuda/numba/cuda/memory_management/memsys.cu +99 -0
  175. numba_cuda/numba/cuda/memory_management/memsys.cuh +22 -0
  176. numba_cuda/numba/cuda/memory_management/nrt.cu +212 -0
  177. numba_cuda/numba/cuda/memory_management/nrt.cuh +48 -0
  178. numba_cuda/numba/cuda/memory_management/nrt.py +390 -0
  179. numba_cuda/numba/cuda/memory_management/nrt_context.py +438 -0
  180. numba_cuda/numba/cuda/misc/appdirs.py +594 -0
  181. numba_cuda/numba/cuda/misc/cffiimpl.py +24 -0
  182. numba_cuda/numba/cuda/misc/coverage_support.py +43 -0
  183. numba_cuda/numba/cuda/misc/dump_style.py +41 -0
  184. numba_cuda/numba/cuda/misc/findlib.py +75 -0
  185. numba_cuda/numba/cuda/misc/firstlinefinder.py +96 -0
  186. numba_cuda/numba/cuda/misc/gdb_hook.py +240 -0
  187. numba_cuda/numba/cuda/misc/literal.py +28 -0
  188. numba_cuda/numba/cuda/misc/llvm_pass_timings.py +412 -0
  189. numba_cuda/numba/cuda/misc/special.py +94 -0
  190. numba_cuda/numba/cuda/models.py +56 -0
  191. numba_cuda/numba/cuda/np/arraymath.py +5130 -0
  192. numba_cuda/numba/cuda/np/arrayobj.py +7635 -0
  193. numba_cuda/numba/cuda/np/extensions.py +11 -0
  194. numba_cuda/numba/cuda/np/linalg.py +3087 -0
  195. numba_cuda/numba/cuda/np/math/__init__.py +0 -0
  196. numba_cuda/numba/cuda/np/math/cmathimpl.py +558 -0
  197. numba_cuda/numba/cuda/np/math/mathimpl.py +487 -0
  198. numba_cuda/numba/cuda/np/math/numbers.py +1461 -0
  199. numba_cuda/numba/cuda/np/npdatetime.py +969 -0
  200. numba_cuda/numba/cuda/np/npdatetime_helpers.py +217 -0
  201. numba_cuda/numba/cuda/np/npyfuncs.py +1808 -0
  202. numba_cuda/numba/cuda/np/npyimpl.py +1027 -0
  203. numba_cuda/numba/cuda/np/numpy_support.py +798 -0
  204. numba_cuda/numba/cuda/np/polynomial/__init__.py +4 -0
  205. numba_cuda/numba/cuda/np/polynomial/polynomial_core.py +242 -0
  206. numba_cuda/numba/cuda/np/polynomial/polynomial_functions.py +380 -0
  207. numba_cuda/numba/cuda/np/ufunc/__init__.py +4 -0
  208. numba_cuda/numba/cuda/np/ufunc/decorators.py +203 -0
  209. numba_cuda/numba/cuda/np/ufunc/sigparse.py +68 -0
  210. numba_cuda/numba/cuda/np/ufunc/ufuncbuilder.py +65 -0
  211. numba_cuda/numba/cuda/np/ufunc_db.py +1282 -0
  212. numba_cuda/numba/cuda/np/unsafe/__init__.py +0 -0
  213. numba_cuda/numba/cuda/np/unsafe/ndarray.py +84 -0
  214. numba_cuda/numba/cuda/nvvmutils.py +254 -0
  215. numba_cuda/numba/cuda/printimpl.py +126 -0
  216. numba_cuda/numba/cuda/random.py +308 -0
  217. numba_cuda/numba/cuda/reshape_funcs.cu +156 -0
  218. numba_cuda/numba/cuda/serialize.py +267 -0
  219. numba_cuda/numba/cuda/simulator/__init__.py +63 -0
  220. numba_cuda/numba/cuda/simulator/_internal/__init__.py +4 -0
  221. numba_cuda/numba/cuda/simulator/_internal/cuda_bf16.py +2 -0
  222. numba_cuda/numba/cuda/simulator/api.py +179 -0
  223. numba_cuda/numba/cuda/simulator/bf16.py +4 -0
  224. numba_cuda/numba/cuda/simulator/compiler.py +38 -0
  225. numba_cuda/numba/cuda/simulator/cudadrv/__init__.py +11 -0
  226. numba_cuda/numba/cuda/simulator/cudadrv/devicearray.py +462 -0
  227. numba_cuda/numba/cuda/simulator/cudadrv/devices.py +122 -0
  228. numba_cuda/numba/cuda/simulator/cudadrv/driver.py +66 -0
  229. numba_cuda/numba/cuda/simulator/cudadrv/drvapi.py +7 -0
  230. numba_cuda/numba/cuda/simulator/cudadrv/dummyarray.py +7 -0
  231. numba_cuda/numba/cuda/simulator/cudadrv/error.py +10 -0
  232. numba_cuda/numba/cuda/simulator/cudadrv/libs.py +10 -0
  233. numba_cuda/numba/cuda/simulator/cudadrv/linkable_code.py +61 -0
  234. numba_cuda/numba/cuda/simulator/cudadrv/nvrtc.py +11 -0
  235. numba_cuda/numba/cuda/simulator/cudadrv/nvvm.py +32 -0
  236. numba_cuda/numba/cuda/simulator/cudadrv/runtime.py +22 -0
  237. numba_cuda/numba/cuda/simulator/dispatcher.py +11 -0
  238. numba_cuda/numba/cuda/simulator/kernel.py +320 -0
  239. numba_cuda/numba/cuda/simulator/kernelapi.py +509 -0
  240. numba_cuda/numba/cuda/simulator/memory_management/__init__.py +4 -0
  241. numba_cuda/numba/cuda/simulator/memory_management/nrt.py +21 -0
  242. numba_cuda/numba/cuda/simulator/reduction.py +19 -0
  243. numba_cuda/numba/cuda/simulator/tests/support.py +4 -0
  244. numba_cuda/numba/cuda/simulator/vector_types.py +65 -0
  245. numba_cuda/numba/cuda/simulator_init.py +18 -0
  246. numba_cuda/numba/cuda/stubs.py +635 -0
  247. numba_cuda/numba/cuda/target.py +505 -0
  248. numba_cuda/numba/cuda/testing.py +347 -0
  249. numba_cuda/numba/cuda/tests/__init__.py +62 -0
  250. numba_cuda/numba/cuda/tests/benchmarks/__init__.py +0 -0
  251. numba_cuda/numba/cuda/tests/benchmarks/test_kernel_launch.py +119 -0
  252. numba_cuda/numba/cuda/tests/cloudpickle_main_class.py +9 -0
  253. numba_cuda/numba/cuda/tests/core/serialize_usecases.py +113 -0
  254. numba_cuda/numba/cuda/tests/core/test_itanium_mangler.py +83 -0
  255. numba_cuda/numba/cuda/tests/core/test_serialize.py +371 -0
  256. numba_cuda/numba/cuda/tests/cudadrv/__init__.py +9 -0
  257. numba_cuda/numba/cuda/tests/cudadrv/test_array_attr.py +147 -0
  258. numba_cuda/numba/cuda/tests/cudadrv/test_context_stack.py +161 -0
  259. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_array_slicing.py +397 -0
  260. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_auto_context.py +24 -0
  261. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_devicerecord.py +180 -0
  262. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_driver.py +313 -0
  263. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_memory.py +187 -0
  264. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_ndarray.py +621 -0
  265. numba_cuda/numba/cuda/tests/cudadrv/test_deallocations.py +247 -0
  266. numba_cuda/numba/cuda/tests/cudadrv/test_detect.py +100 -0
  267. numba_cuda/numba/cuda/tests/cudadrv/test_emm_plugins.py +198 -0
  268. numba_cuda/numba/cuda/tests/cudadrv/test_events.py +53 -0
  269. numba_cuda/numba/cuda/tests/cudadrv/test_host_alloc.py +72 -0
  270. numba_cuda/numba/cuda/tests/cudadrv/test_init.py +138 -0
  271. numba_cuda/numba/cuda/tests/cudadrv/test_inline_ptx.py +43 -0
  272. numba_cuda/numba/cuda/tests/cudadrv/test_is_fp16.py +15 -0
  273. numba_cuda/numba/cuda/tests/cudadrv/test_linkable_code.py +58 -0
  274. numba_cuda/numba/cuda/tests/cudadrv/test_linker.py +348 -0
  275. numba_cuda/numba/cuda/tests/cudadrv/test_managed_alloc.py +128 -0
  276. numba_cuda/numba/cuda/tests/cudadrv/test_module_callbacks.py +301 -0
  277. numba_cuda/numba/cuda/tests/cudadrv/test_nvjitlink.py +174 -0
  278. numba_cuda/numba/cuda/tests/cudadrv/test_nvrtc.py +28 -0
  279. numba_cuda/numba/cuda/tests/cudadrv/test_nvvm_driver.py +185 -0
  280. numba_cuda/numba/cuda/tests/cudadrv/test_pinned.py +39 -0
  281. numba_cuda/numba/cuda/tests/cudadrv/test_profiler.py +23 -0
  282. numba_cuda/numba/cuda/tests/cudadrv/test_reset_device.py +38 -0
  283. numba_cuda/numba/cuda/tests/cudadrv/test_runtime.py +48 -0
  284. numba_cuda/numba/cuda/tests/cudadrv/test_select_device.py +44 -0
  285. numba_cuda/numba/cuda/tests/cudadrv/test_streams.py +127 -0
  286. numba_cuda/numba/cuda/tests/cudapy/__init__.py +9 -0
  287. numba_cuda/numba/cuda/tests/cudapy/cache_usecases.py +231 -0
  288. numba_cuda/numba/cuda/tests/cudapy/cache_with_cpu_usecases.py +50 -0
  289. numba_cuda/numba/cuda/tests/cudapy/cg_cache_usecases.py +36 -0
  290. numba_cuda/numba/cuda/tests/cudapy/complex_usecases.py +116 -0
  291. numba_cuda/numba/cuda/tests/cudapy/enum_usecases.py +59 -0
  292. numba_cuda/numba/cuda/tests/cudapy/extensions_usecases.py +62 -0
  293. numba_cuda/numba/cuda/tests/cudapy/jitlink.ptx +28 -0
  294. numba_cuda/numba/cuda/tests/cudapy/overload_usecases.py +33 -0
  295. numba_cuda/numba/cuda/tests/cudapy/recursion_usecases.py +104 -0
  296. numba_cuda/numba/cuda/tests/cudapy/test_alignment.py +47 -0
  297. numba_cuda/numba/cuda/tests/cudapy/test_analysis.py +1122 -0
  298. numba_cuda/numba/cuda/tests/cudapy/test_array.py +344 -0
  299. numba_cuda/numba/cuda/tests/cudapy/test_array_alignment.py +268 -0
  300. numba_cuda/numba/cuda/tests/cudapy/test_array_args.py +203 -0
  301. numba_cuda/numba/cuda/tests/cudapy/test_array_methods.py +63 -0
  302. numba_cuda/numba/cuda/tests/cudapy/test_array_reductions.py +360 -0
  303. numba_cuda/numba/cuda/tests/cudapy/test_atomics.py +1815 -0
  304. numba_cuda/numba/cuda/tests/cudapy/test_bfloat16.py +599 -0
  305. numba_cuda/numba/cuda/tests/cudapy/test_bfloat16_bindings.py +377 -0
  306. numba_cuda/numba/cuda/tests/cudapy/test_blackscholes.py +160 -0
  307. numba_cuda/numba/cuda/tests/cudapy/test_boolean.py +27 -0
  308. numba_cuda/numba/cuda/tests/cudapy/test_byteflow.py +98 -0
  309. numba_cuda/numba/cuda/tests/cudapy/test_cache_hints.py +210 -0
  310. numba_cuda/numba/cuda/tests/cudapy/test_caching.py +683 -0
  311. numba_cuda/numba/cuda/tests/cudapy/test_casting.py +265 -0
  312. numba_cuda/numba/cuda/tests/cudapy/test_cffi.py +42 -0
  313. numba_cuda/numba/cuda/tests/cudapy/test_compiler.py +718 -0
  314. numba_cuda/numba/cuda/tests/cudapy/test_complex.py +370 -0
  315. numba_cuda/numba/cuda/tests/cudapy/test_complex_kernel.py +23 -0
  316. numba_cuda/numba/cuda/tests/cudapy/test_const_string.py +142 -0
  317. numba_cuda/numba/cuda/tests/cudapy/test_constmem.py +178 -0
  318. numba_cuda/numba/cuda/tests/cudapy/test_cooperative_groups.py +193 -0
  319. numba_cuda/numba/cuda/tests/cudapy/test_copy_propagate.py +131 -0
  320. numba_cuda/numba/cuda/tests/cudapy/test_cuda_array_interface.py +438 -0
  321. numba_cuda/numba/cuda/tests/cudapy/test_cuda_jit_no_types.py +94 -0
  322. numba_cuda/numba/cuda/tests/cudapy/test_datetime.py +101 -0
  323. numba_cuda/numba/cuda/tests/cudapy/test_debug.py +105 -0
  324. numba_cuda/numba/cuda/tests/cudapy/test_debuginfo.py +889 -0
  325. numba_cuda/numba/cuda/tests/cudapy/test_debuginfo_types.py +476 -0
  326. numba_cuda/numba/cuda/tests/cudapy/test_device_func.py +500 -0
  327. numba_cuda/numba/cuda/tests/cudapy/test_dispatcher.py +820 -0
  328. numba_cuda/numba/cuda/tests/cudapy/test_enums.py +152 -0
  329. numba_cuda/numba/cuda/tests/cudapy/test_errors.py +111 -0
  330. numba_cuda/numba/cuda/tests/cudapy/test_exception.py +170 -0
  331. numba_cuda/numba/cuda/tests/cudapy/test_extending.py +1088 -0
  332. numba_cuda/numba/cuda/tests/cudapy/test_extending_types.py +71 -0
  333. numba_cuda/numba/cuda/tests/cudapy/test_fastmath.py +265 -0
  334. numba_cuda/numba/cuda/tests/cudapy/test_flow_control.py +1433 -0
  335. numba_cuda/numba/cuda/tests/cudapy/test_forall.py +57 -0
  336. numba_cuda/numba/cuda/tests/cudapy/test_freevar.py +34 -0
  337. numba_cuda/numba/cuda/tests/cudapy/test_frexp_ldexp.py +69 -0
  338. numba_cuda/numba/cuda/tests/cudapy/test_globals.py +62 -0
  339. numba_cuda/numba/cuda/tests/cudapy/test_gufunc.py +474 -0
  340. numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scalar.py +167 -0
  341. numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scheduling.py +92 -0
  342. numba_cuda/numba/cuda/tests/cudapy/test_idiv.py +39 -0
  343. numba_cuda/numba/cuda/tests/cudapy/test_inline.py +170 -0
  344. numba_cuda/numba/cuda/tests/cudapy/test_inspect.py +255 -0
  345. numba_cuda/numba/cuda/tests/cudapy/test_intrinsics.py +1219 -0
  346. numba_cuda/numba/cuda/tests/cudapy/test_ipc.py +263 -0
  347. numba_cuda/numba/cuda/tests/cudapy/test_ir.py +598 -0
  348. numba_cuda/numba/cuda/tests/cudapy/test_ir_utils.py +276 -0
  349. numba_cuda/numba/cuda/tests/cudapy/test_iterators.py +101 -0
  350. numba_cuda/numba/cuda/tests/cudapy/test_lang.py +68 -0
  351. numba_cuda/numba/cuda/tests/cudapy/test_laplace.py +123 -0
  352. numba_cuda/numba/cuda/tests/cudapy/test_libdevice.py +194 -0
  353. numba_cuda/numba/cuda/tests/cudapy/test_lineinfo.py +220 -0
  354. numba_cuda/numba/cuda/tests/cudapy/test_localmem.py +173 -0
  355. numba_cuda/numba/cuda/tests/cudapy/test_make_function_to_jit_function.py +364 -0
  356. numba_cuda/numba/cuda/tests/cudapy/test_mandel.py +47 -0
  357. numba_cuda/numba/cuda/tests/cudapy/test_math.py +842 -0
  358. numba_cuda/numba/cuda/tests/cudapy/test_matmul.py +76 -0
  359. numba_cuda/numba/cuda/tests/cudapy/test_minmax.py +78 -0
  360. numba_cuda/numba/cuda/tests/cudapy/test_montecarlo.py +25 -0
  361. numba_cuda/numba/cuda/tests/cudapy/test_multigpu.py +145 -0
  362. numba_cuda/numba/cuda/tests/cudapy/test_multiprocessing.py +39 -0
  363. numba_cuda/numba/cuda/tests/cudapy/test_multithreads.py +82 -0
  364. numba_cuda/numba/cuda/tests/cudapy/test_nondet.py +53 -0
  365. numba_cuda/numba/cuda/tests/cudapy/test_operator.py +504 -0
  366. numba_cuda/numba/cuda/tests/cudapy/test_optimization.py +93 -0
  367. numba_cuda/numba/cuda/tests/cudapy/test_overload.py +402 -0
  368. numba_cuda/numba/cuda/tests/cudapy/test_powi.py +128 -0
  369. numba_cuda/numba/cuda/tests/cudapy/test_print.py +193 -0
  370. numba_cuda/numba/cuda/tests/cudapy/test_py2_div_issue.py +37 -0
  371. numba_cuda/numba/cuda/tests/cudapy/test_random.py +117 -0
  372. numba_cuda/numba/cuda/tests/cudapy/test_record_dtype.py +614 -0
  373. numba_cuda/numba/cuda/tests/cudapy/test_recursion.py +130 -0
  374. numba_cuda/numba/cuda/tests/cudapy/test_reduction.py +94 -0
  375. numba_cuda/numba/cuda/tests/cudapy/test_retrieve_autoconverted_arrays.py +83 -0
  376. numba_cuda/numba/cuda/tests/cudapy/test_serialize.py +86 -0
  377. numba_cuda/numba/cuda/tests/cudapy/test_slicing.py +40 -0
  378. numba_cuda/numba/cuda/tests/cudapy/test_sm.py +457 -0
  379. numba_cuda/numba/cuda/tests/cudapy/test_sm_creation.py +233 -0
  380. numba_cuda/numba/cuda/tests/cudapy/test_ssa.py +454 -0
  381. numba_cuda/numba/cuda/tests/cudapy/test_stream_api.py +56 -0
  382. numba_cuda/numba/cuda/tests/cudapy/test_sync.py +277 -0
  383. numba_cuda/numba/cuda/tests/cudapy/test_tracing.py +200 -0
  384. numba_cuda/numba/cuda/tests/cudapy/test_transpose.py +90 -0
  385. numba_cuda/numba/cuda/tests/cudapy/test_typeconv.py +333 -0
  386. numba_cuda/numba/cuda/tests/cudapy/test_typeinfer.py +538 -0
  387. numba_cuda/numba/cuda/tests/cudapy/test_ufuncs.py +585 -0
  388. numba_cuda/numba/cuda/tests/cudapy/test_userexc.py +42 -0
  389. numba_cuda/numba/cuda/tests/cudapy/test_vector_type.py +485 -0
  390. numba_cuda/numba/cuda/tests/cudapy/test_vectorize.py +312 -0
  391. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_complex.py +23 -0
  392. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_decor.py +183 -0
  393. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_device.py +40 -0
  394. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_scalar_arg.py +40 -0
  395. numba_cuda/numba/cuda/tests/cudapy/test_warning.py +206 -0
  396. numba_cuda/numba/cuda/tests/cudapy/test_warp_ops.py +331 -0
  397. numba_cuda/numba/cuda/tests/cudasim/__init__.py +9 -0
  398. numba_cuda/numba/cuda/tests/cudasim/support.py +9 -0
  399. numba_cuda/numba/cuda/tests/cudasim/test_cudasim_issues.py +111 -0
  400. numba_cuda/numba/cuda/tests/data/__init__.py +2 -0
  401. numba_cuda/numba/cuda/tests/data/cta_barrier.cu +28 -0
  402. numba_cuda/numba/cuda/tests/data/cuda_include.cu +10 -0
  403. numba_cuda/numba/cuda/tests/data/error.cu +12 -0
  404. numba_cuda/numba/cuda/tests/data/include/add.cuh +8 -0
  405. numba_cuda/numba/cuda/tests/data/jitlink.cu +28 -0
  406. numba_cuda/numba/cuda/tests/data/jitlink.ptx +49 -0
  407. numba_cuda/numba/cuda/tests/data/warn.cu +12 -0
  408. numba_cuda/numba/cuda/tests/doc_examples/__init__.py +9 -0
  409. numba_cuda/numba/cuda/tests/doc_examples/ffi/__init__.py +2 -0
  410. numba_cuda/numba/cuda/tests/doc_examples/ffi/functions.cu +54 -0
  411. numba_cuda/numba/cuda/tests/doc_examples/ffi/include/mul.cuh +8 -0
  412. numba_cuda/numba/cuda/tests/doc_examples/ffi/saxpy.cu +14 -0
  413. numba_cuda/numba/cuda/tests/doc_examples/test_cg.py +86 -0
  414. numba_cuda/numba/cuda/tests/doc_examples/test_cpointer.py +68 -0
  415. numba_cuda/numba/cuda/tests/doc_examples/test_cpu_gpu_compat.py +81 -0
  416. numba_cuda/numba/cuda/tests/doc_examples/test_ffi.py +141 -0
  417. numba_cuda/numba/cuda/tests/doc_examples/test_laplace.py +160 -0
  418. numba_cuda/numba/cuda/tests/doc_examples/test_matmul.py +180 -0
  419. numba_cuda/numba/cuda/tests/doc_examples/test_montecarlo.py +119 -0
  420. numba_cuda/numba/cuda/tests/doc_examples/test_random.py +66 -0
  421. numba_cuda/numba/cuda/tests/doc_examples/test_reduction.py +80 -0
  422. numba_cuda/numba/cuda/tests/doc_examples/test_sessionize.py +206 -0
  423. numba_cuda/numba/cuda/tests/doc_examples/test_ufunc.py +53 -0
  424. numba_cuda/numba/cuda/tests/doc_examples/test_vecadd.py +76 -0
  425. numba_cuda/numba/cuda/tests/nocuda/__init__.py +9 -0
  426. numba_cuda/numba/cuda/tests/nocuda/test_dummyarray.py +391 -0
  427. numba_cuda/numba/cuda/tests/nocuda/test_function_resolution.py +48 -0
  428. numba_cuda/numba/cuda/tests/nocuda/test_import.py +63 -0
  429. numba_cuda/numba/cuda/tests/nocuda/test_library_lookup.py +252 -0
  430. numba_cuda/numba/cuda/tests/nocuda/test_nvvm.py +59 -0
  431. numba_cuda/numba/cuda/tests/nrt/__init__.py +9 -0
  432. numba_cuda/numba/cuda/tests/nrt/test_nrt.py +387 -0
  433. numba_cuda/numba/cuda/tests/nrt/test_nrt_refct.py +124 -0
  434. numba_cuda/numba/cuda/tests/support.py +900 -0
  435. numba_cuda/numba/cuda/typeconv/__init__.py +4 -0
  436. numba_cuda/numba/cuda/typeconv/castgraph.py +137 -0
  437. numba_cuda/numba/cuda/typeconv/rules.py +63 -0
  438. numba_cuda/numba/cuda/typeconv/typeconv.py +121 -0
  439. numba_cuda/numba/cuda/types/__init__.py +233 -0
  440. numba_cuda/numba/cuda/types/__init__.pyi +167 -0
  441. numba_cuda/numba/cuda/types/abstract.py +9 -0
  442. numba_cuda/numba/cuda/types/common.py +9 -0
  443. numba_cuda/numba/cuda/types/containers.py +9 -0
  444. numba_cuda/numba/cuda/types/cuda_abstract.py +533 -0
  445. numba_cuda/numba/cuda/types/cuda_common.py +110 -0
  446. numba_cuda/numba/cuda/types/cuda_containers.py +971 -0
  447. numba_cuda/numba/cuda/types/cuda_function_type.py +230 -0
  448. numba_cuda/numba/cuda/types/cuda_functions.py +798 -0
  449. numba_cuda/numba/cuda/types/cuda_iterators.py +120 -0
  450. numba_cuda/numba/cuda/types/cuda_misc.py +569 -0
  451. numba_cuda/numba/cuda/types/cuda_npytypes.py +690 -0
  452. numba_cuda/numba/cuda/types/cuda_scalars.py +280 -0
  453. numba_cuda/numba/cuda/types/ext_types.py +101 -0
  454. numba_cuda/numba/cuda/types/function_type.py +11 -0
  455. numba_cuda/numba/cuda/types/functions.py +9 -0
  456. numba_cuda/numba/cuda/types/iterators.py +9 -0
  457. numba_cuda/numba/cuda/types/misc.py +9 -0
  458. numba_cuda/numba/cuda/types/npytypes.py +9 -0
  459. numba_cuda/numba/cuda/types/scalars.py +9 -0
  460. numba_cuda/numba/cuda/typing/__init__.py +19 -0
  461. numba_cuda/numba/cuda/typing/arraydecl.py +939 -0
  462. numba_cuda/numba/cuda/typing/asnumbatype.py +130 -0
  463. numba_cuda/numba/cuda/typing/bufproto.py +70 -0
  464. numba_cuda/numba/cuda/typing/builtins.py +1209 -0
  465. numba_cuda/numba/cuda/typing/cffi_utils.py +219 -0
  466. numba_cuda/numba/cuda/typing/cmathdecl.py +47 -0
  467. numba_cuda/numba/cuda/typing/collections.py +138 -0
  468. numba_cuda/numba/cuda/typing/context.py +782 -0
  469. numba_cuda/numba/cuda/typing/ctypes_utils.py +125 -0
  470. numba_cuda/numba/cuda/typing/dictdecl.py +63 -0
  471. numba_cuda/numba/cuda/typing/enumdecl.py +74 -0
  472. numba_cuda/numba/cuda/typing/listdecl.py +147 -0
  473. numba_cuda/numba/cuda/typing/mathdecl.py +158 -0
  474. numba_cuda/numba/cuda/typing/npdatetime.py +322 -0
  475. numba_cuda/numba/cuda/typing/npydecl.py +749 -0
  476. numba_cuda/numba/cuda/typing/setdecl.py +115 -0
  477. numba_cuda/numba/cuda/typing/templates.py +1446 -0
  478. numba_cuda/numba/cuda/typing/typeof.py +301 -0
  479. numba_cuda/numba/cuda/ufuncs.py +746 -0
  480. numba_cuda/numba/cuda/utils.py +724 -0
  481. numba_cuda/numba/cuda/vector_types.py +214 -0
  482. numba_cuda/numba/cuda/vectorizers.py +260 -0
  483. numba_cuda-0.21.1.dist-info/METADATA +109 -0
  484. numba_cuda-0.21.1.dist-info/RECORD +488 -0
  485. numba_cuda-0.21.1.dist-info/WHEEL +5 -0
  486. numba_cuda-0.21.1.dist-info/licenses/LICENSE +26 -0
  487. numba_cuda-0.21.1.dist-info/licenses/LICENSE.numba +24 -0
  488. numba_cuda-0.21.1.dist-info/top_level.txt +1 -0
@@ -0,0 +1,613 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: BSD-2-Clause
3
+
4
+ """
5
+ Enum values for CUDA driver. Information about the values
6
+ can be found on the official NVIDIA documentation website.
7
+ ref: https://docs.nvidia.com/cuda/cuda-driver-api/group__CUDA__TYPES.html
8
+ anchor: #group__CUDA__TYPES
9
+ """
10
+
11
+
12
+ # Error codes
13
+
14
+ CUDA_SUCCESS = 0
15
+ CUDA_ERROR_INVALID_VALUE = 1
16
+ CUDA_ERROR_OUT_OF_MEMORY = 2
17
+ CUDA_ERROR_NOT_INITIALIZED = 3
18
+ CUDA_ERROR_DEINITIALIZED = 4
19
+ CUDA_ERROR_PROFILER_DISABLED = 5
20
+ CUDA_ERROR_PROFILER_NOT_INITIALIZED = 6
21
+ CUDA_ERROR_PROFILER_ALREADY_STARTED = 7
22
+ CUDA_ERROR_PROFILER_ALREADY_STOPPED = 8
23
+ CUDA_ERROR_STUB_LIBRARY = 34
24
+ CUDA_ERROR_DEVICE_UNAVAILABLE = 46
25
+ CUDA_ERROR_NO_DEVICE = 100
26
+ CUDA_ERROR_INVALID_DEVICE = 101
27
+ CUDA_ERROR_DEVICE_NOT_LICENSED = 102
28
+ CUDA_ERROR_INVALID_IMAGE = 200
29
+ CUDA_ERROR_INVALID_CONTEXT = 201
30
+ CUDA_ERROR_CONTEXT_ALREADY_CURRENT = 202
31
+ CUDA_ERROR_MAP_FAILED = 205
32
+ CUDA_ERROR_UNMAP_FAILED = 206
33
+ CUDA_ERROR_ARRAY_IS_MAPPED = 207
34
+ CUDA_ERROR_ALREADY_MAPPED = 208
35
+ CUDA_ERROR_NO_BINARY_FOR_GPU = 209
36
+ CUDA_ERROR_ALREADY_ACQUIRED = 210
37
+ CUDA_ERROR_NOT_MAPPED = 211
38
+ CUDA_ERROR_NOT_MAPPED_AS_ARRAY = 212
39
+ CUDA_ERROR_NOT_MAPPED_AS_POINTER = 213
40
+ CUDA_ERROR_ECC_UNCORRECTABLE = 214
41
+ CUDA_ERROR_UNSUPPORTED_LIMIT = 215
42
+ CUDA_ERROR_CONTEXT_ALREADY_IN_USE = 216
43
+ CUDA_ERROR_PEER_ACCESS_UNSUPPORTED = 217
44
+ CUDA_ERROR_INVALID_PTX = 218
45
+ CUDA_ERROR_INVALID_GRAPHICS_CONTEXT = 219
46
+ CUDA_ERROR_NVLINK_UNCORRECTABLE = 220
47
+ CUDA_ERROR_JIT_COMPILER_NOT_FOUND = 221
48
+ CUDA_ERROR_UNSUPPORTED_PTX_VERSION = 222
49
+ CUDA_ERROR_JIT_COMPILATION_DISABLED = 223
50
+ CUDA_ERROR_UNSUPPORTED_EXEC_AFFINITY = 224
51
+ CUDA_ERROR_UNSUPPORTED_DEVSIDE_SYNC = 225
52
+ CUDA_ERROR_INVALID_SOURCE = 300
53
+ CUDA_ERROR_FILE_NOT_FOUND = 301
54
+ CUDA_ERROR_SHARED_OBJECT_SYMBOL_NOT_FOUND = 302
55
+ CUDA_ERROR_SHARED_OBJECT_INIT_FAILED = 303
56
+ CUDA_ERROR_OPERATING_SYSTEM = 304
57
+ CUDA_ERROR_INVALID_HANDLE = 400
58
+ CUDA_ERROR_ILLEGAL_STATE = 401
59
+ CUDA_ERROR_NOT_FOUND = 500
60
+ CUDA_ERROR_NOT_READY = 600
61
+ CUDA_ERROR_ILLEGAL_ADDRESS = 700
62
+ CUDA_ERROR_LAUNCH_OUT_OF_RESOURCES = 701
63
+ CUDA_ERROR_LAUNCH_TIMEOUT = 702
64
+ CUDA_ERROR_LAUNCH_INCOMPATIBLE_TEXTURING = 703
65
+ CUDA_ERROR_PEER_ACCESS_ALREADY_ENABLED = 704
66
+ CUDA_ERROR_PEER_ACCESS_NOT_ENABLED = 705
67
+ CUDA_ERROR_PRIMARY_CONTEXT_ACTIVE = 708
68
+ CUDA_ERROR_CONTEXT_IS_DESTROYED = 709
69
+ CUDA_ERROR_ASSERT = 710
70
+ CUDA_ERROR_TOO_MANY_PEERS = 711
71
+ CUDA_ERROR_HOST_MEMORY_ALREADY_REGISTERED = 712
72
+ CUDA_ERROR_HOST_MEMORY_NOT_REGISTERED = 713
73
+ CUDA_ERROR_HARDWARE_STACK_ERROR = 714
74
+ CUDA_ERROR_ILLEGAL_INSTRUCTION = 715
75
+ CUDA_ERROR_MISALIGNED_ADDRESS = 716
76
+ CUDA_ERROR_INVALID_ADDRESS_SPACE = 717
77
+ CUDA_ERROR_INVALID_PC = 718
78
+ CUDA_ERROR_LAUNCH_FAILED = 719
79
+ CUDA_ERROR_COOPERATIVE_LAUNCH_TOO_LARGE = 720
80
+ CUDA_ERROR_NOT_PERMITTED = 800
81
+ CUDA_ERROR_NOT_SUPPORTED = 801
82
+ CUDA_ERROR_SYSTEM_NOT_READY = 802
83
+ CUDA_ERROR_SYSTEM_DRIVER_MISMATCH = 803
84
+ CUDA_ERROR_COMPAT_NOT_SUPPORTED_ON_DEVICE = 804
85
+ CUDA_ERROR_MPS_CONNECTION_FAILED = 805
86
+ CUDA_ERROR_MPS_RPC_FAILURE = 806
87
+ CUDA_ERROR_MPS_SERVER_NOT_READY = 807
88
+ CUDA_ERROR_MPS_MAX_CLIENTS_REACHED = 808
89
+ CUDA_ERROR_MPS_MAX_CONNECTIONS_REACHED = 809
90
+ CUDA_ERROR_MPS_CLIENT_TERMINATED = 810
91
+ CUDA_ERROR_CDP_NOT_SUPPORTED = 811
92
+ CUDA_ERROR_CDP_VERSION_MISMATCH = 812
93
+ CUDA_ERROR_STREAM_CAPTURE_UNSUPPORTED = 900
94
+ CUDA_ERROR_STREAM_CAPTURE_INVALIDATED = 901
95
+ CUDA_ERROR_STREAM_CAPTURE_MERGE = 902
96
+ CUDA_ERROR_STREAM_CAPTURE_UNMATCHED = 903
97
+ CUDA_ERROR_STREAM_CAPTURE_UNJOINED = 904
98
+ CUDA_ERROR_STREAM_CAPTURE_ISOLATION = 905
99
+ CUDA_ERROR_STREAM_CAPTURE_IMPLICIT = 906
100
+ CUDA_ERROR_CAPTURED_EVENT = 907
101
+ CUDA_ERROR_STREAM_CAPTURE_WRONG_THREAD = 908
102
+ CUDA_ERROR_TIMEOUT = 909
103
+ CUDA_ERROR_GRAPH_EXEC_UPDATE_FAILURE = 910
104
+ CUDA_ERROR_EXTERNAL_DEVICE = 911
105
+ CUDA_ERROR_INVALID_CLUSTER_SIZE = 912
106
+ CUDA_ERROR_UNKNOWN = 999
107
+
108
+
109
+ # Function cache configurations
110
+
111
+ # no preference for shared memory or L1 (default)
112
+ CU_FUNC_CACHE_PREFER_NONE = 0x00
113
+ # prefer larger shared memory and smaller L1 cache
114
+ CU_FUNC_CACHE_PREFER_SHARED = 0x01
115
+ # prefer larger L1 cache and smaller shared memory
116
+ CU_FUNC_CACHE_PREFER_L1 = 0x02
117
+ # prefer equal sized L1 cache and shared memory
118
+ CU_FUNC_CACHE_PREFER_EQUAL = 0x03
119
+
120
+
121
+ # Context creation flags
122
+
123
+ # Automatic scheduling
124
+ CU_CTX_SCHED_AUTO = 0x00
125
+ # Set spin as default scheduling
126
+ CU_CTX_SCHED_SPIN = 0x01
127
+ # Set yield as default scheduling
128
+ CU_CTX_SCHED_YIELD = 0x02
129
+ # Set blocking synchronization as default scheduling
130
+ CU_CTX_SCHED_BLOCKING_SYNC = 0x04
131
+
132
+ CU_CTX_SCHED_MASK = 0x07
133
+ # Support mapped pinned allocations
134
+ # This flag was deprecated as of CUDA 11.0 and it no longer has effect.
135
+ # All contexts as of CUDA 3.2 behave as though the flag is enabled.
136
+ CU_CTX_MAP_HOST = 0x08
137
+ # Keep local memory allocation after launch
138
+ CU_CTX_LMEM_RESIZE_TO_MAX = 0x10
139
+ # Trigger coredumps from exceptions in this context
140
+ CU_CTX_COREDUMP_ENABLE = 0x20
141
+ # Enable user pipe to trigger coredumps in this context
142
+ CU_CTX_USER_COREDUMP_ENABLE = 0x40
143
+ # Force synchronous blocking on cudaMemcpy/cudaMemset
144
+ CU_CTX_SYNC_MEMOPS = 0x80
145
+
146
+ CU_CTX_FLAGS_MASK = 0xFF
147
+
148
+
149
+ # DEFINES
150
+
151
+ # If set, host memory is portable between CUDA contexts.
152
+ # Flag for cuMemHostAlloc()
153
+ CU_MEMHOSTALLOC_PORTABLE = 0x01
154
+
155
+ # If set, host memory is mapped into CUDA address space and
156
+ # cuMemHostGetDevicePointer() may be called on the host pointer.
157
+ # Flag for cuMemHostAlloc()
158
+ CU_MEMHOSTALLOC_DEVICEMAP = 0x02
159
+
160
+ # If set, host memory is allocated as write-combined - fast to write,
161
+ # faster to DMA, slow to read except via SSE4 streaming load instruction
162
+ # (MOVNTDQA).
163
+ # Flag for cuMemHostAlloc()
164
+ CU_MEMHOSTALLOC_WRITECOMBINED = 0x04
165
+
166
+
167
+ # If set, host memory is portable between CUDA contexts.
168
+ # Flag for cuMemHostRegister()
169
+ CU_MEMHOSTREGISTER_PORTABLE = 0x01
170
+
171
+ # If set, host memory is mapped into CUDA address space and
172
+ # cuMemHostGetDevicePointer() may be called on the host pointer.
173
+ # Flag for cuMemHostRegister()
174
+ CU_MEMHOSTREGISTER_DEVICEMAP = 0x02
175
+
176
+ # If set, the passed memory pointer is treated as pointing to some
177
+ # memory-mapped I/O space, e.g. belonging to a third-party PCIe device.
178
+ # On Windows the flag is a no-op. On Linux that memory is marked
179
+ # as non cache-coherent for the GPU and is expected
180
+ # to be physically contiguous. It may return CUDA_ERROR_NOT_PERMITTED
181
+ # if run as an unprivileged user, CUDA_ERROR_NOT_SUPPORTED on older
182
+ # Linux kernel versions. On all other platforms, it is not supported
183
+ # and CUDA_ERROR_NOT_SUPPORTED is returned.
184
+ # Flag for cuMemHostRegister()
185
+ CU_MEMHOSTREGISTER_IOMEMORY = 0x04
186
+
187
+ # If set, the passed memory pointer is treated as pointing to memory
188
+ # that is considered read-only by the device. On platforms without
189
+ # CU_DEVICE_ATTRIBUTE_PAGEABLE_MEMORY_ACCESS_USES_HOST_PAGE_TABLES,
190
+ # this flag is required in order to register memory mapped
191
+ # to the CPU as read-only. Support for the use of this flag can be
192
+ # queried from the device attribute
193
+ # CU_DEVICE_ATTRIBUTE_READ_ONLY_HOST_REGISTER_SUPPORTED.
194
+ # Using this flag with a current context associated with a device
195
+ # that does not have this attribute set will cause cuMemHostRegister
196
+ # to error with CUDA_ERROR_NOT_SUPPORTED.
197
+ CU_MEMHOSTREGISTER_READ_ONLY = 0x08
198
+
199
+
200
+ # CUDA Mem Attach Flags
201
+
202
+ # If set, managed memory is accessible from all streams on all devices.
203
+ CU_MEM_ATTACH_GLOBAL = 0x01
204
+
205
+ # If set on a platform where the device attribute
206
+ # cudaDevAttrConcurrentManagedAccess is zero, then managed memory is
207
+ # only accessible on the host (unless explicitly attached to a stream
208
+ # with cudaStreamAttachMemAsync, in which case it can be used in kernels
209
+ # launched on that stream).
210
+ CU_MEM_ATTACH_HOST = 0x02
211
+
212
+ # If set on a platform where the device attribute
213
+ # cudaDevAttrConcurrentManagedAccess is zero, then managed memory accesses
214
+ # on the associated device must only be from a single stream.
215
+ CU_MEM_ATTACH_SINGLE = 0x04
216
+
217
+
218
+ # Event creation flags
219
+
220
+ # Default event flag
221
+ CU_EVENT_DEFAULT = 0x0
222
+ # Event uses blocking synchronization
223
+ CU_EVENT_BLOCKING_SYNC = 0x1
224
+ # Event will not record timing data
225
+ CU_EVENT_DISABLE_TIMING = 0x2
226
+ # Event is suitable for interprocess use. CU_EVENT_DISABLE_TIMING must be set
227
+ CU_EVENT_INTERPROCESS = 0x4
228
+
229
+
230
+ # Pointer information
231
+
232
+ # The CUcontext on which a pointer was allocated or registered
233
+ CU_POINTER_ATTRIBUTE_CONTEXT = 1
234
+ # The CUmemorytype describing the physical location of a pointer
235
+ CU_POINTER_ATTRIBUTE_MEMORY_TYPE = 2
236
+ # The address at which a pointer's memory may be accessed on the device
237
+ CU_POINTER_ATTRIBUTE_DEVICE_POINTER = 3
238
+ # The address at which a pointer's memory may be accessed on the host
239
+ CU_POINTER_ATTRIBUTE_HOST_POINTER = 4
240
+ # A pair of tokens for use with the nv-p2p.h Linux kernel interface
241
+ CU_POINTER_ATTRIBUTE_P2P_TOKENS = 5
242
+ # Synchronize every synchronous memory operation initiated on this region
243
+ CU_POINTER_ATTRIBUTE_SYNC_MEMOPS = 6
244
+ # A process-wide unique ID for an allocated memory region
245
+ CU_POINTER_ATTRIBUTE_BUFFER_ID = 7
246
+ # Indicates if the pointer points to managed memory
247
+ CU_POINTER_ATTRIBUTE_IS_MANAGED = 8
248
+ # A device ordinal of a device on which a pointer was allocated or registered
249
+ CU_POINTER_ATTRIBUTE_DEVICE_ORDINAL = 9
250
+ # 1 if this pointer maps to an allocation
251
+ # that is suitable for cudaIpcGetMemHandle, 0 otherwise
252
+ CU_POINTER_ATTRIBUTE_IS_LEGACY_CUDA_IPC_CAPABLE = 10
253
+ # Starting address for this requested pointer
254
+ CU_POINTER_ATTRIBUTE_RANGE_START_ADDR = 11
255
+ # Size of the address range for this requested pointer
256
+ CU_POINTER_ATTRIBUTE_RANGE_SIZE = 12
257
+ # 1 if this pointer is in a valid address range
258
+ # that is mapped to a backing allocation, 0 otherwise
259
+ CU_POINTER_ATTRIBUTE_MAPPED = 13
260
+ # Bitmask of allowed CUmemAllocationHandleType for this allocation
261
+ CU_POINTER_ATTRIBUTE_ALLOWED_HANDLE_TYPES = 14
262
+ # 1 if the memory this pointer is referencing
263
+ # can be used with the GPUDirect RDMA API
264
+ CU_POINTER_ATTRIBUTE_IS_GPU_DIRECT_RDMA_CAPABLE = 15
265
+ # Returns the access flags the device associated
266
+ # with the current context has on the corresponding
267
+ # memory referenced by the pointer given
268
+ CU_POINTER_ATTRIBUTE_ACCESS_FLAGS = 16
269
+ # Returns the mempool handle for the allocation
270
+ # if it was allocated from a mempool. Otherwise returns NULL
271
+ CU_POINTER_ATTRIBUTE_MEMPOOL_HANDLE = 17
272
+ # Size of the actual underlying mapping that the pointer belongs to
273
+ CU_POINTER_ATTRIBUTE_MAPPING_SIZE = 18
274
+ # The start address of the mapping that the pointer belongs to
275
+ CU_POINTER_ATTRIBUTE_MAPPING_BASE_ADDR = 19
276
+ # A process-wide unique id corresponding to the
277
+ # physical allocation the pointer belongs to
278
+ CU_POINTER_ATTRIBUTE_MEMORY_BLOCK_ID = 20
279
+
280
+
281
+ # Memory types
282
+
283
+ # Host memory
284
+ CU_MEMORYTYPE_HOST = 0x01
285
+ # Device memory
286
+ CU_MEMORYTYPE_DEVICE = 0x02
287
+ # Array memory
288
+ CU_MEMORYTYPE_ARRAY = 0x03
289
+ # Unified device or host memory
290
+ CU_MEMORYTYPE_UNIFIED = 0x04
291
+
292
+
293
+ # Device code formats
294
+
295
+ # Compiled device-class-specific device code
296
+ # Applicable options: none
297
+ CU_JIT_INPUT_CUBIN = 0
298
+
299
+ # PTX source code
300
+ # Applicable options: PTX compiler options
301
+ CU_JIT_INPUT_PTX = 1
302
+
303
+ # Bundle of multiple cubins and/or PTX of some device code
304
+ # Applicable options: PTX compiler options, ::CU_JIT_FALLBACK_STRATEGY
305
+ CU_JIT_INPUT_FATBINARY = 2
306
+
307
+ # Host object with embedded device code
308
+ # Applicable options: PTX compiler options, ::CU_JIT_FALLBACK_STRATEGY
309
+ CU_JIT_INPUT_OBJECT = 3
310
+
311
+ # Archive of host objects with embedded device code
312
+ # Applicable options: PTX compiler options, ::CU_JIT_FALLBACK_STRATEGY
313
+ CU_JIT_INPUT_LIBRARY = 4
314
+
315
+ # LTO IR
316
+ CU_JIT_INPUT_NVVM = 5
317
+
318
+ CU_JIT_NUM_INPUT_TYPES = 6
319
+
320
+
321
+ # Online compiler and linker options
322
+
323
+ # Max number of registers that a thread may use.
324
+ # Option type: unsigned int
325
+ # Applies to: compiler only
326
+ CU_JIT_MAX_REGISTERS = 0
327
+
328
+ # IN: Specifies minimum number of threads per block to target compilation
329
+ # for
330
+ # OUT: Returns the number of threads the compiler actually targeted.
331
+ # This restricts the resource utilization of the compiler (e.g. max
332
+ # registers) such that a block with the given number of threads should be
333
+ # able to launch based on register limitations. Note, this option does not
334
+ # currently take into account any other resource limitations, such as
335
+ # shared memory utilization.
336
+ # Cannot be combined with ::CU_JIT_TARGET.
337
+ # Option type: unsigned int
338
+ # Applies to: compiler only
339
+ CU_JIT_THREADS_PER_BLOCK = 1
340
+
341
+ # Overwrites the option value with the total wall clock time, in
342
+ # milliseconds, spent in the compiler and linker
343
+ # Option type: float
344
+ # Applies to: compiler and linker
345
+ CU_JIT_WALL_TIME = 2
346
+
347
+ # Pointer to a buffer in which to print any log messages
348
+ # that are informational in nature (the buffer size is specified via
349
+ # option ::CU_JIT_INFO_LOG_BUFFER_SIZE_BYTES)
350
+ # Option type: char *
351
+ # Applies to: compiler and linker
352
+ CU_JIT_INFO_LOG_BUFFER = 3
353
+
354
+ # IN: Log buffer size in bytes. Log messages will be capped at this size
355
+ # (including null terminator)
356
+ # OUT: Amount of log buffer filled with messages
357
+ # Option type: unsigned int
358
+ # Applies to: compiler and linker
359
+ CU_JIT_INFO_LOG_BUFFER_SIZE_BYTES = 4
360
+
361
+ # Pointer to a buffer in which to print any log messages that
362
+ # reflect errors (the buffer size is specified via option
363
+ # ::CU_JIT_ERROR_LOG_BUFFER_SIZE_BYTES)
364
+ # Option type: char *
365
+ # Applies to: compiler and linker
366
+ CU_JIT_ERROR_LOG_BUFFER = 5
367
+
368
+ # IN: Log buffer size in bytes. Log messages will be capped at this size
369
+ # (including null terminator)
370
+ # OUT: Amount of log buffer filled with messages
371
+ # Option type: unsigned int
372
+ # Applies to: compiler and linker
373
+ CU_JIT_ERROR_LOG_BUFFER_SIZE_BYTES = 6
374
+
375
+ # Level of optimizations to apply to generated code (0 - 4), with 4
376
+ # being the default and highest level of optimizations.
377
+ # Option type: unsigned int
378
+ # Applies to: compiler only
379
+ CU_JIT_OPTIMIZATION_LEVEL = 7
380
+
381
+ # No option value required. Determines the target based on the current
382
+ # attached context (default)
383
+ # Option type: No option value needed
384
+ # Applies to: compiler and linker
385
+ CU_JIT_TARGET_FROM_CUCONTEXT = 8
386
+
387
+ # Target is chosen based on supplied ::CUjit_target. Cannot be
388
+ # combined with ::CU_JIT_THREADS_PER_BLOCK.
389
+ # Option type: unsigned int for enumerated type ::CUjit_target
390
+ # Applies to: compiler and linker
391
+ CU_JIT_TARGET = 9
392
+
393
+ # Specifies choice of fallback strategy if matching cubin is not found.
394
+ # Choice is based on supplied ::CUjit_fallback.
395
+ # Option type: unsigned int for enumerated type ::CUjit_fallback
396
+ # Applies to: compiler only
397
+ CU_JIT_FALLBACK_STRATEGY = 10
398
+
399
+ # Specifies whether to create debug information in output (-g)
400
+ # (0: false, default)
401
+ # Option type: int
402
+ # Applies to: compiler and linker
403
+ CU_JIT_GENERATE_DEBUG_INFO = 11
404
+
405
+ # Generate verbose log messages (0: false, default)
406
+ # Option type: int
407
+ # Applies to: compiler and linker
408
+ CU_JIT_LOG_VERBOSE = 12
409
+
410
+ # Generate line number information (-lineinfo) (0: false, default)
411
+ # Option type: int
412
+ # Applies to: compiler only
413
+ CU_JIT_GENERATE_LINE_INFO = 13
414
+
415
+ # Specifies whether to enable caching explicitly (-dlcm)
416
+ # Choice is based on supplied ::CUjit_cacheMode_enum.
417
+ # Option type: unsigned int for enumerated type ::CUjit_cacheMode_enum
418
+ # Applies to: compiler only
419
+ CU_JIT_CACHE_MODE = 14
420
+
421
+
422
+ # CUfunction_attribute
423
+
424
+ # The maximum number of threads per block, beyond which a launch of the
425
+ # function would fail. This number depends on both the function and the
426
+ # device on which the function is currently loaded.
427
+ CU_FUNC_ATTRIBUTE_MAX_THREADS_PER_BLOCK = 0
428
+
429
+ # The size in bytes of statically-allocated shared memory required by
430
+ # this function. This does not include dynamically-allocated shared
431
+ # memory requested by the user at runtime.
432
+ CU_FUNC_ATTRIBUTE_SHARED_SIZE_BYTES = 1
433
+
434
+ # The size in bytes of user-allocated constant memory required by this
435
+ # function.
436
+ CU_FUNC_ATTRIBUTE_CONST_SIZE_BYTES = 2
437
+
438
+ # The size in bytes of local memory used by each thread of this function.
439
+ CU_FUNC_ATTRIBUTE_LOCAL_SIZE_BYTES = 3
440
+
441
+ # The number of registers used by each thread of this function.
442
+ CU_FUNC_ATTRIBUTE_NUM_REGS = 4
443
+
444
+ # The PTX virtual architecture version for which the function was
445
+ # compiled. This value is the major PTX version * 10 + the minor PTX
446
+ # version, so a PTX version 1.3 function would return the value 13.
447
+ # Note that this may return the undefined value of 0 for cubins
448
+ # compiled prior to CUDA 3.0.
449
+ CU_FUNC_ATTRIBUTE_PTX_VERSION = 5
450
+
451
+ # The binary architecture version for which the function was compiled.
452
+ # This value is the major binary version * 10 + the minor binary version,
453
+ # so a binary version 1.3 function would return the value 13. Note that
454
+ # this will return a value of 10 for legacy cubins that do not have a
455
+ # properly-encoded binary architecture version.
456
+ CU_FUNC_ATTRIBUTE_BINARY_VERSION = 6
457
+
458
+ # The attribute to indicate whether the function has been compiled
459
+ # with user specified option "-Xptxas --dlcm=ca" set
460
+ CU_FUNC_ATTRIBUTE_CACHE_MODE_CA = 7
461
+
462
+ # The maximum size in bytes of dynamically-allocated shared memory
463
+ # that can be used by this function. If the user-specified
464
+ # dynamic shared memory size is larger than this value,
465
+ # the launch will fail. See cuFuncSetAttribute, cuKernelSetAttribute
466
+ CU_FUNC_ATTRIBUTE_MAX_DYNAMIC_SHARED_SIZE_BYTES = 8
467
+
468
+ # On devices where the L1 cache and shared memory use the same
469
+ # hardware resources, this sets the shared memory carveout preference,
470
+ # in percent of the total shared memory. Refer to
471
+ # CU_DEVICE_ATTRIBUTE_MAX_SHARED_MEMORY_PER_MULTIPROCESSOR.
472
+ # This is only a hint, and the driver can choose a different ratio
473
+ # if required to execute the function.
474
+ # See cuFuncSetAttribute, cuKernelSetAttribute
475
+ CU_FUNC_ATTRIBUTE_PREFERRED_SHARED_MEMORY_CARVEOUT = 9
476
+
477
+ # If this attribute is set, the kernel must launch with a valid cluster
478
+ # size specified. See cuFuncSetAttribute, cuKernelSetAttribute
479
+ CU_FUNC_ATTRIBUTE_CLUSTER_SIZE_MUST_BE_SET = 10
480
+
481
+ # The required cluster width in blocks. The values must either all be 0
482
+ # or all be positive. The validity of the cluster dimensions
483
+ # is otherwise checked at launch time. If the value is set during
484
+ # compile time, it cannot be set at runtime.
485
+ # Setting it at runtime will return CUDA_ERROR_NOT_PERMITTED.
486
+ # See cuFuncSetAttribute, cuKernelSetAttribute
487
+ CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_WIDTH = 11
488
+
489
+ # The required cluster height in blocks. The values must either all be 0
490
+ # or all be positive. The validity of the cluster dimensions
491
+ # is otherwise checked at launch time. If the value is set during
492
+ # compile time, it cannot be set at runtime.
493
+ # Setting it at runtime should return CUDA_ERROR_NOT_PERMITTED.
494
+ # See cuFuncSetAttribute, cuKernelSetAttribute
495
+ CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_HEIGHT = 12
496
+
497
+ # The required cluster depth in blocks. The values must either all be 0
498
+ # or all be positive. The validity of the cluster dimensions
499
+ # is otherwise checked at launch time. If the value is set during
500
+ # compile time, it cannot be set at runtime.
501
+ # Setting it at runtime should return CUDA_ERROR_NOT_PERMITTED.
502
+ # See cuFuncSetAttribute, cuKernelSetAttribute
503
+ CU_FUNC_ATTRIBUTE_REQUIRED_CLUSTER_DEPTH = 13
504
+
505
+ # Whether the function can be launched with non-portable cluster size.
506
+ # 1 is allowed, 0 is disallowed. A non-portable cluster size may only
507
+ # function on the specific SKUs the program is tested on.
508
+ # The launch might fail if the program is run on a different hardware platform.
509
+ # For more details, refer to:
510
+ # https://docs.nvidia.com/cuda/cuda-driver-api/group__CUDA__TYPES.html#group__CUDA__TYPES
511
+ CU_FUNC_ATTRIBUTE_NON_PORTABLE_CLUSTER_SIZE_ALLOWED = 14
512
+
513
+ # The block scheduling policy of a function.
514
+ # The value type is CUclusterSchedulingPolicy / cudaClusterSchedulingPolicy.
515
+ # See cuFuncSetAttribute, cuKernelSetAttribute
516
+ CU_FUNC_ATTRIBUTE_CLUSTER_SCHEDULING_POLICY_PREFERENCE = 15
517
+
518
+
519
+ # Device attributes
520
+
521
+ CU_DEVICE_ATTRIBUTE_MAX_THREADS_PER_BLOCK = 1
522
+ CU_DEVICE_ATTRIBUTE_MAX_BLOCK_DIM_X = 2
523
+ CU_DEVICE_ATTRIBUTE_MAX_BLOCK_DIM_Y = 3
524
+ CU_DEVICE_ATTRIBUTE_MAX_BLOCK_DIM_Z = 4
525
+ CU_DEVICE_ATTRIBUTE_MAX_GRID_DIM_X = 5
526
+ CU_DEVICE_ATTRIBUTE_MAX_GRID_DIM_Y = 6
527
+ CU_DEVICE_ATTRIBUTE_MAX_GRID_DIM_Z = 7
528
+ CU_DEVICE_ATTRIBUTE_MAX_SHARED_MEMORY_PER_BLOCK = 8
529
+ CU_DEVICE_ATTRIBUTE_TOTAL_CONSTANT_MEMORY = 9
530
+ CU_DEVICE_ATTRIBUTE_WARP_SIZE = 10
531
+ CU_DEVICE_ATTRIBUTE_MAX_PITCH = 11
532
+ CU_DEVICE_ATTRIBUTE_MAX_REGISTERS_PER_BLOCK = 12
533
+ CU_DEVICE_ATTRIBUTE_CLOCK_RATE = 13
534
+ CU_DEVICE_ATTRIBUTE_TEXTURE_ALIGNMENT = 14
535
+ CU_DEVICE_ATTRIBUTE_GPU_OVERLAP = 15
536
+ CU_DEVICE_ATTRIBUTE_MULTIPROCESSOR_COUNT = 16
537
+ CU_DEVICE_ATTRIBUTE_KERNEL_EXEC_TIMEOUT = 17
538
+ CU_DEVICE_ATTRIBUTE_INTEGRATED = 18
539
+ CU_DEVICE_ATTRIBUTE_CAN_MAP_HOST_MEMORY = 19
540
+ CU_DEVICE_ATTRIBUTE_COMPUTE_MODE = 20
541
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_1D_WIDTH = 21
542
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_WIDTH = 22
543
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_HEIGHT = 23
544
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_3D_WIDTH = 24
545
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_3D_HEIGHT = 25
546
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_3D_DEPTH = 26
547
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_LAYERED_WIDTH = 27
548
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_LAYERED_HEIGHT = 28
549
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_LAYERED_LAYERS = 29
550
+ CU_DEVICE_ATTRIBUTE_SURFACE_ALIGNMENT = 30
551
+ CU_DEVICE_ATTRIBUTE_CONCURRENT_KERNELS = 31
552
+ CU_DEVICE_ATTRIBUTE_ECC_ENABLED = 32
553
+ CU_DEVICE_ATTRIBUTE_PCI_BUS_ID = 33
554
+ CU_DEVICE_ATTRIBUTE_PCI_DEVICE_ID = 34
555
+ CU_DEVICE_ATTRIBUTE_TCC_DRIVER = 35
556
+ CU_DEVICE_ATTRIBUTE_MEMORY_CLOCK_RATE = 36
557
+ CU_DEVICE_ATTRIBUTE_GLOBAL_MEMORY_BUS_WIDTH = 37
558
+ CU_DEVICE_ATTRIBUTE_L2_CACHE_SIZE = 38
559
+ CU_DEVICE_ATTRIBUTE_MAX_THREADS_PER_MULTI_PROCESSOR = 39
560
+ CU_DEVICE_ATTRIBUTE_ASYNC_ENGINE_COUNT = 40
561
+ CU_DEVICE_ATTRIBUTE_UNIFIED_ADDRESSING = 41
562
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_1D_LAYERED_WIDTH = 42
563
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_1D_LAYERED_LAYERS = 43
564
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_GATHER_WIDTH = 45
565
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_GATHER_HEIGHT = 46
566
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_3D_WIDTH_ALT = 47
567
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_3D_HEIGHT_ALT = 48
568
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_3D_DEPTH_ALT = 49
569
+ CU_DEVICE_ATTRIBUTE_PCI_DOMAIN_ID = 50
570
+ CU_DEVICE_ATTRIBUTE_TEXTURE_PITCH_ALIGNMENT = 51
571
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_CUBEMAP_WIDTH = 52
572
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_CUBEMAP_LAYERED_WIDTH = 53
573
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_CUBEMAP_LAYERED_LAYERS = 54
574
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_1D_WIDTH = 55
575
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_2D_WIDTH = 56
576
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_2D_HEIGHT = 57
577
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_3D_WIDTH = 58
578
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_3D_HEIGHT = 59
579
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_3D_DEPTH = 60
580
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_1D_LAYERED_WIDTH = 61
581
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_1D_LAYERED_LAYERS = 62
582
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_2D_LAYERED_WIDTH = 63
583
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_2D_LAYERED_HEIGHT = 64
584
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_2D_LAYERED_LAYERS = 65
585
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_CUBEMAP_WIDTH = 66
586
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_CUBEMAP_LAYERED_WIDTH = 67
587
+ CU_DEVICE_ATTRIBUTE_MAX_SURFACE_CUBEMAP_LAYERED_LAYERS = 68
588
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_1D_LINEAR_WIDTH = 69
589
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_LINEAR_WIDTH = 70
590
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_LINEAR_HEIGHT = 71
591
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_LINEAR_PITCH = 72
592
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_2D_MIPMAPPED_WIDTH = 73
593
+ CU_DEVICE_ATTRIBUTE_MAX_MAX_TEXTURE_2D_MIPMAPPED_HEIGHT = 74
594
+ CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MAJOR = 75
595
+ CU_DEVICE_ATTRIBUTE_COMPUTE_CAPABILITY_MINOR = 76
596
+ CU_DEVICE_ATTRIBUTE_MAX_TEXTURE_1D_MIPMAPPED_WIDTH = 77
597
+ CU_DEVICE_ATTRIBUTE_STREAM_PRIORITIES_SUPPORTED = 78
598
+ CU_DEVICE_ATTRIBUTE_GLOBAL_L1_CACHE_SUPPORTED = 79
599
+ CU_DEVICE_ATTRIBUTE_LOCAL_L1_CACHE_SUPPORTED = 80
600
+ CU_DEVICE_ATTRIBUTE_MAX_SHARED_MEMORY_PER_MULTIPROCESSOR = 81
601
+ CU_DEVICE_ATTRIBUTE_MAX_REGISTERS_PER_MULTIPROCESSOR = 82
602
+ CU_DEVICE_ATTRIBUTE_MANAGED_MEMORY = 83
603
+ CU_DEVICE_ATTRIBUTE_IS_MULTI_GPU_BOARD = 84
604
+ CU_DEVICE_ATTRIBUTE_MULTI_GPU_BOARD_GROUP_ID = 85
605
+ CU_DEVICE_ATTRIBUTE_HOST_NATIVE_ATOMIC_SUPPORTED = 86
606
+ CU_DEVICE_ATTRIBUTE_SINGLE_TO_DOUBLE_PRECISION_PERF_RATIO = 87
607
+ CU_DEVICE_ATTRIBUTE_PAGEABLE_MEMORY_ACCESS = 88
608
+ CU_DEVICE_ATTRIBUTE_CONCURRENT_MANAGED_ACCESS = 89
609
+ CU_DEVICE_ATTRIBUTE_COMPUTE_PREEMPTION_SUPPORTED = 90
610
+ CU_DEVICE_ATTRIBUTE_CAN_USE_HOST_POINTER_FOR_REGISTERED_MEM = 91
611
+ CU_DEVICE_ATTRIBUTE_COOPERATIVE_LAUNCH = 95
612
+ CU_DEVICE_ATTRIBUTE_COOPERATIVE_MULTI_DEVICE_LAUNCH = 96
613
+ CU_DEVICE_ATTRIBUTE_MAX_SHARED_MEMORY_PER_BLOCK_OPTIN = 97
@@ -0,0 +1,48 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: BSD-2-Clause
3
+
4
+
5
+ class CudaDriverError(Exception):
6
+ pass
7
+
8
+
9
+ class CudaRuntimeError(Exception):
10
+ pass
11
+
12
+
13
+ class CudaSupportError(ImportError):
14
+ pass
15
+
16
+
17
+ class NvvmError(Exception):
18
+ def __str__(self):
19
+ return "\n".join(map(str, self.args))
20
+
21
+
22
+ class NvvmSupportError(ImportError):
23
+ pass
24
+
25
+
26
+ class NvvmWarning(Warning):
27
+ pass
28
+
29
+
30
+ class NvrtcError(Exception):
31
+ def __str__(self):
32
+ return "\n".join(map(str, self.args))
33
+
34
+
35
+ class NvrtcCompilationError(NvrtcError):
36
+ pass
37
+
38
+
39
+ class NvrtcBuiltinOperationFailure(NvrtcError):
40
+ pass
41
+
42
+
43
+ class NvrtcSupportError(ImportError):
44
+ pass
45
+
46
+
47
+ class CCSupportError(RuntimeError):
48
+ pass