numba-cuda 0.21.1__cp313-cp313-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (488) hide show
  1. _numba_cuda_redirector.pth +4 -0
  2. _numba_cuda_redirector.py +89 -0
  3. numba_cuda/VERSION +1 -0
  4. numba_cuda/__init__.py +6 -0
  5. numba_cuda/_version.py +11 -0
  6. numba_cuda/numba/cuda/__init__.py +70 -0
  7. numba_cuda/numba/cuda/_internal/cuda_bf16.py +16394 -0
  8. numba_cuda/numba/cuda/_internal/cuda_fp16.py +8112 -0
  9. numba_cuda/numba/cuda/api.py +577 -0
  10. numba_cuda/numba/cuda/api_util.py +76 -0
  11. numba_cuda/numba/cuda/args.py +72 -0
  12. numba_cuda/numba/cuda/bf16.py +397 -0
  13. numba_cuda/numba/cuda/cache_hints.py +287 -0
  14. numba_cuda/numba/cuda/cext/__init__.py +2 -0
  15. numba_cuda/numba/cuda/cext/_devicearray.cp313-win_amd64.pyd +0 -0
  16. numba_cuda/numba/cuda/cext/_devicearray.cpp +159 -0
  17. numba_cuda/numba/cuda/cext/_devicearray.h +29 -0
  18. numba_cuda/numba/cuda/cext/_dispatcher.cp313-win_amd64.pyd +0 -0
  19. numba_cuda/numba/cuda/cext/_dispatcher.cpp +1098 -0
  20. numba_cuda/numba/cuda/cext/_hashtable.cpp +532 -0
  21. numba_cuda/numba/cuda/cext/_hashtable.h +135 -0
  22. numba_cuda/numba/cuda/cext/_helperlib.c +71 -0
  23. numba_cuda/numba/cuda/cext/_helperlib.cp313-win_amd64.pyd +0 -0
  24. numba_cuda/numba/cuda/cext/_helpermod.c +82 -0
  25. numba_cuda/numba/cuda/cext/_pymodule.h +38 -0
  26. numba_cuda/numba/cuda/cext/_typeconv.cp313-win_amd64.pyd +0 -0
  27. numba_cuda/numba/cuda/cext/_typeconv.cpp +206 -0
  28. numba_cuda/numba/cuda/cext/_typeof.cpp +1159 -0
  29. numba_cuda/numba/cuda/cext/_typeof.h +19 -0
  30. numba_cuda/numba/cuda/cext/capsulethunk.h +111 -0
  31. numba_cuda/numba/cuda/cext/mviewbuf.c +385 -0
  32. numba_cuda/numba/cuda/cext/mviewbuf.cp313-win_amd64.pyd +0 -0
  33. numba_cuda/numba/cuda/cext/typeconv.cpp +212 -0
  34. numba_cuda/numba/cuda/cext/typeconv.hpp +101 -0
  35. numba_cuda/numba/cuda/cg.py +67 -0
  36. numba_cuda/numba/cuda/cgutils.py +1294 -0
  37. numba_cuda/numba/cuda/cloudpickle/__init__.py +21 -0
  38. numba_cuda/numba/cuda/cloudpickle/cloudpickle.py +1598 -0
  39. numba_cuda/numba/cuda/cloudpickle/cloudpickle_fast.py +17 -0
  40. numba_cuda/numba/cuda/codegen.py +541 -0
  41. numba_cuda/numba/cuda/compiler.py +1396 -0
  42. numba_cuda/numba/cuda/core/analysis.py +758 -0
  43. numba_cuda/numba/cuda/core/annotations/__init__.py +0 -0
  44. numba_cuda/numba/cuda/core/annotations/pretty_annotate.py +288 -0
  45. numba_cuda/numba/cuda/core/annotations/type_annotations.py +305 -0
  46. numba_cuda/numba/cuda/core/base.py +1332 -0
  47. numba_cuda/numba/cuda/core/boxing.py +1411 -0
  48. numba_cuda/numba/cuda/core/bytecode.py +728 -0
  49. numba_cuda/numba/cuda/core/byteflow.py +2346 -0
  50. numba_cuda/numba/cuda/core/caching.py +744 -0
  51. numba_cuda/numba/cuda/core/callconv.py +392 -0
  52. numba_cuda/numba/cuda/core/codegen.py +171 -0
  53. numba_cuda/numba/cuda/core/compiler.py +199 -0
  54. numba_cuda/numba/cuda/core/compiler_lock.py +85 -0
  55. numba_cuda/numba/cuda/core/compiler_machinery.py +497 -0
  56. numba_cuda/numba/cuda/core/config.py +650 -0
  57. numba_cuda/numba/cuda/core/consts.py +124 -0
  58. numba_cuda/numba/cuda/core/controlflow.py +989 -0
  59. numba_cuda/numba/cuda/core/entrypoints.py +57 -0
  60. numba_cuda/numba/cuda/core/environment.py +66 -0
  61. numba_cuda/numba/cuda/core/errors.py +917 -0
  62. numba_cuda/numba/cuda/core/event.py +511 -0
  63. numba_cuda/numba/cuda/core/funcdesc.py +330 -0
  64. numba_cuda/numba/cuda/core/generators.py +387 -0
  65. numba_cuda/numba/cuda/core/imputils.py +509 -0
  66. numba_cuda/numba/cuda/core/inline_closurecall.py +1787 -0
  67. numba_cuda/numba/cuda/core/interpreter.py +3617 -0
  68. numba_cuda/numba/cuda/core/ir.py +1812 -0
  69. numba_cuda/numba/cuda/core/ir_utils.py +2638 -0
  70. numba_cuda/numba/cuda/core/optional.py +129 -0
  71. numba_cuda/numba/cuda/core/options.py +262 -0
  72. numba_cuda/numba/cuda/core/postproc.py +249 -0
  73. numba_cuda/numba/cuda/core/pythonapi.py +1859 -0
  74. numba_cuda/numba/cuda/core/registry.py +46 -0
  75. numba_cuda/numba/cuda/core/removerefctpass.py +123 -0
  76. numba_cuda/numba/cuda/core/rewrites/__init__.py +26 -0
  77. numba_cuda/numba/cuda/core/rewrites/ir_print.py +91 -0
  78. numba_cuda/numba/cuda/core/rewrites/registry.py +104 -0
  79. numba_cuda/numba/cuda/core/rewrites/static_binop.py +41 -0
  80. numba_cuda/numba/cuda/core/rewrites/static_getitem.py +189 -0
  81. numba_cuda/numba/cuda/core/rewrites/static_raise.py +100 -0
  82. numba_cuda/numba/cuda/core/sigutils.py +68 -0
  83. numba_cuda/numba/cuda/core/ssa.py +498 -0
  84. numba_cuda/numba/cuda/core/targetconfig.py +330 -0
  85. numba_cuda/numba/cuda/core/tracing.py +231 -0
  86. numba_cuda/numba/cuda/core/transforms.py +956 -0
  87. numba_cuda/numba/cuda/core/typed_passes.py +867 -0
  88. numba_cuda/numba/cuda/core/typeinfer.py +1950 -0
  89. numba_cuda/numba/cuda/core/unsafe/__init__.py +0 -0
  90. numba_cuda/numba/cuda/core/unsafe/bytes.py +67 -0
  91. numba_cuda/numba/cuda/core/unsafe/eh.py +67 -0
  92. numba_cuda/numba/cuda/core/unsafe/refcount.py +98 -0
  93. numba_cuda/numba/cuda/core/untyped_passes.py +1979 -0
  94. numba_cuda/numba/cuda/cpython/builtins.py +1153 -0
  95. numba_cuda/numba/cuda/cpython/charseq.py +1218 -0
  96. numba_cuda/numba/cuda/cpython/cmathimpl.py +560 -0
  97. numba_cuda/numba/cuda/cpython/enumimpl.py +103 -0
  98. numba_cuda/numba/cuda/cpython/iterators.py +167 -0
  99. numba_cuda/numba/cuda/cpython/listobj.py +1326 -0
  100. numba_cuda/numba/cuda/cpython/mathimpl.py +499 -0
  101. numba_cuda/numba/cuda/cpython/numbers.py +1475 -0
  102. numba_cuda/numba/cuda/cpython/rangeobj.py +289 -0
  103. numba_cuda/numba/cuda/cpython/slicing.py +322 -0
  104. numba_cuda/numba/cuda/cpython/tupleobj.py +456 -0
  105. numba_cuda/numba/cuda/cpython/unicode.py +2865 -0
  106. numba_cuda/numba/cuda/cpython/unicode_support.py +1597 -0
  107. numba_cuda/numba/cuda/cpython/unsafe/__init__.py +0 -0
  108. numba_cuda/numba/cuda/cpython/unsafe/numbers.py +64 -0
  109. numba_cuda/numba/cuda/cpython/unsafe/tuple.py +92 -0
  110. numba_cuda/numba/cuda/cuda_paths.py +691 -0
  111. numba_cuda/numba/cuda/cudadecl.py +556 -0
  112. numba_cuda/numba/cuda/cudadrv/__init__.py +14 -0
  113. numba_cuda/numba/cuda/cudadrv/devicearray.py +951 -0
  114. numba_cuda/numba/cuda/cudadrv/devices.py +249 -0
  115. numba_cuda/numba/cuda/cudadrv/driver.py +3222 -0
  116. numba_cuda/numba/cuda/cudadrv/drvapi.py +435 -0
  117. numba_cuda/numba/cuda/cudadrv/dummyarray.py +558 -0
  118. numba_cuda/numba/cuda/cudadrv/enums.py +613 -0
  119. numba_cuda/numba/cuda/cudadrv/error.py +48 -0
  120. numba_cuda/numba/cuda/cudadrv/libs.py +220 -0
  121. numba_cuda/numba/cuda/cudadrv/linkable_code.py +184 -0
  122. numba_cuda/numba/cuda/cudadrv/mappings.py +14 -0
  123. numba_cuda/numba/cuda/cudadrv/ndarray.py +26 -0
  124. numba_cuda/numba/cuda/cudadrv/nvrtc.py +193 -0
  125. numba_cuda/numba/cuda/cudadrv/nvvm.py +756 -0
  126. numba_cuda/numba/cuda/cudadrv/rtapi.py +13 -0
  127. numba_cuda/numba/cuda/cudadrv/runtime.py +34 -0
  128. numba_cuda/numba/cuda/cudaimpl.py +995 -0
  129. numba_cuda/numba/cuda/cudamath.py +149 -0
  130. numba_cuda/numba/cuda/datamodel/__init__.py +7 -0
  131. numba_cuda/numba/cuda/datamodel/cuda_manager.py +66 -0
  132. numba_cuda/numba/cuda/datamodel/cuda_models.py +1446 -0
  133. numba_cuda/numba/cuda/datamodel/cuda_packer.py +224 -0
  134. numba_cuda/numba/cuda/datamodel/cuda_registry.py +22 -0
  135. numba_cuda/numba/cuda/datamodel/cuda_testing.py +153 -0
  136. numba_cuda/numba/cuda/datamodel/manager.py +11 -0
  137. numba_cuda/numba/cuda/datamodel/models.py +9 -0
  138. numba_cuda/numba/cuda/datamodel/packer.py +9 -0
  139. numba_cuda/numba/cuda/datamodel/registry.py +11 -0
  140. numba_cuda/numba/cuda/datamodel/testing.py +11 -0
  141. numba_cuda/numba/cuda/debuginfo.py +903 -0
  142. numba_cuda/numba/cuda/decorators.py +294 -0
  143. numba_cuda/numba/cuda/descriptor.py +35 -0
  144. numba_cuda/numba/cuda/device_init.py +158 -0
  145. numba_cuda/numba/cuda/deviceufunc.py +1021 -0
  146. numba_cuda/numba/cuda/dispatcher.py +2463 -0
  147. numba_cuda/numba/cuda/errors.py +72 -0
  148. numba_cuda/numba/cuda/extending.py +697 -0
  149. numba_cuda/numba/cuda/flags.py +178 -0
  150. numba_cuda/numba/cuda/fp16.py +357 -0
  151. numba_cuda/numba/cuda/include/12/cuda_bf16.h +5118 -0
  152. numba_cuda/numba/cuda/include/12/cuda_bf16.hpp +3865 -0
  153. numba_cuda/numba/cuda/include/12/cuda_fp16.h +5363 -0
  154. numba_cuda/numba/cuda/include/12/cuda_fp16.hpp +3483 -0
  155. numba_cuda/numba/cuda/include/13/cuda_bf16.h +5118 -0
  156. numba_cuda/numba/cuda/include/13/cuda_bf16.hpp +3865 -0
  157. numba_cuda/numba/cuda/include/13/cuda_fp16.h +5363 -0
  158. numba_cuda/numba/cuda/include/13/cuda_fp16.hpp +3483 -0
  159. numba_cuda/numba/cuda/initialize.py +24 -0
  160. numba_cuda/numba/cuda/intrinsic_wrapper.py +41 -0
  161. numba_cuda/numba/cuda/intrinsics.py +382 -0
  162. numba_cuda/numba/cuda/itanium_mangler.py +214 -0
  163. numba_cuda/numba/cuda/kernels/__init__.py +2 -0
  164. numba_cuda/numba/cuda/kernels/reduction.py +265 -0
  165. numba_cuda/numba/cuda/kernels/transpose.py +65 -0
  166. numba_cuda/numba/cuda/libdevice.py +3386 -0
  167. numba_cuda/numba/cuda/libdevicedecl.py +20 -0
  168. numba_cuda/numba/cuda/libdevicefuncs.py +1060 -0
  169. numba_cuda/numba/cuda/libdeviceimpl.py +88 -0
  170. numba_cuda/numba/cuda/locks.py +19 -0
  171. numba_cuda/numba/cuda/lowering.py +1951 -0
  172. numba_cuda/numba/cuda/mathimpl.py +374 -0
  173. numba_cuda/numba/cuda/memory_management/__init__.py +4 -0
  174. numba_cuda/numba/cuda/memory_management/memsys.cu +99 -0
  175. numba_cuda/numba/cuda/memory_management/memsys.cuh +22 -0
  176. numba_cuda/numba/cuda/memory_management/nrt.cu +212 -0
  177. numba_cuda/numba/cuda/memory_management/nrt.cuh +48 -0
  178. numba_cuda/numba/cuda/memory_management/nrt.py +390 -0
  179. numba_cuda/numba/cuda/memory_management/nrt_context.py +438 -0
  180. numba_cuda/numba/cuda/misc/appdirs.py +594 -0
  181. numba_cuda/numba/cuda/misc/cffiimpl.py +24 -0
  182. numba_cuda/numba/cuda/misc/coverage_support.py +43 -0
  183. numba_cuda/numba/cuda/misc/dump_style.py +41 -0
  184. numba_cuda/numba/cuda/misc/findlib.py +75 -0
  185. numba_cuda/numba/cuda/misc/firstlinefinder.py +96 -0
  186. numba_cuda/numba/cuda/misc/gdb_hook.py +240 -0
  187. numba_cuda/numba/cuda/misc/literal.py +28 -0
  188. numba_cuda/numba/cuda/misc/llvm_pass_timings.py +412 -0
  189. numba_cuda/numba/cuda/misc/special.py +94 -0
  190. numba_cuda/numba/cuda/models.py +56 -0
  191. numba_cuda/numba/cuda/np/arraymath.py +5130 -0
  192. numba_cuda/numba/cuda/np/arrayobj.py +7635 -0
  193. numba_cuda/numba/cuda/np/extensions.py +11 -0
  194. numba_cuda/numba/cuda/np/linalg.py +3087 -0
  195. numba_cuda/numba/cuda/np/math/__init__.py +0 -0
  196. numba_cuda/numba/cuda/np/math/cmathimpl.py +558 -0
  197. numba_cuda/numba/cuda/np/math/mathimpl.py +487 -0
  198. numba_cuda/numba/cuda/np/math/numbers.py +1461 -0
  199. numba_cuda/numba/cuda/np/npdatetime.py +969 -0
  200. numba_cuda/numba/cuda/np/npdatetime_helpers.py +217 -0
  201. numba_cuda/numba/cuda/np/npyfuncs.py +1808 -0
  202. numba_cuda/numba/cuda/np/npyimpl.py +1027 -0
  203. numba_cuda/numba/cuda/np/numpy_support.py +798 -0
  204. numba_cuda/numba/cuda/np/polynomial/__init__.py +4 -0
  205. numba_cuda/numba/cuda/np/polynomial/polynomial_core.py +242 -0
  206. numba_cuda/numba/cuda/np/polynomial/polynomial_functions.py +380 -0
  207. numba_cuda/numba/cuda/np/ufunc/__init__.py +4 -0
  208. numba_cuda/numba/cuda/np/ufunc/decorators.py +203 -0
  209. numba_cuda/numba/cuda/np/ufunc/sigparse.py +68 -0
  210. numba_cuda/numba/cuda/np/ufunc/ufuncbuilder.py +65 -0
  211. numba_cuda/numba/cuda/np/ufunc_db.py +1282 -0
  212. numba_cuda/numba/cuda/np/unsafe/__init__.py +0 -0
  213. numba_cuda/numba/cuda/np/unsafe/ndarray.py +84 -0
  214. numba_cuda/numba/cuda/nvvmutils.py +254 -0
  215. numba_cuda/numba/cuda/printimpl.py +126 -0
  216. numba_cuda/numba/cuda/random.py +308 -0
  217. numba_cuda/numba/cuda/reshape_funcs.cu +156 -0
  218. numba_cuda/numba/cuda/serialize.py +267 -0
  219. numba_cuda/numba/cuda/simulator/__init__.py +63 -0
  220. numba_cuda/numba/cuda/simulator/_internal/__init__.py +4 -0
  221. numba_cuda/numba/cuda/simulator/_internal/cuda_bf16.py +2 -0
  222. numba_cuda/numba/cuda/simulator/api.py +179 -0
  223. numba_cuda/numba/cuda/simulator/bf16.py +4 -0
  224. numba_cuda/numba/cuda/simulator/compiler.py +38 -0
  225. numba_cuda/numba/cuda/simulator/cudadrv/__init__.py +11 -0
  226. numba_cuda/numba/cuda/simulator/cudadrv/devicearray.py +462 -0
  227. numba_cuda/numba/cuda/simulator/cudadrv/devices.py +122 -0
  228. numba_cuda/numba/cuda/simulator/cudadrv/driver.py +66 -0
  229. numba_cuda/numba/cuda/simulator/cudadrv/drvapi.py +7 -0
  230. numba_cuda/numba/cuda/simulator/cudadrv/dummyarray.py +7 -0
  231. numba_cuda/numba/cuda/simulator/cudadrv/error.py +10 -0
  232. numba_cuda/numba/cuda/simulator/cudadrv/libs.py +10 -0
  233. numba_cuda/numba/cuda/simulator/cudadrv/linkable_code.py +61 -0
  234. numba_cuda/numba/cuda/simulator/cudadrv/nvrtc.py +11 -0
  235. numba_cuda/numba/cuda/simulator/cudadrv/nvvm.py +32 -0
  236. numba_cuda/numba/cuda/simulator/cudadrv/runtime.py +22 -0
  237. numba_cuda/numba/cuda/simulator/dispatcher.py +11 -0
  238. numba_cuda/numba/cuda/simulator/kernel.py +320 -0
  239. numba_cuda/numba/cuda/simulator/kernelapi.py +509 -0
  240. numba_cuda/numba/cuda/simulator/memory_management/__init__.py +4 -0
  241. numba_cuda/numba/cuda/simulator/memory_management/nrt.py +21 -0
  242. numba_cuda/numba/cuda/simulator/reduction.py +19 -0
  243. numba_cuda/numba/cuda/simulator/tests/support.py +4 -0
  244. numba_cuda/numba/cuda/simulator/vector_types.py +65 -0
  245. numba_cuda/numba/cuda/simulator_init.py +18 -0
  246. numba_cuda/numba/cuda/stubs.py +635 -0
  247. numba_cuda/numba/cuda/target.py +505 -0
  248. numba_cuda/numba/cuda/testing.py +347 -0
  249. numba_cuda/numba/cuda/tests/__init__.py +62 -0
  250. numba_cuda/numba/cuda/tests/benchmarks/__init__.py +0 -0
  251. numba_cuda/numba/cuda/tests/benchmarks/test_kernel_launch.py +119 -0
  252. numba_cuda/numba/cuda/tests/cloudpickle_main_class.py +9 -0
  253. numba_cuda/numba/cuda/tests/core/serialize_usecases.py +113 -0
  254. numba_cuda/numba/cuda/tests/core/test_itanium_mangler.py +83 -0
  255. numba_cuda/numba/cuda/tests/core/test_serialize.py +371 -0
  256. numba_cuda/numba/cuda/tests/cudadrv/__init__.py +9 -0
  257. numba_cuda/numba/cuda/tests/cudadrv/test_array_attr.py +147 -0
  258. numba_cuda/numba/cuda/tests/cudadrv/test_context_stack.py +161 -0
  259. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_array_slicing.py +397 -0
  260. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_auto_context.py +24 -0
  261. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_devicerecord.py +180 -0
  262. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_driver.py +313 -0
  263. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_memory.py +187 -0
  264. numba_cuda/numba/cuda/tests/cudadrv/test_cuda_ndarray.py +621 -0
  265. numba_cuda/numba/cuda/tests/cudadrv/test_deallocations.py +247 -0
  266. numba_cuda/numba/cuda/tests/cudadrv/test_detect.py +100 -0
  267. numba_cuda/numba/cuda/tests/cudadrv/test_emm_plugins.py +198 -0
  268. numba_cuda/numba/cuda/tests/cudadrv/test_events.py +53 -0
  269. numba_cuda/numba/cuda/tests/cudadrv/test_host_alloc.py +72 -0
  270. numba_cuda/numba/cuda/tests/cudadrv/test_init.py +138 -0
  271. numba_cuda/numba/cuda/tests/cudadrv/test_inline_ptx.py +43 -0
  272. numba_cuda/numba/cuda/tests/cudadrv/test_is_fp16.py +15 -0
  273. numba_cuda/numba/cuda/tests/cudadrv/test_linkable_code.py +58 -0
  274. numba_cuda/numba/cuda/tests/cudadrv/test_linker.py +348 -0
  275. numba_cuda/numba/cuda/tests/cudadrv/test_managed_alloc.py +128 -0
  276. numba_cuda/numba/cuda/tests/cudadrv/test_module_callbacks.py +301 -0
  277. numba_cuda/numba/cuda/tests/cudadrv/test_nvjitlink.py +174 -0
  278. numba_cuda/numba/cuda/tests/cudadrv/test_nvrtc.py +28 -0
  279. numba_cuda/numba/cuda/tests/cudadrv/test_nvvm_driver.py +185 -0
  280. numba_cuda/numba/cuda/tests/cudadrv/test_pinned.py +39 -0
  281. numba_cuda/numba/cuda/tests/cudadrv/test_profiler.py +23 -0
  282. numba_cuda/numba/cuda/tests/cudadrv/test_reset_device.py +38 -0
  283. numba_cuda/numba/cuda/tests/cudadrv/test_runtime.py +48 -0
  284. numba_cuda/numba/cuda/tests/cudadrv/test_select_device.py +44 -0
  285. numba_cuda/numba/cuda/tests/cudadrv/test_streams.py +127 -0
  286. numba_cuda/numba/cuda/tests/cudapy/__init__.py +9 -0
  287. numba_cuda/numba/cuda/tests/cudapy/cache_usecases.py +231 -0
  288. numba_cuda/numba/cuda/tests/cudapy/cache_with_cpu_usecases.py +50 -0
  289. numba_cuda/numba/cuda/tests/cudapy/cg_cache_usecases.py +36 -0
  290. numba_cuda/numba/cuda/tests/cudapy/complex_usecases.py +116 -0
  291. numba_cuda/numba/cuda/tests/cudapy/enum_usecases.py +59 -0
  292. numba_cuda/numba/cuda/tests/cudapy/extensions_usecases.py +62 -0
  293. numba_cuda/numba/cuda/tests/cudapy/jitlink.ptx +28 -0
  294. numba_cuda/numba/cuda/tests/cudapy/overload_usecases.py +33 -0
  295. numba_cuda/numba/cuda/tests/cudapy/recursion_usecases.py +104 -0
  296. numba_cuda/numba/cuda/tests/cudapy/test_alignment.py +47 -0
  297. numba_cuda/numba/cuda/tests/cudapy/test_analysis.py +1122 -0
  298. numba_cuda/numba/cuda/tests/cudapy/test_array.py +344 -0
  299. numba_cuda/numba/cuda/tests/cudapy/test_array_alignment.py +268 -0
  300. numba_cuda/numba/cuda/tests/cudapy/test_array_args.py +203 -0
  301. numba_cuda/numba/cuda/tests/cudapy/test_array_methods.py +63 -0
  302. numba_cuda/numba/cuda/tests/cudapy/test_array_reductions.py +360 -0
  303. numba_cuda/numba/cuda/tests/cudapy/test_atomics.py +1815 -0
  304. numba_cuda/numba/cuda/tests/cudapy/test_bfloat16.py +599 -0
  305. numba_cuda/numba/cuda/tests/cudapy/test_bfloat16_bindings.py +377 -0
  306. numba_cuda/numba/cuda/tests/cudapy/test_blackscholes.py +160 -0
  307. numba_cuda/numba/cuda/tests/cudapy/test_boolean.py +27 -0
  308. numba_cuda/numba/cuda/tests/cudapy/test_byteflow.py +98 -0
  309. numba_cuda/numba/cuda/tests/cudapy/test_cache_hints.py +210 -0
  310. numba_cuda/numba/cuda/tests/cudapy/test_caching.py +683 -0
  311. numba_cuda/numba/cuda/tests/cudapy/test_casting.py +265 -0
  312. numba_cuda/numba/cuda/tests/cudapy/test_cffi.py +42 -0
  313. numba_cuda/numba/cuda/tests/cudapy/test_compiler.py +718 -0
  314. numba_cuda/numba/cuda/tests/cudapy/test_complex.py +370 -0
  315. numba_cuda/numba/cuda/tests/cudapy/test_complex_kernel.py +23 -0
  316. numba_cuda/numba/cuda/tests/cudapy/test_const_string.py +142 -0
  317. numba_cuda/numba/cuda/tests/cudapy/test_constmem.py +178 -0
  318. numba_cuda/numba/cuda/tests/cudapy/test_cooperative_groups.py +193 -0
  319. numba_cuda/numba/cuda/tests/cudapy/test_copy_propagate.py +131 -0
  320. numba_cuda/numba/cuda/tests/cudapy/test_cuda_array_interface.py +438 -0
  321. numba_cuda/numba/cuda/tests/cudapy/test_cuda_jit_no_types.py +94 -0
  322. numba_cuda/numba/cuda/tests/cudapy/test_datetime.py +101 -0
  323. numba_cuda/numba/cuda/tests/cudapy/test_debug.py +105 -0
  324. numba_cuda/numba/cuda/tests/cudapy/test_debuginfo.py +889 -0
  325. numba_cuda/numba/cuda/tests/cudapy/test_debuginfo_types.py +476 -0
  326. numba_cuda/numba/cuda/tests/cudapy/test_device_func.py +500 -0
  327. numba_cuda/numba/cuda/tests/cudapy/test_dispatcher.py +820 -0
  328. numba_cuda/numba/cuda/tests/cudapy/test_enums.py +152 -0
  329. numba_cuda/numba/cuda/tests/cudapy/test_errors.py +111 -0
  330. numba_cuda/numba/cuda/tests/cudapy/test_exception.py +170 -0
  331. numba_cuda/numba/cuda/tests/cudapy/test_extending.py +1088 -0
  332. numba_cuda/numba/cuda/tests/cudapy/test_extending_types.py +71 -0
  333. numba_cuda/numba/cuda/tests/cudapy/test_fastmath.py +265 -0
  334. numba_cuda/numba/cuda/tests/cudapy/test_flow_control.py +1433 -0
  335. numba_cuda/numba/cuda/tests/cudapy/test_forall.py +57 -0
  336. numba_cuda/numba/cuda/tests/cudapy/test_freevar.py +34 -0
  337. numba_cuda/numba/cuda/tests/cudapy/test_frexp_ldexp.py +69 -0
  338. numba_cuda/numba/cuda/tests/cudapy/test_globals.py +62 -0
  339. numba_cuda/numba/cuda/tests/cudapy/test_gufunc.py +474 -0
  340. numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scalar.py +167 -0
  341. numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scheduling.py +92 -0
  342. numba_cuda/numba/cuda/tests/cudapy/test_idiv.py +39 -0
  343. numba_cuda/numba/cuda/tests/cudapy/test_inline.py +170 -0
  344. numba_cuda/numba/cuda/tests/cudapy/test_inspect.py +255 -0
  345. numba_cuda/numba/cuda/tests/cudapy/test_intrinsics.py +1219 -0
  346. numba_cuda/numba/cuda/tests/cudapy/test_ipc.py +263 -0
  347. numba_cuda/numba/cuda/tests/cudapy/test_ir.py +598 -0
  348. numba_cuda/numba/cuda/tests/cudapy/test_ir_utils.py +276 -0
  349. numba_cuda/numba/cuda/tests/cudapy/test_iterators.py +101 -0
  350. numba_cuda/numba/cuda/tests/cudapy/test_lang.py +68 -0
  351. numba_cuda/numba/cuda/tests/cudapy/test_laplace.py +123 -0
  352. numba_cuda/numba/cuda/tests/cudapy/test_libdevice.py +194 -0
  353. numba_cuda/numba/cuda/tests/cudapy/test_lineinfo.py +220 -0
  354. numba_cuda/numba/cuda/tests/cudapy/test_localmem.py +173 -0
  355. numba_cuda/numba/cuda/tests/cudapy/test_make_function_to_jit_function.py +364 -0
  356. numba_cuda/numba/cuda/tests/cudapy/test_mandel.py +47 -0
  357. numba_cuda/numba/cuda/tests/cudapy/test_math.py +842 -0
  358. numba_cuda/numba/cuda/tests/cudapy/test_matmul.py +76 -0
  359. numba_cuda/numba/cuda/tests/cudapy/test_minmax.py +78 -0
  360. numba_cuda/numba/cuda/tests/cudapy/test_montecarlo.py +25 -0
  361. numba_cuda/numba/cuda/tests/cudapy/test_multigpu.py +145 -0
  362. numba_cuda/numba/cuda/tests/cudapy/test_multiprocessing.py +39 -0
  363. numba_cuda/numba/cuda/tests/cudapy/test_multithreads.py +82 -0
  364. numba_cuda/numba/cuda/tests/cudapy/test_nondet.py +53 -0
  365. numba_cuda/numba/cuda/tests/cudapy/test_operator.py +504 -0
  366. numba_cuda/numba/cuda/tests/cudapy/test_optimization.py +93 -0
  367. numba_cuda/numba/cuda/tests/cudapy/test_overload.py +402 -0
  368. numba_cuda/numba/cuda/tests/cudapy/test_powi.py +128 -0
  369. numba_cuda/numba/cuda/tests/cudapy/test_print.py +193 -0
  370. numba_cuda/numba/cuda/tests/cudapy/test_py2_div_issue.py +37 -0
  371. numba_cuda/numba/cuda/tests/cudapy/test_random.py +117 -0
  372. numba_cuda/numba/cuda/tests/cudapy/test_record_dtype.py +614 -0
  373. numba_cuda/numba/cuda/tests/cudapy/test_recursion.py +130 -0
  374. numba_cuda/numba/cuda/tests/cudapy/test_reduction.py +94 -0
  375. numba_cuda/numba/cuda/tests/cudapy/test_retrieve_autoconverted_arrays.py +83 -0
  376. numba_cuda/numba/cuda/tests/cudapy/test_serialize.py +86 -0
  377. numba_cuda/numba/cuda/tests/cudapy/test_slicing.py +40 -0
  378. numba_cuda/numba/cuda/tests/cudapy/test_sm.py +457 -0
  379. numba_cuda/numba/cuda/tests/cudapy/test_sm_creation.py +233 -0
  380. numba_cuda/numba/cuda/tests/cudapy/test_ssa.py +454 -0
  381. numba_cuda/numba/cuda/tests/cudapy/test_stream_api.py +56 -0
  382. numba_cuda/numba/cuda/tests/cudapy/test_sync.py +277 -0
  383. numba_cuda/numba/cuda/tests/cudapy/test_tracing.py +200 -0
  384. numba_cuda/numba/cuda/tests/cudapy/test_transpose.py +90 -0
  385. numba_cuda/numba/cuda/tests/cudapy/test_typeconv.py +333 -0
  386. numba_cuda/numba/cuda/tests/cudapy/test_typeinfer.py +538 -0
  387. numba_cuda/numba/cuda/tests/cudapy/test_ufuncs.py +585 -0
  388. numba_cuda/numba/cuda/tests/cudapy/test_userexc.py +42 -0
  389. numba_cuda/numba/cuda/tests/cudapy/test_vector_type.py +485 -0
  390. numba_cuda/numba/cuda/tests/cudapy/test_vectorize.py +312 -0
  391. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_complex.py +23 -0
  392. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_decor.py +183 -0
  393. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_device.py +40 -0
  394. numba_cuda/numba/cuda/tests/cudapy/test_vectorize_scalar_arg.py +40 -0
  395. numba_cuda/numba/cuda/tests/cudapy/test_warning.py +206 -0
  396. numba_cuda/numba/cuda/tests/cudapy/test_warp_ops.py +331 -0
  397. numba_cuda/numba/cuda/tests/cudasim/__init__.py +9 -0
  398. numba_cuda/numba/cuda/tests/cudasim/support.py +9 -0
  399. numba_cuda/numba/cuda/tests/cudasim/test_cudasim_issues.py +111 -0
  400. numba_cuda/numba/cuda/tests/data/__init__.py +2 -0
  401. numba_cuda/numba/cuda/tests/data/cta_barrier.cu +28 -0
  402. numba_cuda/numba/cuda/tests/data/cuda_include.cu +10 -0
  403. numba_cuda/numba/cuda/tests/data/error.cu +12 -0
  404. numba_cuda/numba/cuda/tests/data/include/add.cuh +8 -0
  405. numba_cuda/numba/cuda/tests/data/jitlink.cu +28 -0
  406. numba_cuda/numba/cuda/tests/data/jitlink.ptx +49 -0
  407. numba_cuda/numba/cuda/tests/data/warn.cu +12 -0
  408. numba_cuda/numba/cuda/tests/doc_examples/__init__.py +9 -0
  409. numba_cuda/numba/cuda/tests/doc_examples/ffi/__init__.py +2 -0
  410. numba_cuda/numba/cuda/tests/doc_examples/ffi/functions.cu +54 -0
  411. numba_cuda/numba/cuda/tests/doc_examples/ffi/include/mul.cuh +8 -0
  412. numba_cuda/numba/cuda/tests/doc_examples/ffi/saxpy.cu +14 -0
  413. numba_cuda/numba/cuda/tests/doc_examples/test_cg.py +86 -0
  414. numba_cuda/numba/cuda/tests/doc_examples/test_cpointer.py +68 -0
  415. numba_cuda/numba/cuda/tests/doc_examples/test_cpu_gpu_compat.py +81 -0
  416. numba_cuda/numba/cuda/tests/doc_examples/test_ffi.py +141 -0
  417. numba_cuda/numba/cuda/tests/doc_examples/test_laplace.py +160 -0
  418. numba_cuda/numba/cuda/tests/doc_examples/test_matmul.py +180 -0
  419. numba_cuda/numba/cuda/tests/doc_examples/test_montecarlo.py +119 -0
  420. numba_cuda/numba/cuda/tests/doc_examples/test_random.py +66 -0
  421. numba_cuda/numba/cuda/tests/doc_examples/test_reduction.py +80 -0
  422. numba_cuda/numba/cuda/tests/doc_examples/test_sessionize.py +206 -0
  423. numba_cuda/numba/cuda/tests/doc_examples/test_ufunc.py +53 -0
  424. numba_cuda/numba/cuda/tests/doc_examples/test_vecadd.py +76 -0
  425. numba_cuda/numba/cuda/tests/nocuda/__init__.py +9 -0
  426. numba_cuda/numba/cuda/tests/nocuda/test_dummyarray.py +391 -0
  427. numba_cuda/numba/cuda/tests/nocuda/test_function_resolution.py +48 -0
  428. numba_cuda/numba/cuda/tests/nocuda/test_import.py +63 -0
  429. numba_cuda/numba/cuda/tests/nocuda/test_library_lookup.py +252 -0
  430. numba_cuda/numba/cuda/tests/nocuda/test_nvvm.py +59 -0
  431. numba_cuda/numba/cuda/tests/nrt/__init__.py +9 -0
  432. numba_cuda/numba/cuda/tests/nrt/test_nrt.py +387 -0
  433. numba_cuda/numba/cuda/tests/nrt/test_nrt_refct.py +124 -0
  434. numba_cuda/numba/cuda/tests/support.py +900 -0
  435. numba_cuda/numba/cuda/typeconv/__init__.py +4 -0
  436. numba_cuda/numba/cuda/typeconv/castgraph.py +137 -0
  437. numba_cuda/numba/cuda/typeconv/rules.py +63 -0
  438. numba_cuda/numba/cuda/typeconv/typeconv.py +121 -0
  439. numba_cuda/numba/cuda/types/__init__.py +233 -0
  440. numba_cuda/numba/cuda/types/__init__.pyi +167 -0
  441. numba_cuda/numba/cuda/types/abstract.py +9 -0
  442. numba_cuda/numba/cuda/types/common.py +9 -0
  443. numba_cuda/numba/cuda/types/containers.py +9 -0
  444. numba_cuda/numba/cuda/types/cuda_abstract.py +533 -0
  445. numba_cuda/numba/cuda/types/cuda_common.py +110 -0
  446. numba_cuda/numba/cuda/types/cuda_containers.py +971 -0
  447. numba_cuda/numba/cuda/types/cuda_function_type.py +230 -0
  448. numba_cuda/numba/cuda/types/cuda_functions.py +798 -0
  449. numba_cuda/numba/cuda/types/cuda_iterators.py +120 -0
  450. numba_cuda/numba/cuda/types/cuda_misc.py +569 -0
  451. numba_cuda/numba/cuda/types/cuda_npytypes.py +690 -0
  452. numba_cuda/numba/cuda/types/cuda_scalars.py +280 -0
  453. numba_cuda/numba/cuda/types/ext_types.py +101 -0
  454. numba_cuda/numba/cuda/types/function_type.py +11 -0
  455. numba_cuda/numba/cuda/types/functions.py +9 -0
  456. numba_cuda/numba/cuda/types/iterators.py +9 -0
  457. numba_cuda/numba/cuda/types/misc.py +9 -0
  458. numba_cuda/numba/cuda/types/npytypes.py +9 -0
  459. numba_cuda/numba/cuda/types/scalars.py +9 -0
  460. numba_cuda/numba/cuda/typing/__init__.py +19 -0
  461. numba_cuda/numba/cuda/typing/arraydecl.py +939 -0
  462. numba_cuda/numba/cuda/typing/asnumbatype.py +130 -0
  463. numba_cuda/numba/cuda/typing/bufproto.py +70 -0
  464. numba_cuda/numba/cuda/typing/builtins.py +1209 -0
  465. numba_cuda/numba/cuda/typing/cffi_utils.py +219 -0
  466. numba_cuda/numba/cuda/typing/cmathdecl.py +47 -0
  467. numba_cuda/numba/cuda/typing/collections.py +138 -0
  468. numba_cuda/numba/cuda/typing/context.py +782 -0
  469. numba_cuda/numba/cuda/typing/ctypes_utils.py +125 -0
  470. numba_cuda/numba/cuda/typing/dictdecl.py +63 -0
  471. numba_cuda/numba/cuda/typing/enumdecl.py +74 -0
  472. numba_cuda/numba/cuda/typing/listdecl.py +147 -0
  473. numba_cuda/numba/cuda/typing/mathdecl.py +158 -0
  474. numba_cuda/numba/cuda/typing/npdatetime.py +322 -0
  475. numba_cuda/numba/cuda/typing/npydecl.py +749 -0
  476. numba_cuda/numba/cuda/typing/setdecl.py +115 -0
  477. numba_cuda/numba/cuda/typing/templates.py +1446 -0
  478. numba_cuda/numba/cuda/typing/typeof.py +301 -0
  479. numba_cuda/numba/cuda/ufuncs.py +746 -0
  480. numba_cuda/numba/cuda/utils.py +724 -0
  481. numba_cuda/numba/cuda/vector_types.py +214 -0
  482. numba_cuda/numba/cuda/vectorizers.py +260 -0
  483. numba_cuda-0.21.1.dist-info/METADATA +109 -0
  484. numba_cuda-0.21.1.dist-info/RECORD +488 -0
  485. numba_cuda-0.21.1.dist-info/WHEEL +5 -0
  486. numba_cuda-0.21.1.dist-info/licenses/LICENSE +26 -0
  487. numba_cuda-0.21.1.dist-info/licenses/LICENSE.numba +24 -0
  488. numba_cuda-0.21.1.dist-info/top_level.txt +1 -0
@@ -0,0 +1,598 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: BSD-2-Clause
3
+
4
+ import unittest
5
+ from numba.cuda.testing import CUDATestCase, skip_on_cudasim
6
+ import warnings
7
+ import numpy as np
8
+
9
+ from numba.cuda import HAS_NUMBA
10
+
11
+ if HAS_NUMBA:
12
+ from numba import objmode
13
+ from numba import njit
14
+ from numba.cuda.core import ir
15
+ from numba.cuda import compiler
16
+ from numba.cuda.core import errors
17
+ from numba.cuda.core.compiler import (
18
+ CompilerBase,
19
+ )
20
+ from numba.cuda.core.compiler_machinery import (
21
+ FunctionPass,
22
+ PassManager,
23
+ register_pass,
24
+ )
25
+ from numba.cuda.core.untyped_passes import (
26
+ TranslateByteCode,
27
+ IRProcessing,
28
+ ReconstructSSA,
29
+ )
30
+ from numba.cuda.testing import skip_on_standalone_numba_cuda
31
+
32
+
33
def requires_fully_vendored_ir(fn):
    """Mark ``fn`` as unconditionally skipped.

    The wrapped test is skipped with a fixed reason string stating that it
    cannot run until the dependency on the un-vendored IR module is removed.
    """
    reason = (
        "Cannot run until the dependency on the un-vendored IR module is removed"
    )
    skip_decorator = unittest.skip(reason)
    return skip_decorator(fn)
37
+
38
+
39
class TestIR(CUDATestCase):
    """Checks variable definition and lookup across nested ``ir.Scope`` objects."""

    def test_IRScope(self):
        """Define variables in a parent and a child scope, then verify lookup,
        shadowing and the error raised on redefinition."""
        filename = "<?>"
        top = ir.Scope(parent=None, loc=ir.Loc(filename=filename, line=1))
        local = ir.Scope(parent=top, loc=ir.Loc(filename=filename, line=2))

        # A variable defined in the child scope is found there and counted
        # in the child's local variables.
        apple = local.define("apple", loc=ir.Loc(filename=filename, line=3))
        self.assertIs(local.get("apple"), apple)
        self.assertEqual(len(local.localvars), 1)

        # A variable defined in the parent is visible from the child but is
        # not added to the child's local variables.
        orange = top.define("orange", loc=ir.Loc(filename=filename, line=4))
        self.assertEqual(len(local.localvars), 1)
        self.assertEqual(len(top.localvars), 1)
        self.assertIs(top.get("orange"), orange)
        self.assertIs(local.get("orange"), orange)

        # Defining the same name in the child shadows the parent's variable
        # when looked up from the child; the parent still sees its own.
        more_orange = local.define(
            "orange", loc=ir.Loc(filename=filename, line=5)
        )
        self.assertIs(top.get("orange"), orange)
        # Compare against the parent's variable itself. The previous
        # ``not orange`` compared against a bool and could never fail.
        self.assertIsNot(local.get("orange"), orange)
        self.assertIs(local.get("orange"), more_orange)

        # Defining the same name twice in one scope must be rejected.
        with self.assertRaises(ir.RedefinedError):
            local.define("orange", loc=ir.Loc(filename=filename, line=5))
68
+
69
+
70
class CheckEquality(CUDATestCase):
    """Shared fixtures and a helper for the IR equality tests.

    The class attributes are reusable ``ir.Var`` and ``ir.Loc`` instances
    that the subclasses use to build IR nodes.
    """

    var_a = ir.Var(None, "a", ir.unknown_loc)
    var_b = ir.Var(None, "b", ir.unknown_loc)
    var_c = ir.Var(None, "c", ir.unknown_loc)
    var_d = ir.Var(None, "d", ir.unknown_loc)
    var_e = ir.Var(None, "e", ir.unknown_loc)
    loc1 = ir.Loc("mock", 1, 0)
    loc2 = ir.Loc("mock", 2, 0)
    loc3 = ir.Loc("mock", 3, 0)

    def check(self, base, same=(), different=()):
        """Assert how ``base`` compares against two groups of objects.

        Parameters
        ----------
        base
            The reference object.
        same
            Iterable of objects that must satisfy ``base == obj``.
        different
            Iterable of objects that must satisfy ``base != obj``.

        The defaults are immutable empty tuples so that no mutable default
        object is shared between calls.
        """
        # ``==`` and ``!=`` are spelled out so that both comparison operators
        # of the object under test are exercised directly.
        for s in same:
            self.assertTrue(base == s)
        for d in different:
            self.assertTrue(base != d)
85
+
86
+
87
class TestIRMeta(CheckEquality):
    """
    Equality tests for IR node metadata: ``ir.Loc`` and ``ir.Scope``.
    """

    def test_loc(self):
        """Locations are expected to compare by file name, line and column."""
        reference = ir.Loc("file", 1, 0)
        identical = ir.Loc("file", 1, 0)
        other_file = ir.Loc("pile", 1, 0)
        other_line = ir.Loc("file", 2, 0)
        other_col = ir.Loc("file", 1, 1)
        self.check(
            reference,
            same=[identical],
            different=[other_file, other_line, other_col],
        )

        # The maybe_decorator flag is expected not to affect equality.
        plain = ir.Loc("file", 1, 0, maybe_decorator=False)
        decorated = ir.Loc("file", 1, 0, maybe_decorator=True)
        self.check(reference, same=[plain, decorated])

    def test_scope(self):
        """Scopes are expected to compare equal regardless of their location."""
        root_a = ir.Scope(None, self.loc1)
        root_b = ir.Scope(None, self.loc1)
        root_other_loc = ir.Scope(None, self.loc2)
        self.check(root_a, same=[root_b, root_other_loc])

        child = ir.Scope(root_a, self.loc1)
        child_twin = ir.Scope(root_a, self.loc1)
        child_other_loc = ir.Scope(root_a, self.loc2)
        child_other_parent = ir.Scope(root_other_loc, self.loc1)
        self.check(
            child, same=[child_twin, child_other_loc, child_other_parent]
        )

        # root_a and root_b are equal, so a child hanging off either of them
        # should be equal as well.
        child_of_root_b = ir.Scope(root_b, self.loc1)
        self.check(child, same=[child_of_root_b])
137
+
138
+
139
class TestIRNodes(CheckEquality):
    """
    Equality tests for individual IR node types.

    Each test builds a reference node, a list of nodes expected to compare
    equal to it and (where applicable) a list expected to compare different,
    then hands all three to ``check``. Where a node takes a location, the
    variant built with ``loc2`` is expected to be equal to the reference
    built with ``loc1``.
    """

    def test_terminator(self):
        # Instances of the terminator base class should always be equal.
        base = ir.Terminator()
        same = [ir.Terminator()]
        self.check(base, same=same)

    def test_jump(self):
        base = ir.Jump(1, self.loc1)
        same = [ir.Jump(1, self.loc1), ir.Jump(1, self.loc2)]
        different = [ir.Jump(2, self.loc1)]
        self.check(base, same=same, different=different)

    def test_return(self):
        base = ir.Return(self.var_a, self.loc1)
        same = [
            ir.Return(self.var_a, self.loc1),
            ir.Return(self.var_a, self.loc2),
        ]
        different = [ir.Return(self.var_b, self.loc1)]
        self.check(base, same=same, different=different)

    def test_raise(self):
        base = ir.Raise(self.var_a, self.loc1)
        same = [
            ir.Raise(self.var_a, self.loc1),
            ir.Raise(self.var_a, self.loc2),
        ]
        different = [ir.Raise(self.var_b, self.loc1)]
        self.check(base, same=same, different=different)

    def test_staticraise(self):
        base = ir.StaticRaise(AssertionError, None, self.loc1)
        same = [
            ir.StaticRaise(AssertionError, None, self.loc1),
            ir.StaticRaise(AssertionError, None, self.loc2),
        ]
        different = [
            ir.StaticRaise(RuntimeError, None, self.loc1),
            ir.StaticRaise(AssertionError, ("str",), self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_branch(self):
        base = ir.Branch(self.var_a, 1, 2, self.loc1)
        same = [
            ir.Branch(self.var_a, 1, 2, self.loc1),
            ir.Branch(self.var_a, 1, 2, self.loc2),
        ]
        different = [
            ir.Branch(self.var_b, 1, 2, self.loc1),
            ir.Branch(self.var_a, 2, 2, self.loc1),
            ir.Branch(self.var_a, 1, 3, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_expr(self):
        base = ir.Expr("some_op", self.loc1)
        same = [ir.Expr("some_op", self.loc1), ir.Expr("some_op", self.loc2)]
        different = [ir.Expr("some_other_op", self.loc1)]
        self.check(base, same=same, different=different)

    def test_setitem(self):
        base = ir.SetItem(self.var_a, self.var_b, self.var_c, self.loc1)
        same = [
            ir.SetItem(self.var_a, self.var_b, self.var_c, self.loc1),
            ir.SetItem(self.var_a, self.var_b, self.var_c, self.loc2),
        ]
        different = [
            ir.SetItem(self.var_d, self.var_b, self.var_c, self.loc1),
            ir.SetItem(self.var_a, self.var_d, self.var_c, self.loc1),
            ir.SetItem(self.var_a, self.var_b, self.var_d, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_staticsetitem(self):
        base = ir.StaticSetItem(
            self.var_a, 1, self.var_b, self.var_c, self.loc1
        )
        same = [
            ir.StaticSetItem(self.var_a, 1, self.var_b, self.var_c, self.loc1),
            ir.StaticSetItem(self.var_a, 1, self.var_b, self.var_c, self.loc2),
        ]
        different = [
            ir.StaticSetItem(self.var_d, 1, self.var_b, self.var_c, self.loc1),
            ir.StaticSetItem(self.var_a, 2, self.var_b, self.var_c, self.loc1),
            ir.StaticSetItem(self.var_a, 1, self.var_d, self.var_c, self.loc1),
            ir.StaticSetItem(self.var_a, 1, self.var_b, self.var_d, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_delitem(self):
        base = ir.DelItem(self.var_a, self.var_b, self.loc1)
        same = [
            ir.DelItem(self.var_a, self.var_b, self.loc1),
            ir.DelItem(self.var_a, self.var_b, self.loc2),
        ]
        different = [
            ir.DelItem(self.var_c, self.var_b, self.loc1),
            ir.DelItem(self.var_a, self.var_c, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_del(self):
        base = ir.Del(self.var_a.name, self.loc1)
        same = [
            ir.Del(self.var_a.name, self.loc1),
            ir.Del(self.var_a.name, self.loc2),
        ]
        different = [ir.Del(self.var_b.name, self.loc1)]
        self.check(base, same=same, different=different)

    def test_setattr(self):
        base = ir.SetAttr(self.var_a, "foo", self.var_b, self.loc1)
        same = [
            ir.SetAttr(self.var_a, "foo", self.var_b, self.loc1),
            ir.SetAttr(self.var_a, "foo", self.var_b, self.loc2),
        ]
        different = [
            ir.SetAttr(self.var_c, "foo", self.var_b, self.loc1),
            ir.SetAttr(self.var_a, "bar", self.var_b, self.loc1),
            ir.SetAttr(self.var_a, "foo", self.var_c, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_delattr(self):
        base = ir.DelAttr(self.var_a, "foo", self.loc1)
        same = [
            ir.DelAttr(self.var_a, "foo", self.loc1),
            ir.DelAttr(self.var_a, "foo", self.loc2),
        ]
        different = [
            ir.DelAttr(self.var_c, "foo", self.loc1),
            ir.DelAttr(self.var_a, "bar", self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_assign(self):
        base = ir.Assign(self.var_a, self.var_b, self.loc1)
        same = [
            ir.Assign(self.var_a, self.var_b, self.loc1),
            ir.Assign(self.var_a, self.var_b, self.loc2),
        ]
        different = [
            ir.Assign(self.var_c, self.var_b, self.loc1),
            ir.Assign(self.var_a, self.var_c, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_print(self):
        base = ir.Print((self.var_a,), self.var_b, self.loc1)
        same = [
            ir.Print((self.var_a,), self.var_b, self.loc1),
            ir.Print((self.var_a,), self.var_b, self.loc2),
        ]
        different = [
            ir.Print((self.var_c,), self.var_b, self.loc1),
            ir.Print((self.var_a,), self.var_c, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_storemap(self):
        base = ir.StoreMap(self.var_a, self.var_b, self.var_c, self.loc1)
        same = [
            ir.StoreMap(self.var_a, self.var_b, self.var_c, self.loc1),
            ir.StoreMap(self.var_a, self.var_b, self.var_c, self.loc2),
        ]
        different = [
            ir.StoreMap(self.var_d, self.var_b, self.var_c, self.loc1),
            ir.StoreMap(self.var_a, self.var_d, self.var_c, self.loc1),
            ir.StoreMap(self.var_a, self.var_b, self.var_d, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_yield(self):
        base = ir.Yield(self.var_a, self.loc1, 0)
        same = [
            ir.Yield(self.var_a, self.loc1, 0),
            ir.Yield(self.var_a, self.loc2, 0),
        ]
        different = [
            ir.Yield(self.var_b, self.loc1, 0),
            ir.Yield(self.var_a, self.loc1, 1),
        ]
        self.check(base, same=same, different=different)

    def test_enterwith(self):
        base = ir.EnterWith(self.var_a, 0, 1, self.loc1)
        same = [
            ir.EnterWith(self.var_a, 0, 1, self.loc1),
            ir.EnterWith(self.var_a, 0, 1, self.loc2),
        ]
        different = [
            ir.EnterWith(self.var_b, 0, 1, self.loc1),
            ir.EnterWith(self.var_a, 1, 1, self.loc1),
            ir.EnterWith(self.var_a, 0, 2, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_arg(self):
        base = ir.Arg("foo", 0, self.loc1)
        same = [ir.Arg("foo", 0, self.loc1), ir.Arg("foo", 0, self.loc2)]
        different = [ir.Arg("bar", 0, self.loc1), ir.Arg("foo", 1, self.loc1)]
        self.check(base, same=same, different=different)

    def test_const(self):
        base = ir.Const(1, self.loc1)
        same = [ir.Const(1, self.loc1), ir.Const(1, self.loc2)]
        different = [ir.Const(2, self.loc1)]
        self.check(base, same=same, different=different)

    def test_global(self):
        base = ir.Global("foo", 0, self.loc1)
        same = [
            ir.Global("foo", 0, self.loc1),
            ir.Global("foo", 0, self.loc2),
        ]
        different = [
            ir.Global("bar", 0, self.loc1),
            ir.Global("foo", 1, self.loc1),
        ]
        self.check(base, same=same, different=different)

    def test_var(self):
        base = ir.Var(None, "foo", self.loc1)
        same = [
            ir.Var(None, "foo", self.loc1),
            ir.Var(None, "foo", self.loc2),
            # A variable attached to a scope is still expected to be equal.
            ir.Var(ir.Scope(None, ir.unknown_loc), "foo", self.loc1),
        ]
        different = [ir.Var(None, "bar", self.loc1)]
        self.check(base, same=same, different=different)

    def test_undefinedtype(self):
        base = ir.UndefinedType()
        same = [ir.UndefinedType()]
        self.check(base, same=same)

    def test_loop(self):
        base = ir.Loop(1, 3)
        same = [ir.Loop(1, 3)]
        different = [ir.Loop(2, 3), ir.Loop(1, 4)]
        self.check(base, same=same, different=different)

    def test_with(self):
        base = ir.With(1, 3)
        same = [ir.With(1, 3)]
        different = [ir.With(2, 3), ir.With(1, 4)]
        self.check(base, same=same, different=different)
337
+
338
+
339
+ # Module-level global read by the generated function `foo` in
+ # TestIRCompounds.test_functionir
340
+ _GLOBAL = 1234
341
+
342
+
343
class TestIRCompounds(CheckEquality):
    """
    Tests IR concepts that have state
    """

    def test_varmap(self):
        """VarMaps with the same definitions are equal; a differing entry
        makes them different."""
        a = ir.VarMap()
        a.define(self.var_a, "foo")
        a.define(self.var_b, "bar")

        b = ir.VarMap()
        b.define(self.var_a, "foo")
        b.define(self.var_b, "bar")

        c = ir.VarMap()
        c.define(self.var_a, "foo")
        c.define(self.var_c, "bar")

        self.check(a, same=[b], different=[c])

    def test_block(self):
        """Blocks with the same statements are equal; an extra statement
        makes them different."""

        def gen_block():
            parent = ir.Scope(None, self.loc1)
            tmp = ir.Block(parent, self.loc2)
            assign1 = ir.Assign(self.var_a, self.var_b, self.loc3)
            assign2 = ir.Assign(self.var_a, self.var_c, self.loc3)
            assign3 = ir.Assign(self.var_c, self.var_b, self.loc3)
            tmp.append(assign1)
            tmp.append(assign2)
            tmp.append(assign3)
            return tmp

        a = gen_block()
        b = gen_block()
        # Keep a reference to the block itself and append separately.
        # Binding the return value of ``append`` would compare ``a`` against
        # that return value instead of against a block with four statements.
        c = gen_block()
        c.append(ir.Assign(self.var_a, self.var_b, self.loc3))

        self.check(a, same=[b], different=[c])

    @skip_on_cudasim("doesn't work in the simulator")
    def test_functionir(self):
        """Compare function IR produced by the frontend, before and after
        small mutations, via ``equal_ir`` and ``diff_str``."""

        def run_frontend(x):
            return compiler.run_frontend(x, emit_dels=True)

        # This creates a function full of all sorts of things to ensure the
        # IR is pretty involved. Two separately generated instances are
        # compiled and their IR is checked to be equal even though the
        # objects differ. Then a tiny mutation is made to the IR of the
        # second function and detection of that change is checked.
        def gen():
            _FREEVAR = 0xCAFE

            def foo(a, b, c=12, d=1j, e=None):
                f = a + b
                a += _FREEVAR
                g = np.zeros(c, dtype=np.complex64)
                h = f + g
                i = 1j / d
                if np.abs(i) > 0:
                    k = h / i
                    l = np.arange(1, c + 1)
                    if HAS_NUMBA:
                        with objmode():
                            print(e, k)
                    m = np.sqrt(l - g)
                    if np.abs(m[0]) < 1:
                        n = 0
                        for o in range(a):
                            n += 0
                            if np.abs(n) < 3:
                                break
                        n += m[2]
                    p = g / l
                    q = []
                    for r in range(len(p)):
                        q.append(p[r])
                        if r > 4 + 1:
                            if HAS_NUMBA:
                                with objmode(s="intp", t="complex128"):
                                    s = 123
                                    t = 5
                            if s > 122:
                                t += s
                        t += q[0] + _GLOBAL

                return f + o + r + t + r + a + n

            return foo

        x = gen()
        y = gen()
        x_ir = run_frontend(x)
        y_ir = run_frontend(y)

        self.assertTrue(x_ir.equal_ir(y_ir))

        def check_diffstr(string, pointing_at=()):
            """Require every item in ``pointing_at`` to appear on at least
            one line of ``string`` that starts with ``->``."""
            lines = string.splitlines()
            for item in pointing_at:
                found = any(
                    line.startswith("->") and item in line for line in lines
                )
                if not found:
                    raise AssertionError("Could not find %s " % item)

        self.assertIn("IR is considered equivalent", x_ir.diff_str(y_ir))

        # minor mutation, simply switch branch targets on last branch
        for label in reversed(list(y_ir.blocks.keys())):
            blk = y_ir.blocks[label]
            if isinstance(blk.body[-1], ir.Branch):
                ref = blk.body[-1]
                ref.truebr, ref.falsebr = ref.falsebr, ref.truebr
                break

        check_diffstr(x_ir.diff_str(y_ir), ["branch"])

        z = gen()
        self.assertFalse(x_ir.equal_ir(y_ir))

        z_ir = run_frontend(z)

        # Second mutation: swap the first pair of adjacent Del statements
        # found when walking the blocks in reverse label order. The string
        # forms of the two swapped statements are recorded so the diff
        # output can be checked for them.
        change_set = set()
        for label in reversed(list(z_ir.blocks.keys())):
            blk = z_ir.blocks[label]
            # The final statement of the block is excluded from the search.
            ref = blk.body[:-1]
            idx = None
            for i in range(len(ref) - 1):
                # look for two adjacent Del
                if isinstance(ref[i], ir.Del) and isinstance(
                    ref[i + 1], ir.Del
                ):
                    idx = i
                    break
            if idx is not None:
                b = blk.body
                change_set.add(str(b[idx + 1]))
                change_set.add(str(b[idx]))
                b[idx], b[idx + 1] = b[idx + 1], b[idx]
                break

        # ensure that a mutation occurred.
        self.assertTrue(change_set)

        self.assertFalse(x_ir.equal_ir(z_ir))
        self.assertEqual(len(change_set), 2)
        for item in change_set:
            self.assertTrue(item.startswith("del "))
        check_diffstr(x_ir.diff_str(z_ir), change_set)

        def foo(a, b):
            c = a * 2
            d = c + b
            e = np.sqrt(d)
            return e

        def bar(a, b):  # same as foo
            c = a * 2
            d = c + b
            e = np.sqrt(d)
            return e

        def baz(a, b):
            c = a * 2
            d = b + c
            e = np.sqrt(d + 1)
            return e

        foo_ir = run_frontend(foo)
        bar_ir = run_frontend(bar)
        self.assertTrue(foo_ir.equal_ir(bar_ir))
        self.assertIn("IR is considered equivalent", foo_ir.diff_str(bar_ir))

        baz_ir = run_frontend(baz)
        self.assertFalse(foo_ir.equal_ir(baz_ir))
        tmp = foo_ir.diff_str(baz_ir)
        self.assertIn("Other block contains more statements", tmp)
        check_diffstr(tmp, ["c + b", "b + c"])
521
+
522
+
523
class TestIRPedanticChecks(CUDATestCase):
    """Checks that a missing variable-in-scope assumption is reported when
    pedantic warnings are promoted to errors."""

    @skip_on_standalone_numba_cuda
    def test_var_in_scope_assumption(self):
        # Pass that replaces the ir.Scope of every ir.Block with an empty one.
        @register_pass(mutates_CFG=False, analysis_only=False)
        class RemoveVarInScope(FunctionPass):
            _name = "_remove_var_in_scope"

            def __init__(self):
                FunctionPass.__init__(self)

            # "state" is the internal compiler state handed over by the
            # CompilerBase instance.
            def run_pass(self, state):
                for block in state.func_ir.blocks.values():
                    stale_scope = block.scope
                    # Same parent and location, but no variables defined.
                    block.scope = ir.Scope(
                        parent=stale_scope.parent, loc=stale_scope.loc
                    )
                return True

        # Pass that always fails; it acts as a stop marker in the pipeline.
        @register_pass(mutates_CFG=False, analysis_only=False)
        class FailPass(FunctionPass):
            _name = "_fail"

            def __init__(self, *args, **kwargs):
                FunctionPass.__init__(self)

            def run_pass(self, state):
                # Should never run: with `error.NumbaPedanticWarning`s raised
                # as errors, the SSA pass is expected to raise before this
                # pass is reached.
                raise AssertionError("unreachable")

        class MyCompiler(CompilerBase):
            def define_pipelines(self):
                pipeline = PassManager("testing pm")
                pipeline.add_pass(TranslateByteCode, "analyzing bytecode")
                pipeline.add_pass(IRProcessing, "processing IR")
                pipeline.add_pass(RemoveVarInScope, "_remove_var_in_scope")
                pipeline.add_pass(ReconstructSSA, "ssa")
                pipeline.add_pass(FailPass, "_fail")
                pipeline.finalize()
                return [pipeline]

        @njit(pipeline_class=MyCompiler)
        def dummy(x):
            # To trigger SSA and the pedantic check, this function must have
            # multiple assignments to the same variable in different blocks.
            a = 1
            b = 2
            if a < b:
                a = 2
            else:
                b = 3
            return a, b

        with warnings.catch_warnings():
            # Promote NumbaPedanticWarning to an error.
            warnings.simplefilter("error", errors.NumbaPedanticWarning)
            # The compilation is expected to raise NumbaIRAssumptionWarning.
            with self.assertRaises(errors.NumbaIRAssumptionWarning) as caught:
                dummy(1)
            # The message must name the variable that is out of scope.
            message = str(caught.exception)
            self.assertRegex(
                message,
                r"variable '[a-z]' is not in scope",
            )
595
+
596
+
597
# Run the tests in this module when the file is executed as a script.
if __name__ == "__main__":
    unittest.main()