numba-cuda 0.22.0__cp312-cp312-manylinux_2_24_aarch64.manylinux_2_28_aarch64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of numba-cuda might be problematic. Click here for more details.
- _numba_cuda_redirector.pth +4 -0
- _numba_cuda_redirector.py +89 -0
- numba_cuda/VERSION +1 -0
- numba_cuda/__init__.py +6 -0
- numba_cuda/_version.py +11 -0
- numba_cuda/numba/cuda/__init__.py +70 -0
- numba_cuda/numba/cuda/_internal/cuda_bf16.py +16394 -0
- numba_cuda/numba/cuda/_internal/cuda_fp16.py +8112 -0
- numba_cuda/numba/cuda/api.py +580 -0
- numba_cuda/numba/cuda/api_util.py +76 -0
- numba_cuda/numba/cuda/args.py +72 -0
- numba_cuda/numba/cuda/bf16.py +397 -0
- numba_cuda/numba/cuda/cache_hints.py +287 -0
- numba_cuda/numba/cuda/cext/__init__.py +2 -0
- numba_cuda/numba/cuda/cext/_devicearray.cpp +159 -0
- numba_cuda/numba/cuda/cext/_devicearray.cpython-312-aarch64-linux-gnu.so +0 -0
- numba_cuda/numba/cuda/cext/_devicearray.h +29 -0
- numba_cuda/numba/cuda/cext/_dispatcher.cpp +1098 -0
- numba_cuda/numba/cuda/cext/_dispatcher.cpython-312-aarch64-linux-gnu.so +0 -0
- numba_cuda/numba/cuda/cext/_hashtable.cpp +532 -0
- numba_cuda/numba/cuda/cext/_hashtable.h +135 -0
- numba_cuda/numba/cuda/cext/_helperlib.c +71 -0
- numba_cuda/numba/cuda/cext/_helperlib.cpython-312-aarch64-linux-gnu.so +0 -0
- numba_cuda/numba/cuda/cext/_helpermod.c +82 -0
- numba_cuda/numba/cuda/cext/_pymodule.h +38 -0
- numba_cuda/numba/cuda/cext/_typeconv.cpp +206 -0
- numba_cuda/numba/cuda/cext/_typeconv.cpython-312-aarch64-linux-gnu.so +0 -0
- numba_cuda/numba/cuda/cext/_typeof.cpp +1159 -0
- numba_cuda/numba/cuda/cext/_typeof.h +19 -0
- numba_cuda/numba/cuda/cext/capsulethunk.h +111 -0
- numba_cuda/numba/cuda/cext/mviewbuf.c +385 -0
- numba_cuda/numba/cuda/cext/mviewbuf.cpython-312-aarch64-linux-gnu.so +0 -0
- numba_cuda/numba/cuda/cext/typeconv.cpp +212 -0
- numba_cuda/numba/cuda/cext/typeconv.hpp +101 -0
- numba_cuda/numba/cuda/cg.py +67 -0
- numba_cuda/numba/cuda/cgutils.py +1294 -0
- numba_cuda/numba/cuda/cloudpickle/__init__.py +21 -0
- numba_cuda/numba/cuda/cloudpickle/cloudpickle.py +1598 -0
- numba_cuda/numba/cuda/cloudpickle/cloudpickle_fast.py +17 -0
- numba_cuda/numba/cuda/codegen.py +541 -0
- numba_cuda/numba/cuda/compiler.py +1396 -0
- numba_cuda/numba/cuda/core/analysis.py +758 -0
- numba_cuda/numba/cuda/core/annotations/__init__.py +0 -0
- numba_cuda/numba/cuda/core/annotations/pretty_annotate.py +288 -0
- numba_cuda/numba/cuda/core/annotations/type_annotations.py +305 -0
- numba_cuda/numba/cuda/core/base.py +1332 -0
- numba_cuda/numba/cuda/core/boxing.py +1411 -0
- numba_cuda/numba/cuda/core/bytecode.py +728 -0
- numba_cuda/numba/cuda/core/byteflow.py +2346 -0
- numba_cuda/numba/cuda/core/caching.py +744 -0
- numba_cuda/numba/cuda/core/callconv.py +392 -0
- numba_cuda/numba/cuda/core/codegen.py +171 -0
- numba_cuda/numba/cuda/core/compiler.py +199 -0
- numba_cuda/numba/cuda/core/compiler_lock.py +85 -0
- numba_cuda/numba/cuda/core/compiler_machinery.py +497 -0
- numba_cuda/numba/cuda/core/config.py +650 -0
- numba_cuda/numba/cuda/core/consts.py +124 -0
- numba_cuda/numba/cuda/core/controlflow.py +989 -0
- numba_cuda/numba/cuda/core/entrypoints.py +57 -0
- numba_cuda/numba/cuda/core/environment.py +66 -0
- numba_cuda/numba/cuda/core/errors.py +917 -0
- numba_cuda/numba/cuda/core/event.py +511 -0
- numba_cuda/numba/cuda/core/funcdesc.py +330 -0
- numba_cuda/numba/cuda/core/generators.py +387 -0
- numba_cuda/numba/cuda/core/imputils.py +509 -0
- numba_cuda/numba/cuda/core/inline_closurecall.py +1787 -0
- numba_cuda/numba/cuda/core/interpreter.py +3617 -0
- numba_cuda/numba/cuda/core/ir.py +1812 -0
- numba_cuda/numba/cuda/core/ir_utils.py +2638 -0
- numba_cuda/numba/cuda/core/optional.py +129 -0
- numba_cuda/numba/cuda/core/options.py +262 -0
- numba_cuda/numba/cuda/core/postproc.py +249 -0
- numba_cuda/numba/cuda/core/pythonapi.py +1859 -0
- numba_cuda/numba/cuda/core/registry.py +46 -0
- numba_cuda/numba/cuda/core/removerefctpass.py +123 -0
- numba_cuda/numba/cuda/core/rewrites/__init__.py +26 -0
- numba_cuda/numba/cuda/core/rewrites/ir_print.py +91 -0
- numba_cuda/numba/cuda/core/rewrites/registry.py +104 -0
- numba_cuda/numba/cuda/core/rewrites/static_binop.py +41 -0
- numba_cuda/numba/cuda/core/rewrites/static_getitem.py +189 -0
- numba_cuda/numba/cuda/core/rewrites/static_raise.py +100 -0
- numba_cuda/numba/cuda/core/sigutils.py +68 -0
- numba_cuda/numba/cuda/core/ssa.py +498 -0
- numba_cuda/numba/cuda/core/targetconfig.py +330 -0
- numba_cuda/numba/cuda/core/tracing.py +231 -0
- numba_cuda/numba/cuda/core/transforms.py +956 -0
- numba_cuda/numba/cuda/core/typed_passes.py +867 -0
- numba_cuda/numba/cuda/core/typeinfer.py +1950 -0
- numba_cuda/numba/cuda/core/unsafe/__init__.py +0 -0
- numba_cuda/numba/cuda/core/unsafe/bytes.py +67 -0
- numba_cuda/numba/cuda/core/unsafe/eh.py +67 -0
- numba_cuda/numba/cuda/core/unsafe/refcount.py +98 -0
- numba_cuda/numba/cuda/core/untyped_passes.py +1979 -0
- numba_cuda/numba/cuda/cpython/builtins.py +1153 -0
- numba_cuda/numba/cuda/cpython/charseq.py +1218 -0
- numba_cuda/numba/cuda/cpython/cmathimpl.py +560 -0
- numba_cuda/numba/cuda/cpython/enumimpl.py +103 -0
- numba_cuda/numba/cuda/cpython/iterators.py +167 -0
- numba_cuda/numba/cuda/cpython/listobj.py +1326 -0
- numba_cuda/numba/cuda/cpython/mathimpl.py +499 -0
- numba_cuda/numba/cuda/cpython/numbers.py +1475 -0
- numba_cuda/numba/cuda/cpython/rangeobj.py +289 -0
- numba_cuda/numba/cuda/cpython/slicing.py +322 -0
- numba_cuda/numba/cuda/cpython/tupleobj.py +456 -0
- numba_cuda/numba/cuda/cpython/unicode.py +2865 -0
- numba_cuda/numba/cuda/cpython/unicode_support.py +1597 -0
- numba_cuda/numba/cuda/cpython/unsafe/__init__.py +0 -0
- numba_cuda/numba/cuda/cpython/unsafe/numbers.py +64 -0
- numba_cuda/numba/cuda/cpython/unsafe/tuple.py +92 -0
- numba_cuda/numba/cuda/cuda_paths.py +691 -0
- numba_cuda/numba/cuda/cudadecl.py +543 -0
- numba_cuda/numba/cuda/cudadrv/__init__.py +14 -0
- numba_cuda/numba/cuda/cudadrv/devicearray.py +954 -0
- numba_cuda/numba/cuda/cudadrv/devices.py +249 -0
- numba_cuda/numba/cuda/cudadrv/driver.py +3238 -0
- numba_cuda/numba/cuda/cudadrv/drvapi.py +435 -0
- numba_cuda/numba/cuda/cudadrv/dummyarray.py +562 -0
- numba_cuda/numba/cuda/cudadrv/enums.py +613 -0
- numba_cuda/numba/cuda/cudadrv/error.py +48 -0
- numba_cuda/numba/cuda/cudadrv/libs.py +220 -0
- numba_cuda/numba/cuda/cudadrv/linkable_code.py +184 -0
- numba_cuda/numba/cuda/cudadrv/mappings.py +14 -0
- numba_cuda/numba/cuda/cudadrv/ndarray.py +26 -0
- numba_cuda/numba/cuda/cudadrv/nvrtc.py +193 -0
- numba_cuda/numba/cuda/cudadrv/nvvm.py +756 -0
- numba_cuda/numba/cuda/cudadrv/rtapi.py +13 -0
- numba_cuda/numba/cuda/cudadrv/runtime.py +34 -0
- numba_cuda/numba/cuda/cudaimpl.py +983 -0
- numba_cuda/numba/cuda/cudamath.py +149 -0
- numba_cuda/numba/cuda/datamodel/__init__.py +7 -0
- numba_cuda/numba/cuda/datamodel/cuda_manager.py +66 -0
- numba_cuda/numba/cuda/datamodel/cuda_models.py +1446 -0
- numba_cuda/numba/cuda/datamodel/cuda_packer.py +224 -0
- numba_cuda/numba/cuda/datamodel/cuda_registry.py +22 -0
- numba_cuda/numba/cuda/datamodel/cuda_testing.py +153 -0
- numba_cuda/numba/cuda/datamodel/manager.py +11 -0
- numba_cuda/numba/cuda/datamodel/models.py +9 -0
- numba_cuda/numba/cuda/datamodel/packer.py +9 -0
- numba_cuda/numba/cuda/datamodel/registry.py +11 -0
- numba_cuda/numba/cuda/datamodel/testing.py +11 -0
- numba_cuda/numba/cuda/debuginfo.py +997 -0
- numba_cuda/numba/cuda/decorators.py +294 -0
- numba_cuda/numba/cuda/descriptor.py +35 -0
- numba_cuda/numba/cuda/device_init.py +155 -0
- numba_cuda/numba/cuda/deviceufunc.py +1021 -0
- numba_cuda/numba/cuda/dispatcher.py +2463 -0
- numba_cuda/numba/cuda/errors.py +72 -0
- numba_cuda/numba/cuda/extending.py +697 -0
- numba_cuda/numba/cuda/flags.py +178 -0
- numba_cuda/numba/cuda/fp16.py +357 -0
- numba_cuda/numba/cuda/include/12/cuda_bf16.h +5118 -0
- numba_cuda/numba/cuda/include/12/cuda_bf16.hpp +3865 -0
- numba_cuda/numba/cuda/include/12/cuda_fp16.h +5363 -0
- numba_cuda/numba/cuda/include/12/cuda_fp16.hpp +3483 -0
- numba_cuda/numba/cuda/include/13/cuda_bf16.h +5118 -0
- numba_cuda/numba/cuda/include/13/cuda_bf16.hpp +3865 -0
- numba_cuda/numba/cuda/include/13/cuda_fp16.h +5363 -0
- numba_cuda/numba/cuda/include/13/cuda_fp16.hpp +3483 -0
- numba_cuda/numba/cuda/initialize.py +24 -0
- numba_cuda/numba/cuda/intrinsics.py +531 -0
- numba_cuda/numba/cuda/itanium_mangler.py +214 -0
- numba_cuda/numba/cuda/kernels/__init__.py +2 -0
- numba_cuda/numba/cuda/kernels/reduction.py +265 -0
- numba_cuda/numba/cuda/kernels/transpose.py +65 -0
- numba_cuda/numba/cuda/libdevice.py +3386 -0
- numba_cuda/numba/cuda/libdevicedecl.py +20 -0
- numba_cuda/numba/cuda/libdevicefuncs.py +1060 -0
- numba_cuda/numba/cuda/libdeviceimpl.py +88 -0
- numba_cuda/numba/cuda/locks.py +19 -0
- numba_cuda/numba/cuda/lowering.py +1980 -0
- numba_cuda/numba/cuda/mathimpl.py +374 -0
- numba_cuda/numba/cuda/memory_management/__init__.py +4 -0
- numba_cuda/numba/cuda/memory_management/memsys.cu +99 -0
- numba_cuda/numba/cuda/memory_management/memsys.cuh +22 -0
- numba_cuda/numba/cuda/memory_management/nrt.cu +212 -0
- numba_cuda/numba/cuda/memory_management/nrt.cuh +48 -0
- numba_cuda/numba/cuda/memory_management/nrt.py +390 -0
- numba_cuda/numba/cuda/memory_management/nrt_context.py +438 -0
- numba_cuda/numba/cuda/misc/appdirs.py +594 -0
- numba_cuda/numba/cuda/misc/cffiimpl.py +24 -0
- numba_cuda/numba/cuda/misc/coverage_support.py +43 -0
- numba_cuda/numba/cuda/misc/dump_style.py +41 -0
- numba_cuda/numba/cuda/misc/findlib.py +75 -0
- numba_cuda/numba/cuda/misc/firstlinefinder.py +96 -0
- numba_cuda/numba/cuda/misc/gdb_hook.py +240 -0
- numba_cuda/numba/cuda/misc/literal.py +28 -0
- numba_cuda/numba/cuda/misc/llvm_pass_timings.py +412 -0
- numba_cuda/numba/cuda/misc/special.py +94 -0
- numba_cuda/numba/cuda/models.py +56 -0
- numba_cuda/numba/cuda/np/arraymath.py +5130 -0
- numba_cuda/numba/cuda/np/arrayobj.py +7635 -0
- numba_cuda/numba/cuda/np/extensions.py +11 -0
- numba_cuda/numba/cuda/np/linalg.py +3087 -0
- numba_cuda/numba/cuda/np/math/__init__.py +0 -0
- numba_cuda/numba/cuda/np/math/cmathimpl.py +558 -0
- numba_cuda/numba/cuda/np/math/mathimpl.py +487 -0
- numba_cuda/numba/cuda/np/math/numbers.py +1461 -0
- numba_cuda/numba/cuda/np/npdatetime.py +969 -0
- numba_cuda/numba/cuda/np/npdatetime_helpers.py +217 -0
- numba_cuda/numba/cuda/np/npyfuncs.py +1808 -0
- numba_cuda/numba/cuda/np/npyimpl.py +1027 -0
- numba_cuda/numba/cuda/np/numpy_support.py +798 -0
- numba_cuda/numba/cuda/np/polynomial/__init__.py +4 -0
- numba_cuda/numba/cuda/np/polynomial/polynomial_core.py +242 -0
- numba_cuda/numba/cuda/np/polynomial/polynomial_functions.py +380 -0
- numba_cuda/numba/cuda/np/ufunc/__init__.py +4 -0
- numba_cuda/numba/cuda/np/ufunc/decorators.py +203 -0
- numba_cuda/numba/cuda/np/ufunc/sigparse.py +68 -0
- numba_cuda/numba/cuda/np/ufunc/ufuncbuilder.py +65 -0
- numba_cuda/numba/cuda/np/ufunc_db.py +1282 -0
- numba_cuda/numba/cuda/np/unsafe/__init__.py +0 -0
- numba_cuda/numba/cuda/np/unsafe/ndarray.py +84 -0
- numba_cuda/numba/cuda/nvvmutils.py +254 -0
- numba_cuda/numba/cuda/printimpl.py +126 -0
- numba_cuda/numba/cuda/random.py +308 -0
- numba_cuda/numba/cuda/reshape_funcs.cu +156 -0
- numba_cuda/numba/cuda/serialize.py +267 -0
- numba_cuda/numba/cuda/simulator/__init__.py +63 -0
- numba_cuda/numba/cuda/simulator/_internal/__init__.py +4 -0
- numba_cuda/numba/cuda/simulator/_internal/cuda_bf16.py +2 -0
- numba_cuda/numba/cuda/simulator/api.py +179 -0
- numba_cuda/numba/cuda/simulator/bf16.py +4 -0
- numba_cuda/numba/cuda/simulator/compiler.py +38 -0
- numba_cuda/numba/cuda/simulator/cudadrv/__init__.py +11 -0
- numba_cuda/numba/cuda/simulator/cudadrv/devicearray.py +462 -0
- numba_cuda/numba/cuda/simulator/cudadrv/devices.py +122 -0
- numba_cuda/numba/cuda/simulator/cudadrv/driver.py +66 -0
- numba_cuda/numba/cuda/simulator/cudadrv/drvapi.py +7 -0
- numba_cuda/numba/cuda/simulator/cudadrv/dummyarray.py +7 -0
- numba_cuda/numba/cuda/simulator/cudadrv/error.py +10 -0
- numba_cuda/numba/cuda/simulator/cudadrv/libs.py +10 -0
- numba_cuda/numba/cuda/simulator/cudadrv/linkable_code.py +61 -0
- numba_cuda/numba/cuda/simulator/cudadrv/nvrtc.py +11 -0
- numba_cuda/numba/cuda/simulator/cudadrv/nvvm.py +32 -0
- numba_cuda/numba/cuda/simulator/cudadrv/runtime.py +22 -0
- numba_cuda/numba/cuda/simulator/dispatcher.py +11 -0
- numba_cuda/numba/cuda/simulator/kernel.py +320 -0
- numba_cuda/numba/cuda/simulator/kernelapi.py +509 -0
- numba_cuda/numba/cuda/simulator/memory_management/__init__.py +4 -0
- numba_cuda/numba/cuda/simulator/memory_management/nrt.py +21 -0
- numba_cuda/numba/cuda/simulator/reduction.py +19 -0
- numba_cuda/numba/cuda/simulator/tests/support.py +4 -0
- numba_cuda/numba/cuda/simulator/vector_types.py +65 -0
- numba_cuda/numba/cuda/simulator_init.py +18 -0
- numba_cuda/numba/cuda/stubs.py +624 -0
- numba_cuda/numba/cuda/target.py +505 -0
- numba_cuda/numba/cuda/testing.py +347 -0
- numba_cuda/numba/cuda/tests/__init__.py +62 -0
- numba_cuda/numba/cuda/tests/benchmarks/__init__.py +0 -0
- numba_cuda/numba/cuda/tests/benchmarks/test_kernel_launch.py +119 -0
- numba_cuda/numba/cuda/tests/cloudpickle_main_class.py +9 -0
- numba_cuda/numba/cuda/tests/core/serialize_usecases.py +113 -0
- numba_cuda/numba/cuda/tests/core/test_itanium_mangler.py +83 -0
- numba_cuda/numba/cuda/tests/core/test_serialize.py +371 -0
- numba_cuda/numba/cuda/tests/cudadrv/__init__.py +9 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_array_attr.py +147 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_context_stack.py +161 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_array_slicing.py +397 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_auto_context.py +24 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_devicerecord.py +180 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_driver.py +313 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_memory.py +191 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_ndarray.py +621 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_deallocations.py +247 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_detect.py +100 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_emm_plugins.py +200 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_events.py +53 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_host_alloc.py +72 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_init.py +138 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_inline_ptx.py +43 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_is_fp16.py +15 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_linkable_code.py +58 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_linker.py +348 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_managed_alloc.py +128 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_module_callbacks.py +301 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_nvjitlink.py +174 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_nvrtc.py +28 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_nvvm_driver.py +185 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_pinned.py +39 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_profiler.py +23 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_reset_device.py +38 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_runtime.py +48 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_select_device.py +44 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_streams.py +127 -0
- numba_cuda/numba/cuda/tests/cudapy/__init__.py +9 -0
- numba_cuda/numba/cuda/tests/cudapy/cache_usecases.py +231 -0
- numba_cuda/numba/cuda/tests/cudapy/cache_with_cpu_usecases.py +50 -0
- numba_cuda/numba/cuda/tests/cudapy/cg_cache_usecases.py +36 -0
- numba_cuda/numba/cuda/tests/cudapy/complex_usecases.py +116 -0
- numba_cuda/numba/cuda/tests/cudapy/enum_usecases.py +59 -0
- numba_cuda/numba/cuda/tests/cudapy/extensions_usecases.py +62 -0
- numba_cuda/numba/cuda/tests/cudapy/jitlink.ptx +28 -0
- numba_cuda/numba/cuda/tests/cudapy/overload_usecases.py +33 -0
- numba_cuda/numba/cuda/tests/cudapy/recursion_usecases.py +104 -0
- numba_cuda/numba/cuda/tests/cudapy/test_alignment.py +47 -0
- numba_cuda/numba/cuda/tests/cudapy/test_analysis.py +1122 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array.py +344 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array_alignment.py +268 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array_args.py +203 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array_methods.py +63 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array_reductions.py +360 -0
- numba_cuda/numba/cuda/tests/cudapy/test_atomics.py +1815 -0
- numba_cuda/numba/cuda/tests/cudapy/test_bfloat16.py +599 -0
- numba_cuda/numba/cuda/tests/cudapy/test_bfloat16_bindings.py +377 -0
- numba_cuda/numba/cuda/tests/cudapy/test_blackscholes.py +160 -0
- numba_cuda/numba/cuda/tests/cudapy/test_boolean.py +27 -0
- numba_cuda/numba/cuda/tests/cudapy/test_byteflow.py +98 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cache_hints.py +210 -0
- numba_cuda/numba/cuda/tests/cudapy/test_caching.py +683 -0
- numba_cuda/numba/cuda/tests/cudapy/test_casting.py +265 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cffi.py +42 -0
- numba_cuda/numba/cuda/tests/cudapy/test_compiler.py +718 -0
- numba_cuda/numba/cuda/tests/cudapy/test_complex.py +370 -0
- numba_cuda/numba/cuda/tests/cudapy/test_complex_kernel.py +23 -0
- numba_cuda/numba/cuda/tests/cudapy/test_const_string.py +142 -0
- numba_cuda/numba/cuda/tests/cudapy/test_constmem.py +178 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cooperative_groups.py +193 -0
- numba_cuda/numba/cuda/tests/cudapy/test_copy_propagate.py +131 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cuda_array_interface.py +438 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cuda_jit_no_types.py +94 -0
- numba_cuda/numba/cuda/tests/cudapy/test_datetime.py +101 -0
- numba_cuda/numba/cuda/tests/cudapy/test_debug.py +105 -0
- numba_cuda/numba/cuda/tests/cudapy/test_debuginfo.py +978 -0
- numba_cuda/numba/cuda/tests/cudapy/test_debuginfo_types.py +476 -0
- numba_cuda/numba/cuda/tests/cudapy/test_device_func.py +500 -0
- numba_cuda/numba/cuda/tests/cudapy/test_dispatcher.py +820 -0
- numba_cuda/numba/cuda/tests/cudapy/test_enums.py +152 -0
- numba_cuda/numba/cuda/tests/cudapy/test_errors.py +111 -0
- numba_cuda/numba/cuda/tests/cudapy/test_exception.py +170 -0
- numba_cuda/numba/cuda/tests/cudapy/test_extending.py +1088 -0
- numba_cuda/numba/cuda/tests/cudapy/test_extending_types.py +71 -0
- numba_cuda/numba/cuda/tests/cudapy/test_fastmath.py +265 -0
- numba_cuda/numba/cuda/tests/cudapy/test_flow_control.py +1433 -0
- numba_cuda/numba/cuda/tests/cudapy/test_forall.py +57 -0
- numba_cuda/numba/cuda/tests/cudapy/test_freevar.py +34 -0
- numba_cuda/numba/cuda/tests/cudapy/test_frexp_ldexp.py +69 -0
- numba_cuda/numba/cuda/tests/cudapy/test_globals.py +62 -0
- numba_cuda/numba/cuda/tests/cudapy/test_gufunc.py +474 -0
- numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scalar.py +167 -0
- numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scheduling.py +92 -0
- numba_cuda/numba/cuda/tests/cudapy/test_idiv.py +39 -0
- numba_cuda/numba/cuda/tests/cudapy/test_inline.py +170 -0
- numba_cuda/numba/cuda/tests/cudapy/test_inspect.py +255 -0
- numba_cuda/numba/cuda/tests/cudapy/test_intrinsics.py +1219 -0
- numba_cuda/numba/cuda/tests/cudapy/test_ipc.py +263 -0
- numba_cuda/numba/cuda/tests/cudapy/test_ir.py +598 -0
- numba_cuda/numba/cuda/tests/cudapy/test_ir_utils.py +276 -0
- numba_cuda/numba/cuda/tests/cudapy/test_iterators.py +101 -0
- numba_cuda/numba/cuda/tests/cudapy/test_lang.py +68 -0
- numba_cuda/numba/cuda/tests/cudapy/test_laplace.py +123 -0
- numba_cuda/numba/cuda/tests/cudapy/test_libdevice.py +194 -0
- numba_cuda/numba/cuda/tests/cudapy/test_lineinfo.py +220 -0
- numba_cuda/numba/cuda/tests/cudapy/test_localmem.py +173 -0
- numba_cuda/numba/cuda/tests/cudapy/test_make_function_to_jit_function.py +364 -0
- numba_cuda/numba/cuda/tests/cudapy/test_mandel.py +47 -0
- numba_cuda/numba/cuda/tests/cudapy/test_math.py +842 -0
- numba_cuda/numba/cuda/tests/cudapy/test_matmul.py +76 -0
- numba_cuda/numba/cuda/tests/cudapy/test_minmax.py +78 -0
- numba_cuda/numba/cuda/tests/cudapy/test_montecarlo.py +25 -0
- numba_cuda/numba/cuda/tests/cudapy/test_multigpu.py +145 -0
- numba_cuda/numba/cuda/tests/cudapy/test_multiprocessing.py +39 -0
- numba_cuda/numba/cuda/tests/cudapy/test_multithreads.py +82 -0
- numba_cuda/numba/cuda/tests/cudapy/test_nondet.py +53 -0
- numba_cuda/numba/cuda/tests/cudapy/test_operator.py +504 -0
- numba_cuda/numba/cuda/tests/cudapy/test_optimization.py +93 -0
- numba_cuda/numba/cuda/tests/cudapy/test_overload.py +402 -0
- numba_cuda/numba/cuda/tests/cudapy/test_powi.py +128 -0
- numba_cuda/numba/cuda/tests/cudapy/test_print.py +193 -0
- numba_cuda/numba/cuda/tests/cudapy/test_py2_div_issue.py +37 -0
- numba_cuda/numba/cuda/tests/cudapy/test_random.py +117 -0
- numba_cuda/numba/cuda/tests/cudapy/test_record_dtype.py +614 -0
- numba_cuda/numba/cuda/tests/cudapy/test_recursion.py +130 -0
- numba_cuda/numba/cuda/tests/cudapy/test_reduction.py +94 -0
- numba_cuda/numba/cuda/tests/cudapy/test_retrieve_autoconverted_arrays.py +83 -0
- numba_cuda/numba/cuda/tests/cudapy/test_serialize.py +86 -0
- numba_cuda/numba/cuda/tests/cudapy/test_slicing.py +40 -0
- numba_cuda/numba/cuda/tests/cudapy/test_sm.py +457 -0
- numba_cuda/numba/cuda/tests/cudapy/test_sm_creation.py +233 -0
- numba_cuda/numba/cuda/tests/cudapy/test_ssa.py +454 -0
- numba_cuda/numba/cuda/tests/cudapy/test_stream_api.py +56 -0
- numba_cuda/numba/cuda/tests/cudapy/test_sync.py +277 -0
- numba_cuda/numba/cuda/tests/cudapy/test_tracing.py +200 -0
- numba_cuda/numba/cuda/tests/cudapy/test_transpose.py +90 -0
- numba_cuda/numba/cuda/tests/cudapy/test_typeconv.py +333 -0
- numba_cuda/numba/cuda/tests/cudapy/test_typeinfer.py +538 -0
- numba_cuda/numba/cuda/tests/cudapy/test_ufuncs.py +585 -0
- numba_cuda/numba/cuda/tests/cudapy/test_userexc.py +42 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vector_type.py +485 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize.py +312 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_complex.py +23 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_decor.py +183 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_device.py +40 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_scalar_arg.py +40 -0
- numba_cuda/numba/cuda/tests/cudapy/test_warning.py +206 -0
- numba_cuda/numba/cuda/tests/cudapy/test_warp_ops.py +446 -0
- numba_cuda/numba/cuda/tests/cudasim/__init__.py +9 -0
- numba_cuda/numba/cuda/tests/cudasim/support.py +9 -0
- numba_cuda/numba/cuda/tests/cudasim/test_cudasim_issues.py +111 -0
- numba_cuda/numba/cuda/tests/data/__init__.py +2 -0
- numba_cuda/numba/cuda/tests/data/cta_barrier.cu +28 -0
- numba_cuda/numba/cuda/tests/data/cuda_include.cu +10 -0
- numba_cuda/numba/cuda/tests/data/error.cu +12 -0
- numba_cuda/numba/cuda/tests/data/include/add.cuh +8 -0
- numba_cuda/numba/cuda/tests/data/jitlink.cu +28 -0
- numba_cuda/numba/cuda/tests/data/jitlink.ptx +49 -0
- numba_cuda/numba/cuda/tests/data/warn.cu +12 -0
- numba_cuda/numba/cuda/tests/doc_examples/__init__.py +9 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/__init__.py +2 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/functions.cu +54 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/include/mul.cuh +8 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/saxpy.cu +14 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_cg.py +86 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_cpointer.py +68 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_cpu_gpu_compat.py +81 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_ffi.py +141 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_laplace.py +160 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_matmul.py +180 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_montecarlo.py +119 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_random.py +66 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_reduction.py +80 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_sessionize.py +206 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_ufunc.py +53 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_vecadd.py +76 -0
- numba_cuda/numba/cuda/tests/nocuda/__init__.py +9 -0
- numba_cuda/numba/cuda/tests/nocuda/test_dummyarray.py +452 -0
- numba_cuda/numba/cuda/tests/nocuda/test_function_resolution.py +48 -0
- numba_cuda/numba/cuda/tests/nocuda/test_import.py +63 -0
- numba_cuda/numba/cuda/tests/nocuda/test_library_lookup.py +252 -0
- numba_cuda/numba/cuda/tests/nocuda/test_nvvm.py +59 -0
- numba_cuda/numba/cuda/tests/nrt/__init__.py +9 -0
- numba_cuda/numba/cuda/tests/nrt/test_nrt.py +387 -0
- numba_cuda/numba/cuda/tests/nrt/test_nrt_refct.py +124 -0
- numba_cuda/numba/cuda/tests/support.py +900 -0
- numba_cuda/numba/cuda/typeconv/__init__.py +4 -0
- numba_cuda/numba/cuda/typeconv/castgraph.py +137 -0
- numba_cuda/numba/cuda/typeconv/rules.py +63 -0
- numba_cuda/numba/cuda/typeconv/typeconv.py +121 -0
- numba_cuda/numba/cuda/types/__init__.py +233 -0
- numba_cuda/numba/cuda/types/__init__.pyi +167 -0
- numba_cuda/numba/cuda/types/abstract.py +9 -0
- numba_cuda/numba/cuda/types/common.py +9 -0
- numba_cuda/numba/cuda/types/containers.py +9 -0
- numba_cuda/numba/cuda/types/cuda_abstract.py +533 -0
- numba_cuda/numba/cuda/types/cuda_common.py +110 -0
- numba_cuda/numba/cuda/types/cuda_containers.py +971 -0
- numba_cuda/numba/cuda/types/cuda_function_type.py +230 -0
- numba_cuda/numba/cuda/types/cuda_functions.py +798 -0
- numba_cuda/numba/cuda/types/cuda_iterators.py +120 -0
- numba_cuda/numba/cuda/types/cuda_misc.py +569 -0
- numba_cuda/numba/cuda/types/cuda_npytypes.py +690 -0
- numba_cuda/numba/cuda/types/cuda_scalars.py +280 -0
- numba_cuda/numba/cuda/types/ext_types.py +101 -0
- numba_cuda/numba/cuda/types/function_type.py +11 -0
- numba_cuda/numba/cuda/types/functions.py +9 -0
- numba_cuda/numba/cuda/types/iterators.py +9 -0
- numba_cuda/numba/cuda/types/misc.py +9 -0
- numba_cuda/numba/cuda/types/npytypes.py +9 -0
- numba_cuda/numba/cuda/types/scalars.py +9 -0
- numba_cuda/numba/cuda/typing/__init__.py +19 -0
- numba_cuda/numba/cuda/typing/arraydecl.py +939 -0
- numba_cuda/numba/cuda/typing/asnumbatype.py +130 -0
- numba_cuda/numba/cuda/typing/bufproto.py +70 -0
- numba_cuda/numba/cuda/typing/builtins.py +1209 -0
- numba_cuda/numba/cuda/typing/cffi_utils.py +219 -0
- numba_cuda/numba/cuda/typing/cmathdecl.py +47 -0
- numba_cuda/numba/cuda/typing/collections.py +138 -0
- numba_cuda/numba/cuda/typing/context.py +782 -0
- numba_cuda/numba/cuda/typing/ctypes_utils.py +125 -0
- numba_cuda/numba/cuda/typing/dictdecl.py +63 -0
- numba_cuda/numba/cuda/typing/enumdecl.py +74 -0
- numba_cuda/numba/cuda/typing/listdecl.py +147 -0
- numba_cuda/numba/cuda/typing/mathdecl.py +158 -0
- numba_cuda/numba/cuda/typing/npdatetime.py +322 -0
- numba_cuda/numba/cuda/typing/npydecl.py +749 -0
- numba_cuda/numba/cuda/typing/setdecl.py +115 -0
- numba_cuda/numba/cuda/typing/templates.py +1446 -0
- numba_cuda/numba/cuda/typing/typeof.py +301 -0
- numba_cuda/numba/cuda/ufuncs.py +746 -0
- numba_cuda/numba/cuda/utils.py +724 -0
- numba_cuda/numba/cuda/vector_types.py +214 -0
- numba_cuda/numba/cuda/vectorizers.py +260 -0
- numba_cuda-0.22.0.dist-info/METADATA +109 -0
- numba_cuda-0.22.0.dist-info/RECORD +487 -0
- numba_cuda-0.22.0.dist-info/WHEEL +6 -0
- numba_cuda-0.22.0.dist-info/licenses/LICENSE +26 -0
- numba_cuda-0.22.0.dist-info/licenses/LICENSE.numba +24 -0
- numba_cuda-0.22.0.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,224 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
from collections import deque
|
|
5
|
+
|
|
6
|
+
from numba.cuda import types
|
|
7
|
+
from numba.cuda import cgutils
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
class DataPacker(object):
    """
    Pack a sequence of typed values into one anonymous data structure.

    Positions whose front-end type is an instance of ``types.Omitted`` are
    left out of the packed structure.
    """

    # XXX should DataPacker be a model for a dedicated type?

    def __init__(self, dmm, fe_types):
        self._dmm = dmm
        self._fe_types = fe_types
        # A model is looked up for every type, Omitted ones included.
        self._models = [dmm.lookup(fe_type) for fe_type in fe_types]

        # _pack_map[k] is the formal position of the k-th packed member and
        # _be_types[k] is the data type reported by that member's model.
        self._pack_map = []
        self._be_types = []
        for pos, (fe_type, model) in enumerate(zip(fe_types, self._models)):
            if isinstance(fe_type, types.Omitted):
                continue
            self._pack_map.append(pos)
            self._be_types.append(model.get_data_type())

    def as_data(self, builder, values):
        """
        Convert each non-omitted value to its data representation and
        return them bundled as an anonymous struct.
        """
        packed = []
        for pos in self._pack_map:
            packed.append(self._models[pos].as_data(builder, values[pos]))
        return cgutils.make_anonymous_struct(builder, packed)

    def _do_load(self, builder, ptr, formal_list=None):
        # Shared implementation of load() and load_into(): when no
        # formal_list is given, (type, value) pairs are collected and
        # returned; otherwise values are stored into formal_list at their
        # formal positions and the returned list stays empty.
        collect = formal_list is None
        loaded = []
        for slot, formal_pos in enumerate(self._pack_map):
            # `slot` indexes the packed struct, `formal_pos` the original
            # (unfiltered) argument list.
            member_ptr = cgutils.gep_inbounds(builder, ptr, 0, slot)
            model = self._models[formal_pos]
            value = model.load_from_data_pointer(builder, member_ptr)
            if collect:
                loaded.append((self._fe_types[formal_pos], value))
            else:
                formal_list[formal_pos] = value
        return loaded

    def load(self, builder, ptr):
        """
        Load the packed values and return them as a list of
        (type, value) tuples.
        """
        return self._do_load(builder, ptr)

    def load_into(self, builder, ptr, formal_list):
        """
        Load the packed values into *formal_list*, a sequence indexed by
        formal argument number (Omitted positions are not written).
        """
        self._do_load(builder, ptr, formal_list)
|
|
65
|
+
|
|
66
|
+
|
|
67
|
+
class ArgPacker(object):
    """
    Compute the position for each high-level typed argument.

    Every composite argument is flattened into primitive types, and a
    position map is kept so the flat sequence can be unflattened again.

    Since structs (esp. nested structs) have specific ABI requirements (e.g.
    alignment, pointer address-space, ...) on different architectures (e.g.
    OpenCL, CUDA), flattening composite argument types simplifies the call
    setup from the Python side. Functions receive simple primitive types
    and there are only a handful of these.
    """

    def __init__(self, dmm, fe_args):
        self._dmm = dmm
        self._fe_args = fe_args
        self._nargs = len(fe_args)

        # map() is lazy, so each model is looked up and then immediately
        # asked for its argument type before the next lookup happens.
        paired = [
            (model, model.get_argument_type())
            for model in map(dmm.lookup, fe_args)
        ]
        self._dm_args = [model for model, _ in paired]
        argtys = [argty for _, argty in paired]

        self._unflattener = _Unflattener(argtys)
        self._be_args = list(_flatten(argtys))

    def as_arguments(self, builder, values):
        """Flatten all argument values into a tuple.

        Raises TypeError when the number of values differs from the number
        of front-end arguments given at construction.
        """
        nvalues = len(values)
        if nvalues != self._nargs:
            raise TypeError(
                "invalid number of args: expected %d, got %d"
                % (self._nargs, nvalues)
            )

        if not values:
            return ()

        lowered = []
        for model, value in zip(self._dm_args, values):
            lowered.append(model.as_argument(builder, value))
        return tuple(_flatten(lowered))

    def from_arguments(self, builder, args):
        """Unflatten all argument values and return them as a list."""
        nested = self._unflattener.unflatten(args)
        rebuilt = []
        for model, value in zip(self._dm_args, nested):
            rebuilt.append(model.from_argument(builder, value))
        return rebuilt

    def assign_names(self, args, names):
        """Assign a name to each flattened argument value."""
        nested = self._unflattener.unflatten(args)
        for value, base_name in zip(nested, names):
            self._assign_names(value, base_name)

    def _assign_names(self, val_or_nested, name, depth=()):
        # Leaf: name it "<name>.<i>.<j>..." where the suffix is the path of
        # positions leading to it; empty components are dropped.
        if not isinstance(val_or_nested, (tuple, list)):
            suffix = ".".join(str(step) for step in depth)
            val_or_nested.name = ".".join(
                part for part in (name, suffix) if part
            )
            return

        # Nested sequence: recurse, extending the path with each position.
        for index, member in enumerate(val_or_nested):
            self._assign_names(member, name, depth=depth + (index,))

    @property
    def argument_types(self):
        """Return a tuple of the flattened argument types, with any empty
        tuple entries removed.
        """
        return tuple(filter(lambda ty: ty != (), self._be_args))
|
|
146
|
+
|
|
147
|
+
|
|
148
|
+
def _flatten(iterable):
    """
    Lazily flatten a nested iterable of (tuple, list).

    Items that are tuples or lists are descended into, depth first and in
    order; every other item is yielded unchanged.  Empty tuples/lists
    contribute nothing.  Only ``tuple`` and ``list`` instances count as
    containers, so strings and other iterables are yielded as single items.
    """
    for item in iterable:
        if isinstance(item, (tuple, list)):
            # Delegate to the nested generator instead of re-yielding by hand.
            yield from _flatten(item)
        else:
            yield item
|
|
162
|
+
|
|
163
|
+
|
|
164
|
+
# Opcodes of the small instruction sequence that _Unflattener builds from a
# pattern and later replays over a flat sequence of values.
_PUSH_LIST = 1
_APPEND_NEXT_VALUE = 2
_APPEND_EMPTY_TUPLE = 3
_POP = 4


class _Unflattener(object):
    """
    An object used to unflatten nested sequences after a given pattern
    (an arbitrarily nested sequence).
    The pattern shows the nested sequence shape desired when unflattening;
    the values it contains are irrelevant.
    """

    def __init__(self, pattern):
        # Compile the pattern once; unflatten() only replays the opcodes.
        self._code = self._build_unflatten_code(pattern)

    def _build_unflatten_code(self, iterable):
        """Build the unflatten opcode sequence for the given *iterable* structure
        (an iterable of nested sequences).

        Non-empty tuples/lists become a ``_PUSH_LIST`` ... ``_POP`` pair
        around their contents, empty ones a single ``_APPEND_EMPTY_TUPLE``,
        and every other item an ``_APPEND_NEXT_VALUE``.
        """
        code = []

        def rec(iterable):
            for i in iterable:
                if isinstance(i, (tuple, list)):
                    if len(i) > 0:
                        code.append(_PUSH_LIST)
                        rec(i)
                        code.append(_POP)
                    else:
                        code.append(_APPEND_EMPTY_TUPLE)
                else:
                    code.append(_APPEND_NEXT_VALUE)

        rec(iterable)
        return code

    def unflatten(self, flatiter):
        """Rebuild the nested structure described by the pattern.

        Values are taken from *flatiter* in order.  The result is a list in
        which every non-empty nested sequence of the pattern is a list and
        every empty one is ``()``.

        Running out of values raises IndexError (from ``deque.popleft``);
        leftover values trip the trailing assertion.
        """
        vals = deque(flatiter)

        res = []
        cur = res
        stack = []
        for op in self._code:
            # Opcodes are plain integers: compare by value, not identity.
            if op == _PUSH_LIST:
                stack.append(cur)
                cur.append([])
                cur = cur[-1]
            elif op == _APPEND_NEXT_VALUE:
                cur.append(vals.popleft())
            elif op == _APPEND_EMPTY_TUPLE:
                cur.append(())
            elif op == _POP:
                cur = stack.pop()

        assert not stack, stack
        assert not vals, vals

        return res
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
import functools
|
|
5
|
+
from .manager import DataModelManager
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
def register(dmm, typecls):
    """Decorator factory that simplifies datamodel registration.

    The returned decorator calls ``dmm.register(typecls, obj)`` on the
    decorated object and hands that same object back, so decorators can
    be chained.
    """

    def decorator(model):
        dmm.register(typecls, model)
        return model

    return decorator
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
# Module-level DataModelManager instance shared by importers of this module.
default_manager = DataModelManager()

# `register` with its first argument pre-bound to `default_manager`, so it is
# called with just the type class: `@register_default(SomeType)`.
register_default = functools.partial(register, default_manager)
|
|
@@ -0,0 +1,153 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
from llvmlite import ir
|
|
5
|
+
from llvmlite import binding as ll
|
|
6
|
+
|
|
7
|
+
from numba.cuda import datamodel
|
|
8
|
+
import unittest
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
class DataModelTester(unittest.TestCase):
    """
    Test the implementation of a DataModel for a frontend type.

    ``fe_type`` is only a placeholder here (``NotImplemented``); ``setUp``
    uses it as the key to fetch the model under test from
    ``datamodel.default_manager``.
    """

    fe_type = NotImplemented

    def setUp(self):
        """Create a fresh IR module and look up the model for ``fe_type``."""
        self.module = ir.Module()
        self.datamodel = datamodel.default_manager[self.fe_type]

    def test_as_arg(self):
        """
        - Are as_argument() and from_argument() implemented?
        - Are they the inverse of each other?
        """
        fnty = ir.FunctionType(ir.VoidType(), [])
        function = ir.Function(self.module, fnty, name="test_as_arg")
        builder = ir.IRBuilder()
        builder.position_at_end(function.append_basic_block())

        undef_value = ir.Constant(self.datamodel.get_value_type(), None)
        args = self.datamodel.as_argument(builder, undef_value)
        # The check is against the NotImplemented sentinel, so the message
        # names that sentinel (not the NotImplementedError exception).
        self.assertIsNot(
            args, NotImplemented, "as_argument returned NotImplemented"
        )

        if isinstance(args, (tuple, list)):

            def recur_tuplize(args, func=None):
                # Mirror the nesting of *args* as nested tuples, optionally
                # mapping every leaf through *func*.
                for arg in args:
                    if isinstance(arg, (tuple, list)):
                        yield tuple(recur_tuplize(arg, func=func))
                    elif func is None:
                        yield arg
                    else:
                        yield func(arg)

            argtypes = tuple(recur_tuplize(args, func=lambda x: x.type))
            exptypes = tuple(recur_tuplize(self.datamodel.get_argument_type()))
            self.assertEqual(exptypes, argtypes)
        else:
            self.assertEqual(args.type, self.datamodel.get_argument_type())

        rev_value = self.datamodel.from_argument(builder, args)
        self.assertEqual(rev_value.type, self.datamodel.get_value_type())

        builder.ret_void()  # end function

        # Ensure valid LLVM generation
        materialized = ll.parse_assembly(str(self.module))
        str(materialized)

    def test_as_return(self):
        """
        - Are as_return() and from_return() implemented?
        - Are they the inverse of each other?
        """
        fnty = ir.FunctionType(ir.VoidType(), [])
        function = ir.Function(self.module, fnty, name="test_as_return")
        builder = ir.IRBuilder()
        builder.position_at_end(function.append_basic_block())

        undef_value = ir.Constant(self.datamodel.get_value_type(), None)
        ret = self.datamodel.as_return(builder, undef_value)
        # Same sentinel check as in test_as_arg.
        self.assertIsNot(
            ret, NotImplemented, "as_return returned NotImplemented"
        )

        self.assertEqual(ret.type, self.datamodel.get_return_type())

        rev_value = self.datamodel.from_return(builder, ret)
        self.assertEqual(rev_value.type, self.datamodel.get_value_type())

        builder.ret_void()  # end function

        # Ensure valid LLVM generation
        materialized = ll.parse_assembly(str(self.module))
        str(materialized)
|
|
64
|
+
|
|
65
|
+
def test_as_return(self):
|
|
66
|
+
"""
|
|
67
|
+
- Is as_return() and from_return() implemented?
|
|
68
|
+
- Are they the inverse of each other?
|
|
69
|
+
"""
|
|
70
|
+
fnty = ir.FunctionType(ir.VoidType(), [])
|
|
71
|
+
function = ir.Function(self.module, fnty, name="test_as_return")
|
|
72
|
+
builder = ir.IRBuilder()
|
|
73
|
+
builder.position_at_end(function.append_basic_block())
|
|
74
|
+
|
|
75
|
+
undef_value = ir.Constant(self.datamodel.get_value_type(), None)
|
|
76
|
+
ret = self.datamodel.as_return(builder, undef_value)
|
|
77
|
+
self.assertIsNot(
|
|
78
|
+
ret, NotImplemented, "as_return returned NotImplementedError"
|
|
79
|
+
)
|
|
80
|
+
|
|
81
|
+
self.assertEqual(ret.type, self.datamodel.get_return_type())
|
|
82
|
+
|
|
83
|
+
rev_value = self.datamodel.from_return(builder, ret)
|
|
84
|
+
self.assertEqual(rev_value.type, self.datamodel.get_value_type())
|
|
85
|
+
|
|
86
|
+
builder.ret_void() # end function
|
|
87
|
+
|
|
88
|
+
# Ensure valid LLVM generation
|
|
89
|
+
materialized = ll.parse_assembly(str(self.module))
|
|
90
|
+
str(materialized)
|
|
91
|
+
|
|
92
|
+
|
|
93
|
+
class SupportAsDataMixin(object):
    """Checks for models that implement as_data() and from_data().

    Relies on ``self.module`` and ``self.datamodel`` being set on the
    test case this mixin is combined with.
    """

    # XXX test load_from_data_pointer() as well

    def test_as_data(self):
        """Convert a value with as_data()/from_data() and compare the
        resulting LLVM types with the ones the model advertises."""
        model = self.datamodel

        signature = ir.FunctionType(ir.VoidType(), [])
        fn = ir.Function(self.module, signature, name="test_as_data")
        builder = ir.IRBuilder()
        entry_block = fn.append_basic_block()
        builder.position_at_end(entry_block)

        value = ir.Constant(model.get_value_type(), None)
        as_data = model.as_data(builder, value)
        self.assertIsNot(
            as_data, NotImplemented, "as_data returned NotImplemented"
        )
        self.assertEqual(as_data.type, model.get_data_type())

        round_tripped = model.from_data(builder, as_data)
        self.assertEqual(round_tripped.type, model.get_value_type())

        # Terminate the function so the module is complete.
        builder.ret_void()

        # The textual IR must be accepted by the LLVM assembly parser.
        parsed = ll.parse_assembly(str(self.module))
        str(parsed)
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
class NotSupportAsDataMixin(object):
    """Checks that as_data() and from_data() raise NotImplementedError.

    Relies on ``self.module`` and ``self.datamodel`` being set on the
    test case this mixin is combined with.
    """

    def test_as_data_not_supported(self):
        """Both conversions must refuse to run for this model."""
        model = self.datamodel

        signature = ir.FunctionType(ir.VoidType(), [])
        fn = ir.Function(self.module, signature, name="test_as_data")
        builder = ir.IRBuilder()
        entry_block = fn.append_basic_block()
        builder.position_at_end(entry_block)

        value = ir.Constant(model.get_value_type(), None)

        # Only the raised exception matters; the results are never used.
        with self.assertRaises(NotImplementedError):
            model.as_data(builder, value)
        with self.assertRaises(NotImplementedError):
            model.from_data(builder, value)
|
|
136
|
+
|
|
137
|
+
|
|
138
|
+
class DataModelTester_SupportAsDataMixin(DataModelTester, SupportAsDataMixin):
    """DataModelTester combined with the tests from SupportAsDataMixin."""

    pass
|
|
140
|
+
|
|
141
|
+
|
|
142
|
+
class DataModelTester_NotSupportAsDataMixin(
    DataModelTester, NotSupportAsDataMixin
):
    """DataModelTester combined with the tests from NotSupportAsDataMixin."""

    pass
|
|
146
|
+
|
|
147
|
+
|
|
148
|
+
def test_factory(support_as_data=True):
    """Pick the TestCase base class to use for testing a data model.

    A truthy *support_as_data* selects the variant that exercises
    as_data()/from_data(); otherwise the variant expecting them to raise
    NotImplementedError is returned.
    """
    return (
        DataModelTester_SupportAsDataMixin
        if support_as_data
        else DataModelTester_NotSupportAsDataMixin
    )
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
import sys
|
|
5
|
+
from numba.cuda.utils import redirect_numba_module
|
|
6
|
+
|
|
7
|
+
# Replace this module's entry in sys.modules with whatever
# redirect_numba_module returns for this namespace and the two dotted
# module paths below (one under numba.core, one under numba.cuda).
# NOTE(review): presumably the helper decides which of the two backs this
# module name -- confirm in numba.cuda.utils.
sys.modules[__name__] = redirect_numba_module(
    locals(),
    "numba.core.datamodel.manager",
    "numba.cuda.datamodel.cuda_manager",
)
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
import sys
|
|
5
|
+
from numba.cuda.utils import redirect_numba_module
|
|
6
|
+
|
|
7
|
+
# Replace this module's entry in sys.modules with whatever
# redirect_numba_module returns for this namespace and the two dotted
# module paths below (one under numba.core, one under numba.cuda).
# NOTE(review): presumably the helper decides which of the two backs this
# module name -- confirm in numba.cuda.utils.
sys.modules[__name__] = redirect_numba_module(
    locals(), "numba.core.datamodel.models", "numba.cuda.datamodel.cuda_models"
)
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
import sys
|
|
5
|
+
from numba.cuda.utils import redirect_numba_module
|
|
6
|
+
|
|
7
|
+
# Replace this module's entry in sys.modules with whatever
# redirect_numba_module returns for this namespace and the two dotted
# module paths below (one under numba.core, one under numba.cuda).
# NOTE(review): presumably the helper decides which of the two backs this
# module name -- confirm in numba.cuda.utils.
sys.modules[__name__] = redirect_numba_module(
    locals(), "numba.core.datamodel.packer", "numba.cuda.datamodel.cuda_packer"
)
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
import sys
|
|
5
|
+
from numba.cuda.utils import redirect_numba_module
|
|
6
|
+
|
|
7
|
+
# Replace this module's entry in sys.modules with whatever
# redirect_numba_module returns for this namespace and the two dotted
# module paths below (one under numba.core, one under numba.cuda).
# NOTE(review): presumably the helper decides which of the two backs this
# module name -- confirm in numba.cuda.utils.
sys.modules[__name__] = redirect_numba_module(
    locals(),
    "numba.core.datamodel.registry",
    "numba.cuda.datamodel.cuda_registry",
)
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
import sys
|
|
5
|
+
from numba.cuda.utils import redirect_numba_module
|
|
6
|
+
|
|
7
|
+
# Replace this module's entry in sys.modules with whatever
# redirect_numba_module returns for this namespace and the two dotted
# module paths below (one under numba.core, one under numba.cuda).
# NOTE(review): presumably the helper decides which of the two backs this
# module name -- confirm in numba.cuda.utils.
sys.modules[__name__] = redirect_numba_module(
    locals(),
    "numba.core.datamodel.testing",
    "numba.cuda.datamodel.cuda_testing",
)
|