numba-cuda 0.18.1__py3-none-any.whl → 0.19.1__py3-none-any.whl
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of numba-cuda might be problematic; more details are available via the link on the original release page.
- _numba_cuda_redirector.pth +3 -0
- _numba_cuda_redirector.py +3 -0
- numba_cuda/VERSION +1 -1
- numba_cuda/__init__.py +2 -1
- numba_cuda/_version.py +2 -13
- numba_cuda/numba/cuda/__init__.py +4 -1
- numba_cuda/numba/cuda/_internal/cuda_bf16.py +5 -2
- numba_cuda/numba/cuda/_internal/cuda_fp16.py +4 -1
- numba_cuda/numba/cuda/api.py +5 -7
- numba_cuda/numba/cuda/api_util.py +3 -0
- numba_cuda/numba/cuda/args.py +3 -0
- numba_cuda/numba/cuda/bf16.py +3 -0
- numba_cuda/numba/cuda/cg.py +3 -0
- numba_cuda/numba/cuda/cgutils.py +3 -0
- numba_cuda/numba/cuda/codegen.py +3 -0
- numba_cuda/numba/cuda/compiler.py +10 -4
- numba_cuda/numba/cuda/core/caching.py +3 -0
- numba_cuda/numba/cuda/core/callconv.py +3 -0
- numba_cuda/numba/cuda/core/codegen.py +3 -0
- numba_cuda/numba/cuda/core/compiler.py +3 -0
- numba_cuda/numba/cuda/core/interpreter.py +3595 -0
- numba_cuda/numba/cuda/core/ir_utils.py +2644 -0
- numba_cuda/numba/cuda/core/sigutils.py +58 -0
- numba_cuda/numba/cuda/core/typed_passes.py +3 -0
- numba_cuda/numba/cuda/cuda_paths.py +12 -17
- numba_cuda/numba/cuda/cudadecl.py +4 -1
- numba_cuda/numba/cuda/cudadrv/__init__.py +3 -0
- numba_cuda/numba/cuda/cudadrv/devicearray.py +3 -0
- numba_cuda/numba/cuda/cudadrv/devices.py +3 -0
- numba_cuda/numba/cuda/cudadrv/driver.py +7 -19
- numba_cuda/numba/cuda/cudadrv/drvapi.py +3 -0
- numba_cuda/numba/cuda/cudadrv/dummyarray.py +3 -0
- numba_cuda/numba/cuda/cudadrv/enums.py +3 -0
- numba_cuda/numba/cuda/cudadrv/error.py +4 -0
- numba_cuda/numba/cuda/cudadrv/libs.py +4 -2
- numba_cuda/numba/cuda/cudadrv/linkable_code.py +3 -0
- numba_cuda/numba/cuda/cudadrv/mappings.py +3 -0
- numba_cuda/numba/cuda/cudadrv/ndarray.py +3 -0
- numba_cuda/numba/cuda/cudadrv/nvrtc.py +47 -44
- numba_cuda/numba/cuda/cudadrv/nvvm.py +6 -18
- numba_cuda/numba/cuda/cudadrv/rtapi.py +3 -0
- numba_cuda/numba/cuda/cudadrv/runtime.py +15 -1
- numba_cuda/numba/cuda/cudaimpl.py +3 -0
- numba_cuda/numba/cuda/cudamath.py +4 -1
- numba_cuda/numba/cuda/debuginfo.py +3 -0
- numba_cuda/numba/cuda/decorators.py +7 -3
- numba_cuda/numba/cuda/descriptor.py +3 -0
- numba_cuda/numba/cuda/device_init.py +3 -0
- numba_cuda/numba/cuda/deviceufunc.py +5 -1
- numba_cuda/numba/cuda/dispatcher.py +6 -2
- numba_cuda/numba/cuda/errors.py +10 -0
- numba_cuda/numba/cuda/extending.py +4 -1
- numba_cuda/numba/cuda/flags.py +2 -0
- numba_cuda/numba/cuda/fp16.py +3 -0
- numba_cuda/numba/cuda/initialize.py +4 -0
- numba_cuda/numba/cuda/intrinsic_wrapper.py +3 -0
- numba_cuda/numba/cuda/intrinsics.py +3 -0
- numba_cuda/numba/cuda/itanium_mangler.py +214 -0
- numba_cuda/numba/cuda/kernels/__init__.py +2 -0
- numba_cuda/numba/cuda/kernels/reduction.py +3 -0
- numba_cuda/numba/cuda/kernels/transpose.py +3 -0
- numba_cuda/numba/cuda/libdevice.py +4 -0
- numba_cuda/numba/cuda/libdevicedecl.py +4 -1
- numba_cuda/numba/cuda/libdevicefuncs.py +4 -1
- numba_cuda/numba/cuda/libdeviceimpl.py +3 -0
- numba_cuda/numba/cuda/locks.py +3 -0
- numba_cuda/numba/cuda/lowering.py +53 -16
- numba_cuda/numba/cuda/mathimpl.py +3 -0
- numba_cuda/numba/cuda/memory_management/__init__.py +3 -0
- numba_cuda/numba/cuda/memory_management/memsys.cu +5 -0
- numba_cuda/numba/cuda/memory_management/memsys.cuh +5 -0
- numba_cuda/numba/cuda/memory_management/nrt.cu +5 -0
- numba_cuda/numba/cuda/memory_management/nrt.cuh +5 -0
- numba_cuda/numba/cuda/memory_management/nrt.py +5 -1
- numba_cuda/numba/cuda/models.py +3 -0
- numba_cuda/numba/cuda/nvvmutils.py +3 -0
- numba_cuda/numba/cuda/printimpl.py +3 -0
- numba_cuda/numba/cuda/random.py +3 -0
- numba_cuda/numba/cuda/reshape_funcs.cu +5 -0
- numba_cuda/numba/cuda/serialize.py +3 -0
- numba_cuda/numba/cuda/simulator/__init__.py +3 -0
- numba_cuda/numba/cuda/simulator/_internal/__init__.py +3 -0
- numba_cuda/numba/cuda/simulator/_internal/cuda_bf16.py +2 -0
- numba_cuda/numba/cuda/simulator/api.py +4 -1
- numba_cuda/numba/cuda/simulator/bf16.py +3 -0
- numba_cuda/numba/cuda/simulator/compiler.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/__init__.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/devicearray.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/devices.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/driver.py +3 -7
- numba_cuda/numba/cuda/simulator/cudadrv/drvapi.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/dummyarray.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/error.py +4 -0
- numba_cuda/numba/cuda/simulator/cudadrv/libs.py +4 -0
- numba_cuda/numba/cuda/simulator/cudadrv/linkable_code.py +4 -0
- numba_cuda/numba/cuda/simulator/cudadrv/nvrtc.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/nvvm.py +3 -0
- numba_cuda/numba/cuda/simulator/cudadrv/runtime.py +3 -0
- numba_cuda/numba/cuda/simulator/dispatcher.py +4 -0
- numba_cuda/numba/cuda/simulator/kernel.py +3 -0
- numba_cuda/numba/cuda/simulator/kernelapi.py +3 -0
- numba_cuda/numba/cuda/simulator/memory_management/__init__.py +3 -0
- numba_cuda/numba/cuda/simulator/memory_management/nrt.py +3 -0
- numba_cuda/numba/cuda/simulator/reduction.py +3 -0
- numba_cuda/numba/cuda/simulator/vector_types.py +3 -0
- numba_cuda/numba/cuda/simulator_init.py +3 -0
- numba_cuda/numba/cuda/stubs.py +3 -0
- numba_cuda/numba/cuda/target.py +4 -2
- numba_cuda/numba/cuda/testing.py +7 -6
- numba_cuda/numba/cuda/tests/__init__.py +3 -0
- numba_cuda/numba/cuda/tests/complex_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/core/serialize_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/core/test_itanium_mangler.py +83 -0
- numba_cuda/numba/cuda/tests/core/test_serialize.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/__init__.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_array_attr.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_context_stack.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_array_slicing.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_auto_context.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_devicerecord.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_driver.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_libraries.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_memory.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_cuda_ndarray.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_deallocations.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_detect.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_emm_plugins.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_events.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_host_alloc.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_init.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_inline_ptx.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_is_fp16.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_linker.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_managed_alloc.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_module_callbacks.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_mvc.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_nvjitlink.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_nvrtc.py +7 -6
- numba_cuda/numba/cuda/tests/cudadrv/test_nvvm_driver.py +3 -4
- numba_cuda/numba/cuda/tests/cudadrv/test_pinned.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_profiler.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_ptds.py +4 -1
- numba_cuda/numba/cuda/tests/cudadrv/test_reset_device.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_runtime.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_select_device.py +3 -0
- numba_cuda/numba/cuda/tests/cudadrv/test_streams.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/__init__.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/cache_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/cache_with_cpu_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/cg_cache_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/extensions_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/recursion_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_alignment.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array_alignment.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array_args.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_array_methods.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_atomics.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_bfloat16.py +4 -3
- numba_cuda/numba/cuda/tests/cudapy/test_bfloat16_bindings.py +4 -3
- numba_cuda/numba/cuda/tests/cudapy/test_blackscholes.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_boolean.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_caching.py +149 -3
- numba_cuda/numba/cuda/tests/cudapy/test_casting.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cffi.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_compiler.py +3 -4
- numba_cuda/numba/cuda/tests/cudapy/test_complex.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_complex_kernel.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_const_string.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_constmem.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cooperative_groups.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_cuda_array_interface.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_cuda_jit_no_types.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_datetime.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_debug.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_debuginfo.py +23 -284
- numba_cuda/numba/cuda/tests/cudapy/test_debuginfo_types.py +476 -0
- numba_cuda/numba/cuda/tests/cudapy/test_device_func.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_dispatcher.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_enums.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_errors.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_exception.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_extending.py +4 -6
- numba_cuda/numba/cuda/tests/cudapy/test_fastmath.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_forall.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_freevar.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_frexp_ldexp.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_globals.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_gufunc.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scalar.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scheduling.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_idiv.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_inline.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_inspect.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_intrinsics.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_ipc.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_ir_utils.py +298 -0
- numba_cuda/numba/cuda/tests/cudapy/test_iterators.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_lang.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_laplace.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_libdevice.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_lineinfo.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_localmem.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_mandel.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_math.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_matmul.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_minmax.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_montecarlo.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_multigpu.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_multiprocessing.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_multithreads.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_nondet.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_operator.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_optimization.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_overload.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_powi.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_print.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_py2_div_issue.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_random.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_record_dtype.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_recursion.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_reduction.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_retrieve_autoconverted_arrays.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_serialize.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_slicing.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_sm.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_sm_creation.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_stream_api.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_sync.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_transpose.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_ufuncs.py +4 -1
- numba_cuda/numba/cuda/tests/cudapy/test_userexc.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vector_type.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_complex.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_decor.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_device.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_vectorize_scalar_arg.py +3 -0
- numba_cuda/numba/cuda/tests/cudapy/test_warning.py +8 -1
- numba_cuda/numba/cuda/tests/cudapy/test_warp_ops.py +3 -0
- numba_cuda/numba/cuda/tests/cudasim/__init__.py +3 -0
- numba_cuda/numba/cuda/tests/cudasim/support.py +3 -0
- numba_cuda/numba/cuda/tests/cudasim/test_cudasim_issues.py +3 -0
- numba_cuda/numba/cuda/tests/data/__init__.py +2 -0
- numba_cuda/numba/cuda/tests/data/cta_barrier.cu +5 -0
- numba_cuda/numba/cuda/tests/data/cuda_include.cu +5 -0
- numba_cuda/numba/cuda/tests/data/error.cu +5 -0
- numba_cuda/numba/cuda/tests/data/include/add.cuh +5 -0
- numba_cuda/numba/cuda/tests/data/jitlink.cu +5 -0
- numba_cuda/numba/cuda/tests/data/warn.cu +5 -0
- numba_cuda/numba/cuda/tests/doc_examples/__init__.py +3 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/__init__.py +2 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/functions.cu +5 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/include/mul.cuh +5 -0
- numba_cuda/numba/cuda/tests/doc_examples/ffi/saxpy.cu +5 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_cg.py +3 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_cpointer.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_cpu_gpu_compat.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_ffi.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_laplace.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_matmul.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_montecarlo.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_random.py +3 -0
- numba_cuda/numba/cuda/tests/doc_examples/test_reduction.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_sessionize.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_ufunc.py +4 -1
- numba_cuda/numba/cuda/tests/doc_examples/test_vecadd.py +4 -1
- numba_cuda/numba/cuda/tests/enum_usecases.py +3 -0
- numba_cuda/numba/cuda/tests/nocuda/__init__.py +3 -0
- numba_cuda/numba/cuda/tests/nocuda/test_dummyarray.py +3 -0
- numba_cuda/numba/cuda/tests/nocuda/test_function_resolution.py +3 -0
- numba_cuda/numba/cuda/tests/nocuda/test_import.py +4 -1
- numba_cuda/numba/cuda/tests/nocuda/test_library_lookup.py +3 -0
- numba_cuda/numba/cuda/tests/nocuda/test_nvvm.py +3 -0
- numba_cuda/numba/cuda/tests/nrt/__init__.py +3 -0
- numba_cuda/numba/cuda/tests/nrt/test_nrt.py +5 -2
- numba_cuda/numba/cuda/tests/nrt/test_nrt_refct.py +4 -1
- numba_cuda/numba/cuda/tests/support.py +755 -0
- numba_cuda/numba/cuda/tests/test_binary_generation/Makefile +6 -3
- numba_cuda/numba/cuda/tests/test_binary_generation/generate_raw_ltoir.py +6 -2
- numba_cuda/numba/cuda/tests/test_binary_generation/nrt_extern.cu +5 -0
- numba_cuda/numba/cuda/tests/test_binary_generation/test_device_functions.cu +5 -0
- numba_cuda/numba/cuda/tests/test_binary_generation/undefined_extern.cu +5 -0
- numba_cuda/numba/cuda/types.py +3 -0
- numba_cuda/numba/cuda/typing/__init__.py +11 -0
- numba_cuda/numba/cuda/typing/templates.py +1448 -0
- numba_cuda/numba/cuda/ufuncs.py +3 -0
- numba_cuda/numba/cuda/utils.py +3 -0
- numba_cuda/numba/cuda/vector_types.py +6 -3
- numba_cuda/numba/cuda/vectorizers.py +3 -0
- {numba_cuda-0.18.1.dist-info → numba_cuda-0.19.1.dist-info}/METADATA +25 -29
- numba_cuda-0.19.1.dist-info/RECORD +302 -0
- {numba_cuda-0.18.1.dist-info → numba_cuda-0.19.1.dist-info}/licenses/LICENSE +1 -0
- numba_cuda-0.19.1.dist-info/licenses/LICENSE.numba +24 -0
- numba_cuda/numba/cuda/include/11/cuda_bf16.h +0 -3749
- numba_cuda/numba/cuda/include/11/cuda_bf16.hpp +0 -2683
- numba_cuda/numba/cuda/include/11/cuda_fp16.h +0 -3794
- numba_cuda/numba/cuda/include/11/cuda_fp16.hpp +0 -2614
- numba_cuda-0.18.1.dist-info/RECORD +0 -296
- {numba_cuda-0.18.1.dist-info → numba_cuda-0.19.1.dist-info}/WHEEL +0 -0
- {numba_cuda-0.18.1.dist-info → numba_cuda-0.19.1.dist-info}/top_level.txt +0 -0
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
"""
|
|
2
5
|
The Device Array API is not implemented in the simulator. This module provides
|
|
3
6
|
stubs to allow tests to import correctly.
|
|
@@ -1,10 +1,11 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
"""
|
|
2
5
|
Most of the driver API is unsupported in the simulator, but some stubs are
|
|
3
6
|
provided to allow tests to import correctly.
|
|
4
7
|
"""
|
|
5
8
|
|
|
6
|
-
from numba import config
|
|
7
|
-
|
|
8
9
|
|
|
9
10
|
def device_memset(dst, val, size, stream=0):
|
|
10
11
|
dst.view("u1")[:size].fill(bytes([val])[0])
|
|
@@ -63,11 +64,6 @@ def launch_kernel(*args, **kwargs):
|
|
|
63
64
|
|
|
64
65
|
USE_NV_BINDING = False
|
|
65
66
|
|
|
66
|
-
PyNvJitLinker = None
|
|
67
|
-
|
|
68
|
-
if config.ENABLE_CUDASIM:
|
|
69
|
-
config.CUDA_ENABLE_PYNVJITLINK = False
|
|
70
|
-
|
|
71
67
|
|
|
72
68
|
def _have_nvjitlink():
|
|
73
69
|
return False
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
# Dummy arrays are not implemented in the simulator. This file allows the dummy
|
|
2
5
|
# array tests to be imported, but they are skipped on the simulator.
|
|
3
6
|
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
# We import * from simulator here because * is imported from simulator_init by
|
|
2
5
|
# numba.cuda.__init__.
|
|
3
6
|
from .simulator import * # noqa: F403, F401
|
numba_cuda/numba/cuda/stubs.py
CHANGED
numba_cuda/numba/cuda/target.py
CHANGED
|
@@ -1,13 +1,15 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import re
|
|
2
5
|
from functools import cached_property
|
|
3
6
|
import llvmlite.binding as ll
|
|
4
7
|
from llvmlite import ir
|
|
5
8
|
import warnings
|
|
6
|
-
from numba.cuda import cgutils
|
|
9
|
+
from numba.cuda import cgutils, itanium_mangler
|
|
7
10
|
from numba.core import (
|
|
8
11
|
compiler,
|
|
9
12
|
config,
|
|
10
|
-
itanium_mangler,
|
|
11
13
|
targetconfig,
|
|
12
14
|
types,
|
|
13
15
|
typing,
|
numba_cuda/numba/cuda/testing.py
CHANGED
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import os
|
|
2
5
|
import platform
|
|
3
6
|
import shutil
|
|
@@ -8,7 +11,7 @@ from numba.cuda.cuda_paths import get_conda_ctk
|
|
|
8
11
|
from numba.cuda.cudadrv import driver, devices, libs
|
|
9
12
|
from numba.cuda.dispatcher import CUDADispatcher
|
|
10
13
|
from numba.core import config
|
|
11
|
-
from numba.tests.support import TestCase
|
|
14
|
+
from numba.cuda.tests.support import TestCase
|
|
12
15
|
from pathlib import Path
|
|
13
16
|
|
|
14
17
|
from typing import Iterable, Union
|
|
@@ -154,7 +157,6 @@ class CUDATestCase(TestCase):
|
|
|
154
157
|
matcher.stderr = StringIO()
|
|
155
158
|
result = matcher.run()
|
|
156
159
|
if result != 0:
|
|
157
|
-
dump_instructions = ""
|
|
158
160
|
if self._dump_failed_filechecks:
|
|
159
161
|
dump_directory = Path(
|
|
160
162
|
datetime.now().strftime("numba-ir-%Y_%m_%d_%H_%M_%S")
|
|
@@ -172,13 +174,12 @@ class CUDATestCase(TestCase):
|
|
|
172
174
|
):
|
|
173
175
|
_ = ir_file.write(ir_content + "\n")
|
|
174
176
|
_ = checks_file.write(check_patterns)
|
|
175
|
-
dump_instructions = f"Reproduce with:\n\nfilecheck --check-prefixes={','.join(check_prefixes)} {checks_dump} --input-file
|
|
177
|
+
dump_instructions = f"Reproduce with:\n\nfilecheck --check-prefixes={','.join(check_prefixes)} {checks_dump} --input-file {ir_dump}"
|
|
178
|
+
else:
|
|
179
|
+
dump_instructions = "Rerun with --dump-failed-filechecks to generate a reproducer."
|
|
176
180
|
|
|
177
181
|
self.fail(
|
|
178
182
|
f"FileCheck failed:\n{matcher.stderr.getvalue()}\n\n"
|
|
179
|
-
+ f"Check prefixes:\n{check_prefixes}\n\n"
|
|
180
|
-
+ f"Check patterns:\n{check_patterns}\n"
|
|
181
|
-
+ f"IR:\n{ir_content}\n\n"
|
|
182
183
|
+ dump_instructions
|
|
183
184
|
)
|
|
184
185
|
|
|
@@ -0,0 +1,83 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
4
|
+
# -*- coding: utf-8 -*-
|
|
5
|
+
from numba import int32, int64, uint32, uint64, float32, float64
|
|
6
|
+
from numba.core.types import range_iter32_type
|
|
7
|
+
from numba.cuda import itanium_mangler
|
|
8
|
+
import unittest
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
class TestItaniumManager(unittest.TestCase):
|
|
12
|
+
def test_ident(self):
|
|
13
|
+
got = itanium_mangler.mangle_identifier("apple")
|
|
14
|
+
expect = "5apple"
|
|
15
|
+
self.assertEqual(expect, got)
|
|
16
|
+
|
|
17
|
+
got = itanium_mangler.mangle_identifier("ap_ple")
|
|
18
|
+
expect = "6ap_ple"
|
|
19
|
+
self.assertEqual(expect, got)
|
|
20
|
+
|
|
21
|
+
got = itanium_mangler.mangle_identifier("apple213")
|
|
22
|
+
expect = "8apple213"
|
|
23
|
+
self.assertEqual(expect, got)
|
|
24
|
+
|
|
25
|
+
def test_types(self):
|
|
26
|
+
got = itanium_mangler.mangle_type(int32)
|
|
27
|
+
expect = "i"
|
|
28
|
+
self.assertEqual(expect, got)
|
|
29
|
+
|
|
30
|
+
got = itanium_mangler.mangle_type(int64)
|
|
31
|
+
expect = "x"
|
|
32
|
+
self.assertEqual(expect, got)
|
|
33
|
+
|
|
34
|
+
got = itanium_mangler.mangle_type(uint32)
|
|
35
|
+
expect = "j"
|
|
36
|
+
self.assertEqual(expect, got)
|
|
37
|
+
|
|
38
|
+
got = itanium_mangler.mangle_type(uint64)
|
|
39
|
+
expect = "y"
|
|
40
|
+
self.assertEqual(expect, got)
|
|
41
|
+
|
|
42
|
+
got = itanium_mangler.mangle_type(float32)
|
|
43
|
+
expect = "f"
|
|
44
|
+
self.assertEqual(expect, got)
|
|
45
|
+
|
|
46
|
+
got = itanium_mangler.mangle_type(float64)
|
|
47
|
+
expect = "d"
|
|
48
|
+
self.assertEqual(expect, got)
|
|
49
|
+
|
|
50
|
+
def test_function(self):
|
|
51
|
+
got = itanium_mangler.mangle("what", [int32, float32])
|
|
52
|
+
expect = "_Z4whatif"
|
|
53
|
+
self.assertEqual(expect, got)
|
|
54
|
+
|
|
55
|
+
got = itanium_mangler.mangle(
|
|
56
|
+
"a_little_brown_fox", [uint64, uint32, float64]
|
|
57
|
+
)
|
|
58
|
+
expect = "_Z18a_little_brown_foxyjd"
|
|
59
|
+
self.assertEqual(expect, got)
|
|
60
|
+
|
|
61
|
+
def test_custom_type(self):
|
|
62
|
+
got = itanium_mangler.mangle_type(range_iter32_type)
|
|
63
|
+
name = str(range_iter32_type)
|
|
64
|
+
expect = "{n}{name}".format(n=len(name), name=name)
|
|
65
|
+
self.assertEqual(expect, got)
|
|
66
|
+
|
|
67
|
+
def test_mangle_literal(self):
|
|
68
|
+
# check int
|
|
69
|
+
got = itanium_mangler.mangle_value(123)
|
|
70
|
+
expect = "Li123E"
|
|
71
|
+
self.assertEqual(expect, got)
|
|
72
|
+
# check float (not handled using standard)
|
|
73
|
+
got = itanium_mangler.mangle_value(12.3)
|
|
74
|
+
self.assertRegex(got, r"^\d+_12_[0-9a-z][0-9a-z]3$")
|
|
75
|
+
|
|
76
|
+
def test_mangle_unicode(self):
|
|
77
|
+
name = "f∂ƒ©z"
|
|
78
|
+
got = itanium_mangler.mangle_identifier(name)
|
|
79
|
+
self.assertRegex(got, r"^\d+f(_[a-z0-9][a-z0-9])+z$")
|
|
80
|
+
|
|
81
|
+
|
|
82
|
+
if __name__ == "__main__":
|
|
83
|
+
unittest.main()
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
from numba.cuda.testing import unittest
|
|
2
5
|
from numba.cuda.testing import skip_on_cudasim, skip_unless_conda_cudatoolkit
|
|
3
6
|
from numba.misc.findlib import find_lib
|
|
@@ -1,10 +1,13 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import itertools
|
|
2
5
|
import numpy as np
|
|
3
6
|
from numba.cuda.cudadrv import devicearray
|
|
4
7
|
from numba import cuda
|
|
5
8
|
from numba.cuda.testing import unittest, CUDATestCase
|
|
6
9
|
from numba.cuda.testing import skip_on_cudasim
|
|
7
|
-
from numba.tests.support import IS_NUMPY_2
|
|
10
|
+
from numba.cuda.tests.support import IS_NUMPY_2
|
|
8
11
|
|
|
9
12
|
|
|
10
13
|
class TestCudaNDArray(CUDATestCase):
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
from contextlib import contextmanager
|
|
2
5
|
|
|
3
6
|
import numpy as np
|
|
@@ -9,7 +12,7 @@ from numba.cuda.testing import (
|
|
|
9
12
|
skip_if_external_memmgr,
|
|
10
13
|
CUDATestCase,
|
|
11
14
|
)
|
|
12
|
-
from numba.tests.support import captured_stderr
|
|
15
|
+
from numba.cuda.tests.support import captured_stderr
|
|
13
16
|
from numba.core import config
|
|
14
17
|
|
|
15
18
|
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import os
|
|
2
5
|
import sys
|
|
3
6
|
import subprocess
|
|
@@ -9,7 +12,7 @@ from numba.cuda.testing import (
|
|
|
9
12
|
skip_on_cudasim,
|
|
10
13
|
skip_under_cuda_memcheck,
|
|
11
14
|
)
|
|
12
|
-
from numba.tests.support import captured_stdout
|
|
15
|
+
from numba.cuda.tests.support import captured_stdout
|
|
13
16
|
|
|
14
17
|
|
|
15
18
|
class TestCudaDetect(CUDATestCase):
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import ctypes
|
|
2
5
|
import numpy as np
|
|
3
6
|
import weakref
|
|
@@ -5,7 +8,7 @@ import weakref
|
|
|
5
8
|
from numba import cuda
|
|
6
9
|
from numba.core import config
|
|
7
10
|
from numba.cuda.testing import unittest, CUDATestCase, skip_on_cudasim
|
|
8
|
-
from numba.tests.support import linux_only
|
|
11
|
+
from numba.cuda.tests.support import linux_only
|
|
9
12
|
|
|
10
13
|
if not config.ENABLE_CUDASIM:
|
|
11
14
|
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import numpy as np
|
|
2
5
|
import warnings
|
|
3
6
|
from numba import config
|
|
@@ -6,7 +9,7 @@ from numba.cuda.testing import skip_on_cudasim, skip_if_cuda_includes_missing
|
|
|
6
9
|
from numba.cuda.testing import CUDATestCase, test_data_dir
|
|
7
10
|
from numba.cuda.cudadrv.driver import CudaAPIError, _Linker, LinkerError
|
|
8
11
|
from numba.cuda import require_context
|
|
9
|
-
from numba.tests.support import ignore_internal_warnings
|
|
12
|
+
from numba.cuda.tests.support import ignore_internal_warnings
|
|
10
13
|
from numba import cuda, void, float64, int64, int32, typeof, float32
|
|
11
14
|
from numba.cuda.cudadrv.error import NvrtcError
|
|
12
15
|
|
|
@@ -1,10 +1,13 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import numpy as np
|
|
2
5
|
from ctypes import byref, c_size_t
|
|
3
6
|
from numba.cuda.cudadrv.driver import device_memset, driver, USE_NV_BINDING
|
|
4
7
|
from numba import cuda
|
|
5
8
|
from numba.cuda.testing import unittest, ContextResettingTestCase
|
|
6
9
|
from numba.cuda.testing import skip_on_cudasim, skip_on_arm
|
|
7
|
-
from numba.tests.support import linux_only
|
|
10
|
+
from numba.cuda.tests.support import linux_only
|
|
8
11
|
|
|
9
12
|
|
|
10
13
|
@skip_on_cudasim("CUDA Driver API unsupported in the simulator")
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
import multiprocessing as mp
|
|
2
5
|
import traceback
|
|
3
6
|
from numba.cuda.testing import unittest, CUDATestCase
|
|
@@ -6,7 +9,7 @@ from numba.cuda.testing import (
|
|
|
6
9
|
skip_under_cuda_memcheck,
|
|
7
10
|
skip_if_mvc_libraries_unavailable,
|
|
8
11
|
)
|
|
9
|
-
from numba.tests.support import linux_only
|
|
12
|
+
from numba.cuda.tests.support import linux_only
|
|
10
13
|
|
|
11
14
|
|
|
12
15
|
def child_test():
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
from numba.cuda.testing import unittest
|
|
2
5
|
from numba.cuda.testing import skip_on_cudasim
|
|
3
6
|
from numba.cuda.testing import CUDATestCase
|
|
@@ -1,3 +1,6 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: BSD-2-Clause
|
|
3
|
+
|
|
1
4
|
from numba.cuda.cudadrv import nvrtc
|
|
2
5
|
from numba.cuda.testing import skip_on_cudasim
|
|
3
6
|
|
|
@@ -13,13 +16,11 @@ class TestArchOption(unittest.TestCase):
|
|
|
13
16
|
self.assertEqual(nvrtc.get_arch_option(8, 5), "compute_80")
|
|
14
17
|
self.assertEqual(nvrtc.get_arch_option(9, 1), "compute_90")
|
|
15
18
|
# Test known arch.
|
|
16
|
-
|
|
17
|
-
for
|
|
18
|
-
self.assertEqual(
|
|
19
|
-
nvrtc.get_arch_option(*arch), "compute_%d%d" % arch
|
|
20
|
-
)
|
|
19
|
+
supported_ccs = nvrtc.get_supported_ccs()
|
|
20
|
+
for cc in supported_ccs:
|
|
21
|
+
self.assertEqual(nvrtc.get_arch_option(*cc), "compute_%d%d" % cc)
|
|
21
22
|
self.assertEqual(
|
|
22
|
-
nvrtc.get_arch_option(1000, 0), "compute_%d%d" %
|
|
23
|
+
nvrtc.get_arch_option(1000, 0), "compute_%d%d" % supported_ccs[-1]
|
|
23
24
|
)
|
|
24
25
|
|
|
25
26
|
|