PyPI - numba-cuda - Versions diffs - 0.8.1__py3-none-any.whl → 0.10.0__py3-none-any.whl - Mend

numba-cuda 0.8.1 (py3-none-any.whl) → 0.10.0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (237)

_numba_cuda_redirector.py +17 -13
numba_cuda/VERSION +1 -1
numba_cuda/_version.py +4 -1
numba_cuda/numba/cuda/__init__.py +6 -2
numba_cuda/numba/cuda/api.py +129 -86
numba_cuda/numba/cuda/api_util.py +3 -3
numba_cuda/numba/cuda/args.py +12 -16
numba_cuda/numba/cuda/cg.py +6 -6
numba_cuda/numba/cuda/codegen.py +74 -43
numba_cuda/numba/cuda/compiler.py +246 -114
numba_cuda/numba/cuda/cpp_function_wrappers.cu +1 -2
numba_cuda/numba/cuda/cuda_bf16.py +5155 -0
numba_cuda/numba/cuda/cuda_paths.py +293 -99
numba_cuda/numba/cuda/cudadecl.py +93 -79
numba_cuda/numba/cuda/cudadrv/__init__.py +3 -1
numba_cuda/numba/cuda/cudadrv/devicearray.py +185 -135
numba_cuda/numba/cuda/cudadrv/devices.py +16 -11
numba_cuda/numba/cuda/cudadrv/driver.py +460 -297
numba_cuda/numba/cuda/cudadrv/drvapi.py +241 -207
numba_cuda/numba/cuda/cudadrv/dummyarray.py +66 -54
numba_cuda/numba/cuda/cudadrv/enums.py +1 -1
numba_cuda/numba/cuda/cudadrv/error.py +6 -2
numba_cuda/numba/cuda/cudadrv/libs.py +67 -63
numba_cuda/numba/cuda/cudadrv/linkable_code.py +27 -3
numba_cuda/numba/cuda/cudadrv/mappings.py +16 -14
numba_cuda/numba/cuda/cudadrv/nvrtc.py +146 -30
numba_cuda/numba/cuda/cudadrv/nvvm.py +296 -161
numba_cuda/numba/cuda/cudadrv/rtapi.py +1 -1
numba_cuda/numba/cuda/cudadrv/runtime.py +20 -8
numba_cuda/numba/cuda/cudaimpl.py +296 -275
numba_cuda/numba/cuda/cudamath.py +1 -1
numba_cuda/numba/cuda/debuginfo.py +99 -7
numba_cuda/numba/cuda/decorators.py +87 -45
numba_cuda/numba/cuda/descriptor.py +1 -1
numba_cuda/numba/cuda/device_init.py +68 -18
numba_cuda/numba/cuda/deviceufunc.py +143 -98
numba_cuda/numba/cuda/dispatcher.py +300 -213
numba_cuda/numba/cuda/errors.py +13 -10
numba_cuda/numba/cuda/extending.py +55 -1
numba_cuda/numba/cuda/include/11/cuda_bf16.h +3749 -0
numba_cuda/numba/cuda/include/11/cuda_bf16.hpp +2683 -0
numba_cuda/numba/cuda/{cuda_fp16.h → include/11/cuda_fp16.h} +1090 -927
numba_cuda/numba/cuda/{cuda_fp16.hpp → include/11/cuda_fp16.hpp} +468 -319
numba_cuda/numba/cuda/include/12/cuda_bf16.h +5118 -0
numba_cuda/numba/cuda/include/12/cuda_bf16.hpp +3865 -0
numba_cuda/numba/cuda/include/12/cuda_fp16.h +5363 -0
numba_cuda/numba/cuda/include/12/cuda_fp16.hpp +3483 -0
numba_cuda/numba/cuda/initialize.py +5 -3
numba_cuda/numba/cuda/intrinsic_wrapper.py +0 -39
numba_cuda/numba/cuda/intrinsics.py +203 -28
numba_cuda/numba/cuda/kernels/reduction.py +13 -13
numba_cuda/numba/cuda/kernels/transpose.py +3 -6
numba_cuda/numba/cuda/libdevice.py +317 -317
numba_cuda/numba/cuda/libdeviceimpl.py +3 -2
numba_cuda/numba/cuda/locks.py +16 -0
numba_cuda/numba/cuda/lowering.py +43 -0
numba_cuda/numba/cuda/mathimpl.py +62 -57
numba_cuda/numba/cuda/models.py +1 -5
numba_cuda/numba/cuda/nvvmutils.py +103 -88
numba_cuda/numba/cuda/printimpl.py +9 -5
numba_cuda/numba/cuda/random.py +46 -36
numba_cuda/numba/cuda/reshape_funcs.cu +1 -1
numba_cuda/numba/cuda/runtime/__init__.py +1 -1
numba_cuda/numba/cuda/runtime/memsys.cu +1 -1
numba_cuda/numba/cuda/runtime/memsys.cuh +1 -1
numba_cuda/numba/cuda/runtime/nrt.cu +3 -3
numba_cuda/numba/cuda/runtime/nrt.py +48 -43
numba_cuda/numba/cuda/simulator/__init__.py +22 -12
numba_cuda/numba/cuda/simulator/api.py +38 -22
numba_cuda/numba/cuda/simulator/compiler.py +2 -2
numba_cuda/numba/cuda/simulator/cudadrv/__init__.py +8 -2
numba_cuda/numba/cuda/simulator/cudadrv/devicearray.py +63 -55
numba_cuda/numba/cuda/simulator/cudadrv/devices.py +13 -11
numba_cuda/numba/cuda/simulator/cudadrv/driver.py +5 -5
numba_cuda/numba/cuda/simulator/cudadrv/drvapi.py +2 -2
numba_cuda/numba/cuda/simulator/cudadrv/libs.py +1 -1
numba_cuda/numba/cuda/simulator/cudadrv/nvvm.py +3 -3
numba_cuda/numba/cuda/simulator/cudadrv/runtime.py +3 -3
numba_cuda/numba/cuda/simulator/kernel.py +43 -34
numba_cuda/numba/cuda/simulator/kernelapi.py +31 -26
numba_cuda/numba/cuda/simulator/reduction.py +1 -0
numba_cuda/numba/cuda/simulator/vector_types.py +13 -9
numba_cuda/numba/cuda/simulator_init.py +2 -4
numba_cuda/numba/cuda/stubs.py +134 -108
numba_cuda/numba/cuda/target.py +92 -47
numba_cuda/numba/cuda/testing.py +24 -19
numba_cuda/numba/cuda/tests/__init__.py +14 -12
numba_cuda/numba/cuda/tests/cudadrv/test_array_attr.py +16 -17
numba_cuda/numba/cuda/tests/cudadrv/test_context_stack.py +7 -7
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_array_slicing.py +73 -54
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_auto_context.py +1 -1
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_devicerecord.py +48 -50
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_driver.py +47 -29
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_libraries.py +3 -3
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_memory.py +19 -19
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_ndarray.py +108 -103
numba_cuda/numba/cuda/tests/cudadrv/test_deallocations.py +20 -11
numba_cuda/numba/cuda/tests/cudadrv/test_detect.py +20 -17
numba_cuda/numba/cuda/tests/cudadrv/test_emm_plugins.py +8 -6
numba_cuda/numba/cuda/tests/cudadrv/test_events.py +1 -1
numba_cuda/numba/cuda/tests/cudadrv/test_host_alloc.py +8 -7
numba_cuda/numba/cuda/tests/cudadrv/test_init.py +13 -13
numba_cuda/numba/cuda/tests/cudadrv/test_inline_ptx.py +12 -9
numba_cuda/numba/cuda/tests/cudadrv/test_linker.py +36 -31
numba_cuda/numba/cuda/tests/cudadrv/test_managed_alloc.py +8 -7
numba_cuda/numba/cuda/tests/cudadrv/test_module_callbacks.py +294 -0
numba_cuda/numba/cuda/tests/cudadrv/test_mvc.py +10 -7
numba_cuda/numba/cuda/tests/cudadrv/test_nvjitlink.py +24 -15
numba_cuda/numba/cuda/tests/cudadrv/test_nvvm_driver.py +43 -41
numba_cuda/numba/cuda/tests/cudadrv/test_pinned.py +4 -5
numba_cuda/numba/cuda/tests/cudadrv/test_profiler.py +2 -2
numba_cuda/numba/cuda/tests/cudadrv/test_ptds.py +28 -17
numba_cuda/numba/cuda/tests/cudadrv/test_reset_device.py +1 -2
numba_cuda/numba/cuda/tests/cudadrv/test_runtime.py +22 -14
numba_cuda/numba/cuda/tests/cudadrv/test_select_device.py +1 -1
numba_cuda/numba/cuda/tests/cudadrv/test_streams.py +4 -3
numba_cuda/numba/cuda/tests/cudapy/cache_usecases.py +10 -4
numba_cuda/numba/cuda/tests/cudapy/cache_with_cpu_usecases.py +1 -0
numba_cuda/numba/cuda/tests/cudapy/extensions_usecases.py +10 -7
numba_cuda/numba/cuda/tests/cudapy/jitlink.ptx +0 -2
numba_cuda/numba/cuda/tests/cudapy/recursion_usecases.py +1 -0
numba_cuda/numba/cuda/tests/cudapy/test_alignment.py +6 -5
numba_cuda/numba/cuda/tests/cudapy/test_array.py +52 -42
numba_cuda/numba/cuda/tests/cudapy/test_array_args.py +5 -6
numba_cuda/numba/cuda/tests/cudapy/test_array_methods.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_atomics.py +501 -304
numba_cuda/numba/cuda/tests/cudapy/test_bfloat16_bindings.py +257 -0
numba_cuda/numba/cuda/tests/cudapy/test_blackscholes.py +59 -23
numba_cuda/numba/cuda/tests/cudapy/test_boolean.py +3 -3
numba_cuda/numba/cuda/tests/cudapy/test_caching.py +50 -37
numba_cuda/numba/cuda/tests/cudapy/test_casting.py +29 -24
numba_cuda/numba/cuda/tests/cudapy/test_cffi.py +11 -6
numba_cuda/numba/cuda/tests/cudapy/test_compiler.py +84 -50
numba_cuda/numba/cuda/tests/cudapy/test_complex.py +144 -73
numba_cuda/numba/cuda/tests/cudapy/test_complex_kernel.py +2 -2
numba_cuda/numba/cuda/tests/cudapy/test_const_string.py +37 -27
numba_cuda/numba/cuda/tests/cudapy/test_constmem.py +43 -45
numba_cuda/numba/cuda/tests/cudapy/test_cooperative_groups.py +21 -14
numba_cuda/numba/cuda/tests/cudapy/test_cuda_array_interface.py +60 -55
numba_cuda/numba/cuda/tests/cudapy/test_cuda_jit_no_types.py +3 -2
numba_cuda/numba/cuda/tests/cudapy/test_datetime.py +26 -22
numba_cuda/numba/cuda/tests/cudapy/test_debug.py +29 -27
numba_cuda/numba/cuda/tests/cudapy/test_debuginfo.py +77 -28
numba_cuda/numba/cuda/tests/cudapy/test_device_func.py +52 -45
numba_cuda/numba/cuda/tests/cudapy/test_dispatcher.py +55 -43
numba_cuda/numba/cuda/tests/cudapy/test_enums.py +24 -7
numba_cuda/numba/cuda/tests/cudapy/test_errors.py +30 -15
numba_cuda/numba/cuda/tests/cudapy/test_exception.py +11 -12
numba_cuda/numba/cuda/tests/cudapy/test_extending.py +21 -12
numba_cuda/numba/cuda/tests/cudapy/test_fastmath.py +77 -66
numba_cuda/numba/cuda/tests/cudapy/test_forall.py +5 -3
numba_cuda/numba/cuda/tests/cudapy/test_freevar.py +5 -3
numba_cuda/numba/cuda/tests/cudapy/test_frexp_ldexp.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_globals.py +3 -5
numba_cuda/numba/cuda/tests/cudapy/test_gufunc.py +144 -126
numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scalar.py +23 -18
numba_cuda/numba/cuda/tests/cudapy/test_gufunc_scheduling.py +16 -22
numba_cuda/numba/cuda/tests/cudapy/test_idiv.py +1 -3
numba_cuda/numba/cuda/tests/cudapy/test_inline.py +59 -0
numba_cuda/numba/cuda/tests/cudapy/test_inspect.py +29 -20
numba_cuda/numba/cuda/tests/cudapy/test_intrinsics.py +147 -99
numba_cuda/numba/cuda/tests/cudapy/test_ipc.py +50 -36
numba_cuda/numba/cuda/tests/cudapy/test_iterators.py +1 -2
numba_cuda/numba/cuda/tests/cudapy/test_lang.py +4 -4
numba_cuda/numba/cuda/tests/cudapy/test_laplace.py +7 -7
numba_cuda/numba/cuda/tests/cudapy/test_libdevice.py +24 -20
numba_cuda/numba/cuda/tests/cudapy/test_lineinfo.py +36 -31
numba_cuda/numba/cuda/tests/cudapy/test_localmem.py +13 -13
numba_cuda/numba/cuda/tests/cudapy/test_mandel.py +13 -6
numba_cuda/numba/cuda/tests/cudapy/test_math.py +83 -66
numba_cuda/numba/cuda/tests/cudapy/test_matmul.py +1 -3
numba_cuda/numba/cuda/tests/cudapy/test_minmax.py +19 -58
numba_cuda/numba/cuda/tests/cudapy/test_montecarlo.py +4 -4
numba_cuda/numba/cuda/tests/cudapy/test_multigpu.py +9 -7
numba_cuda/numba/cuda/tests/cudapy/test_multiprocessing.py +9 -8
numba_cuda/numba/cuda/tests/cudapy/test_multithreads.py +12 -10
numba_cuda/numba/cuda/tests/cudapy/test_nondet.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_operator.py +180 -96
numba_cuda/numba/cuda/tests/cudapy/test_optimization.py +5 -5
numba_cuda/numba/cuda/tests/cudapy/test_overload.py +37 -18
numba_cuda/numba/cuda/tests/cudapy/test_powi.py +7 -7
numba_cuda/numba/cuda/tests/cudapy/test_print.py +9 -7
numba_cuda/numba/cuda/tests/cudapy/test_py2_div_issue.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_random.py +15 -10
numba_cuda/numba/cuda/tests/cudapy/test_record_dtype.py +88 -87
numba_cuda/numba/cuda/tests/cudapy/test_recursion.py +12 -10
numba_cuda/numba/cuda/tests/cudapy/test_reduction.py +26 -11
numba_cuda/numba/cuda/tests/cudapy/test_retrieve_autoconverted_arrays.py +7 -10
numba_cuda/numba/cuda/tests/cudapy/test_serialize.py +4 -6
numba_cuda/numba/cuda/tests/cudapy/test_slicing.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_sm.py +10 -9
numba_cuda/numba/cuda/tests/cudapy/test_sm_creation.py +62 -43
numba_cuda/numba/cuda/tests/cudapy/test_stream_api.py +7 -3
numba_cuda/numba/cuda/tests/cudapy/test_sync.py +7 -5
numba_cuda/numba/cuda/tests/cudapy/test_transpose.py +18 -11
numba_cuda/numba/cuda/tests/cudapy/test_ufuncs.py +111 -88
numba_cuda/numba/cuda/tests/cudapy/test_userexc.py +2 -3
numba_cuda/numba/cuda/tests/cudapy/test_vector_type.py +305 -130
numba_cuda/numba/cuda/tests/cudapy/test_vectorize.py +33 -36
numba_cuda/numba/cuda/tests/cudapy/test_vectorize_complex.py +5 -5
numba_cuda/numba/cuda/tests/cudapy/test_vectorize_decor.py +16 -12
numba_cuda/numba/cuda/tests/cudapy/test_vectorize_device.py +7 -7
numba_cuda/numba/cuda/tests/cudapy/test_vectorize_scalar_arg.py +6 -7
numba_cuda/numba/cuda/tests/cudapy/test_warning.py +31 -29
numba_cuda/numba/cuda/tests/cudapy/test_warp_ops.py +81 -30
numba_cuda/numba/cuda/tests/cudasim/test_cudasim_issues.py +19 -13
numba_cuda/numba/cuda/tests/data/jitlink.cu +1 -1
numba_cuda/numba/cuda/tests/data/jitlink.ptx +0 -2
numba_cuda/numba/cuda/tests/doc_examples/test_cg.py +15 -8
numba_cuda/numba/cuda/tests/doc_examples/test_cpu_gpu_compat.py +4 -7
numba_cuda/numba/cuda/tests/doc_examples/test_ffi.py +14 -9
numba_cuda/numba/cuda/tests/doc_examples/test_laplace.py +22 -18
numba_cuda/numba/cuda/tests/doc_examples/test_matmul.py +7 -4
numba_cuda/numba/cuda/tests/doc_examples/test_montecarlo.py +2 -0
numba_cuda/numba/cuda/tests/doc_examples/test_random.py +8 -4
numba_cuda/numba/cuda/tests/doc_examples/test_reduction.py +2 -1
numba_cuda/numba/cuda/tests/doc_examples/test_sessionize.py +94 -19
numba_cuda/numba/cuda/tests/doc_examples/test_vecadd.py +2 -2
numba_cuda/numba/cuda/tests/nocuda/test_dummyarray.py +91 -62
numba_cuda/numba/cuda/tests/nocuda/test_function_resolution.py +14 -5
numba_cuda/numba/cuda/tests/nocuda/test_import.py +25 -25
numba_cuda/numba/cuda/tests/nocuda/test_library_lookup.py +40 -40
numba_cuda/numba/cuda/tests/nocuda/test_nvvm.py +12 -10
numba_cuda/numba/cuda/tests/nrt/test_nrt.py +16 -20
numba_cuda/numba/cuda/tests/nrt/test_nrt_refct.py +12 -10
numba_cuda/numba/cuda/tests/test_binary_generation/generate_raw_ltoir.py +2 -2
numba_cuda/numba/cuda/types.py +5 -2
numba_cuda/numba/cuda/ufuncs.py +382 -362
numba_cuda/numba/cuda/utils.py +2 -2
numba_cuda/numba/cuda/vector_types.py +5 -3
numba_cuda/numba/cuda/vectorizers.py +38 -33
{numba_cuda-0.8.1.dist-info → numba_cuda-0.10.0.dist-info}/METADATA +1 -1
numba_cuda-0.10.0.dist-info/RECORD +263 -0
{numba_cuda-0.8.1.dist-info → numba_cuda-0.10.0.dist-info}/WHEEL +1 -1
numba_cuda-0.8.1.dist-info/RECORD +0 -251
{numba_cuda-0.8.1.dist-info → numba_cuda-0.10.0.dist-info}/licenses/LICENSE +0 -0
{numba_cuda-0.8.1.dist-info → numba_cuda-0.10.0.dist-info}/top_level.txt +0 -0

numba_cuda/numba/cuda/tests/cudapy/test_math.py CHANGED Viewed

@@ -1,8 +1,10 @@
 import numpy as np
-from numba.cuda.testing import (skip_unless_cc_53,
-                                unittest,
-                                CUDATestCase,
-                                skip_on_cudasim)
+from numba.cuda.testing import (
+    skip_unless_cc_53,
+    unittest,
+    CUDATestCase,
+    skip_on_cudasim,
+)
 from numba.np import numpy_support
 from numba import cuda, float32, float64, int32, vectorize, void, int64
 import math
@@ -253,8 +255,10 @@ class TestCudaMath(CUDATestCase):
     def unary_bool_special_values(self, func, npfunc, npdtype, npmtype):
         fi = np.finfo(npdtype)
         denorm = fi.tiny / 4
-        A = np.array([0., denorm, fi.tiny, 0.5, 1., fi.max, np.inf, np.nan],
-                     dtype=npdtype)
+        A = np.array(
+            [0.0, denorm, fi.tiny, 0.5, 1.0, fi.max, np.inf, np.nan],
+            dtype=npdtype,
+        )
         B = np.empty_like(A, dtype=np.int32)
         cfunc = cuda.jit((npmtype[::1], int32[::1]))(func)
@@ -314,7 +318,7 @@ class TestCudaMath(CUDATestCase):
         cfunc[1, nelem](A, A, B)
         np.testing.assert_allclose(npfunc(A, A), B)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_acos
     def test_math_acos(self):
@@ -325,7 +329,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_acos, np.arccos, start=0, stop=0)
         self.unary_template_uint64(math_acos, np.arccos, start=0, stop=0)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_asin
     def test_math_asin(self):
@@ -336,7 +340,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_asin, np.arcsin, start=0, stop=0)
         self.unary_template_uint64(math_asin, np.arcsin, start=0, stop=0)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_atan
     def test_math_atan(self):
@@ -345,7 +349,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_atan, np.arctan)
         self.unary_template_uint64(math_atan, np.arctan)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_acosh
     def test_math_acosh(self):
@@ -354,7 +358,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_acosh, np.arccosh, start=1, stop=2)
         self.unary_template_uint64(math_acosh, np.arccosh, start=1, stop=2)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_asinh
     def test_math_asinh(self):
@@ -363,16 +367,16 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_asinh, np.arcsinh)
         self.unary_template_uint64(math_asinh, np.arcsinh)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_atanh
     def test_math_atanh(self):
-        self.unary_template_float32(math_atanh, np.arctanh, start=0, stop=.9)
-        self.unary_template_float64(math_atanh, np.arctanh, start=0, stop=.9)
-        self.unary_template_int64(math_atanh, np.arctanh, start=0, stop=.9)
-        self.unary_template_uint64(math_atanh, np.arctanh, start=0, stop=.9)
+        self.unary_template_float32(math_atanh, np.arctanh, start=0, stop=0.9)
+        self.unary_template_float64(math_atanh, np.arctanh, start=0, stop=0.9)
+        self.unary_template_int64(math_atanh, np.arctanh, start=0, stop=0.9)
+        self.unary_template_uint64(math_atanh, np.arctanh, start=0, stop=0.9)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_cos
     def test_math_cos(self):
@@ -399,7 +403,7 @@ class TestCudaMath(CUDATestCase):
     def test_math_fp16_trunc(self):
         self.unary_template_float16(math_trunc, np.trunc)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_sin
     def test_math_sin(self):
@@ -408,7 +412,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_sin, np.sin)
         self.unary_template_uint64(math_sin, np.sin)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_tan
     def test_math_tan(self):
@@ -417,7 +421,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_tan, np.tan)
         self.unary_template_uint64(math_tan, np.tan)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_cosh
     def test_math_cosh(self):
@@ -426,7 +430,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_cosh, np.cosh)
         self.unary_template_uint64(math_cosh, np.cosh)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_sinh
     def test_math_sinh(self):
@@ -435,7 +439,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_sinh, np.sinh)
         self.unary_template_uint64(math_sinh, np.sinh)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_tanh
     def test_math_tanh(self):
@@ -444,7 +448,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_tanh, np.tanh)
         self.unary_template_uint64(math_tanh, np.tanh)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_atan2
     def test_math_atan2(self):
@@ -453,31 +457,33 @@ class TestCudaMath(CUDATestCase):
         self.binary_template_int64(math_atan2, np.arctan2)
         self.binary_template_uint64(math_atan2, np.arctan2)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_erf
     def test_math_erf(self):
         @vectorize
         def ufunc(x):
             return math.erf(x)
         self.unary_template_float32(math_erf, ufunc)
         self.unary_template_float64(math_erf, ufunc)
         self.unary_template_int64(math_erf, ufunc)
         self.unary_template_uint64(math_erf, ufunc)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_erfc
     def test_math_erfc(self):
         @vectorize
         def ufunc(x):
             return math.erfc(x)
         self.unary_template_float32(math_erfc, ufunc)
         self.unary_template_float64(math_erfc, ufunc)
         self.unary_template_int64(math_erfc, ufunc)
         self.unary_template_uint64(math_erfc, ufunc)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_exp
     def test_math_exp(self):
@@ -486,7 +492,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_exp, np.exp)
         self.unary_template_uint64(math_exp, np.exp)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_expm1
     def test_math_expm1(self):
@@ -495,7 +501,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_expm1, np.expm1)
         self.unary_template_uint64(math_expm1, np.expm1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_fabs
     def test_math_fabs(self):
@@ -504,31 +510,33 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_fabs, np.fabs, start=-1)
         self.unary_template_uint64(math_fabs, np.fabs, start=-1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_gamma
     def test_math_gamma(self):
         @vectorize
         def ufunc(x):
             return math.gamma(x)
         self.unary_template_float32(math_gamma, ufunc, start=0.1)
         self.unary_template_float64(math_gamma, ufunc, start=0.1)
         self.unary_template_int64(math_gamma, ufunc, start=1)
         self.unary_template_uint64(math_gamma, ufunc, start=1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_lgamma
     def test_math_lgamma(self):
         @vectorize
         def ufunc(x):
             return math.lgamma(x)
         self.unary_template_float32(math_lgamma, ufunc, start=0.1)
         self.unary_template_float64(math_lgamma, ufunc, start=0.1)
         self.unary_template_int64(math_lgamma, ufunc, start=1)
         self.unary_template_uint64(math_lgamma, ufunc, start=1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_log
     def test_math_log(self):
@@ -537,7 +545,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_log, np.log, start=1)
         self.unary_template_uint64(math_log, np.log, start=1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_log2
     def test_math_log2(self):
@@ -546,7 +554,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_log2, np.log2, start=1)
         self.unary_template_uint64(math_log2, np.log2, start=1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_log10
     def test_math_log10(self):
@@ -555,7 +563,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_log10, np.log10, start=1)
         self.unary_template_uint64(math_log10, np.log10, start=1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_log1p
     def test_math_log1p(self):
@@ -564,7 +572,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_log1p, np.log1p)
         self.unary_template_uint64(math_log1p, np.log1p)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_remainder
     def test_math_remainder(self):
@@ -573,16 +581,17 @@ class TestCudaMath(CUDATestCase):
         self.binary_template_int64(math_remainder, np.remainder, start=1)
         self.binary_template_uint64(math_remainder, np.remainder, start=1)
-    @skip_on_cudasim('math.remainder(0, 0) raises a ValueError on CUDASim')
+    @skip_on_cudasim("math.remainder(0, 0) raises a ValueError on CUDASim")
     def test_math_remainder_0_0(self):
         @cuda.jit(void(float64[::1], int64, int64))
         def test_0_0(r, x, y):
             r[0] = math.remainder(x, y)
         r = np.zeros(1, np.float64)
         test_0_0[1, 1](r, 0, 0)
         self.assertTrue(np.isnan(r[0]))
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_sqrt
     def test_math_sqrt(self):
@@ -591,7 +600,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_sqrt, np.sqrt)
         self.unary_template_uint64(math_sqrt, np.sqrt)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_hypot
     def test_math_hypot(self):
@@ -600,7 +609,7 @@ class TestCudaMath(CUDATestCase):
         self.binary_template_int64(math_hypot, np.hypot)
         self.binary_template_uint64(math_hypot, np.hypot)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_pow
     def pow_template_int32(self, npdtype):
@@ -626,14 +635,14 @@ class TestCudaMath(CUDATestCase):
         self.pow_template_int32(np.float32)
         self.pow_template_int32(np.float64)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_pow_binop
     def test_math_pow_binop(self):
         self.binary_template_float32(math_pow_binop, np.power)
         self.binary_template_float64(math_pow_binop, np.power)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_ceil
     def test_math_ceil(self):
@@ -642,7 +651,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_ceil, np.ceil)
         self.unary_template_uint64(math_ceil, np.ceil)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_floor
     def test_math_floor(self):
@@ -651,7 +660,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_template_int64(math_floor, np.floor)
         self.unary_template_uint64(math_floor, np.floor)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_trunc
     #
     # Note that math.trunc() is only supported on NumPy float64s, and not
@@ -663,20 +672,20 @@ class TestCudaMath(CUDATestCase):
     def test_math_trunc(self):
         self.unary_template_float64(math_trunc, np.trunc)
-    @skip_on_cudasim('trunc only supported on NumPy float64')
+    @skip_on_cudasim("trunc only supported on NumPy float64")
     def test_math_trunc_non_float64(self):
         self.unary_template_float32(math_trunc, np.trunc)
         self.unary_template_int64(math_trunc, np.trunc)
         self.unary_template_uint64(math_trunc, np.trunc)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_copysign
     def test_math_copysign(self):
         self.binary_template_float32(math_copysign, np.copysign, start=-1)
         self.binary_template_float64(math_copysign, np.copysign, start=-1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_modf
     def test_math_modf(self):
@@ -696,45 +705,53 @@ class TestCudaMath(CUDATestCase):
             cfunc = cuda.jit((arytype, arytype, arytype))(math_modf)
             cfunc[1, len(A)](A, B, C)
             D, E = np.modf(A)
-            self.assertTrue(np.array_equal(B,D))
-            self.assertTrue(np.array_equal(C,E))
+            self.assertTrue(np.array_equal(B, D))
+            self.assertTrue(np.array_equal(C, E))
         nelem = 50
-        #32 bit float
+        # 32 bit float
         with self.subTest("float32 modf on simple float"):
-            modf_template_compare(np.linspace(0, 10, nelem), dtype=np.float32,
-                                  arytype=float32[:])
+            modf_template_compare(
+                np.linspace(0, 10, nelem), dtype=np.float32, arytype=float32[:]
+            )
         with self.subTest("float32 modf on +- infinity"):
-            modf_template_compare(np.array([np.inf, -np.inf]), dtype=np.float32,
-                                  arytype=float32[:])
+            modf_template_compare(
+                np.array([np.inf, -np.inf]),
+                dtype=np.float32,
+                arytype=float32[:],
+            )
         with self.subTest("float32 modf on nan"):
             modf_template_nan(dtype=np.float32, arytype=float32[:])
-        #64 bit float
+        # 64 bit float
         with self.subTest("float64 modf on simple float"):
-            modf_template_compare(np.linspace(0, 10, nelem), dtype=np.float64,
-                                  arytype=float64[:])
+            modf_template_compare(
+                np.linspace(0, 10, nelem), dtype=np.float64, arytype=float64[:]
+            )
         with self.subTest("float64 modf on +- infinity"):
-            modf_template_compare(np.array([np.inf, -np.inf]), dtype=np.float64,
-                                  arytype=float64[:])
+            modf_template_compare(
+                np.array([np.inf, -np.inf]),
+                dtype=np.float64,
+                arytype=float64[:],
+            )
         with self.subTest("float64 modf on nan"):
             modf_template_nan(dtype=np.float64, arytype=float64[:])
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_fmod
     def test_math_fmod(self):
         self.binary_template_float32(math_fmod, np.fmod, start=1)
         self.binary_template_float64(math_fmod, np.fmod, start=1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_mod_binop
     def test_math_mod_binop(self):
         self.binary_template_float32(math_mod_binop, np.fmod, start=1)
         self.binary_template_float64(math_mod_binop, np.fmod, start=1)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_isnan
     def test_math_isnan(self):
@@ -745,7 +762,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_bool_special_values_float32(math_isnan, np.isnan)
         self.unary_bool_special_values_float64(math_isnan, np.isnan)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_isinf
     def test_math_isinf(self):
@@ -756,7 +773,7 @@ class TestCudaMath(CUDATestCase):
         self.unary_bool_special_values_float32(math_isinf, np.isinf)
         self.unary_bool_special_values_float64(math_isinf, np.isinf)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_isfinite
     def test_math_isfinite(self):
@@ -767,14 +784,14 @@ class TestCudaMath(CUDATestCase):
         self.unary_bool_special_values_float32(math_isfinite, np.isfinite)
         self.unary_bool_special_values_float64(math_isfinite, np.isfinite)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_degrees
     def test_math_degrees(self):
         self.unary_bool_template_float32(math_degrees, np.degrees)
         self.unary_bool_template_float64(math_degrees, np.degrees)
-    #---------------------------------------------------------------------------
+    # ---------------------------------------------------------------------------
     # test_math_radians
     def test_math_radians(self):
@@ -782,5 +799,5 @@ class TestCudaMath(CUDATestCase):
         self.unary_bool_template_float64(math_radians, np.radians)
-if __name__ == '__main__':
+if __name__ == "__main__":
     unittest.main()

numba_cuda/numba/cuda/tests/cudapy/test_matmul.py CHANGED Viewed

@@ -15,9 +15,7 @@ SM_SIZE = (tpb, tpb)
 class TestCudaMatMul(CUDATestCase):
     def test_func(self):
         @cuda.jit(void(float32[:, ::1], float32[:, ::1], float32[:, ::1]))
         def cu_square_matrix_mul(A, B, C):
             sA = cuda.shared.array(shape=SM_SIZE, dtype=float32)
@@ -70,5 +68,5 @@ class TestCudaMatMul(CUDATestCase):
         np.testing.assert_allclose(C, Cans, rtol=1e-5)
-if __name__ == '__main__':
+if __name__ == "__main__":
     unittest.main()

numba_cuda/numba/cuda/tests/cudapy/test_minmax.py CHANGED Viewed

@@ -22,20 +22,21 @@ def builtin_min(A, B, C):
     C[i] = float64(min(A[i], B[i]))
-@skip_on_cudasim('Tests PTX emission')
+@skip_on_cudasim("Tests PTX emission")
 class TestCudaMinMax(CUDATestCase):
     def _run(
-            self,
-            kernel,
-            numpy_equivalent,
-            ptx_instruction,
-            dtype_left,
-            dtype_right,
-            n=5):
+        self,
+        kernel,
+        numpy_equivalent,
+        ptx_instruction,
+        dtype_left,
+        dtype_right,
+        n=5,
+    ):
         kernel = cuda.jit(kernel)
         c = np.zeros(n, dtype=np.float64)
-        a = np.arange(n, dtype=dtype_left) + .5
+        a = np.arange(n, dtype=dtype_left) + 0.5
         b = np.full(n, fill_value=2, dtype=dtype_right)
         kernel[1, c.shape](a, b, c)
@@ -45,69 +46,29 @@ class TestCudaMinMax(CUDATestCase):
         self.assertIn(ptx_instruction, ptx)
     def test_max_f8f8(self):
-        self._run(
-            builtin_max,
-            np.maximum,
-            'max.f64',
-            np.float64,
-            np.float64)
+        self._run(builtin_max, np.maximum, "max.f64", np.float64, np.float64)
     def test_max_f4f8(self):
-        self._run(
-            builtin_max,
-            np.maximum,
-            'max.f64',
-            np.float32,
-            np.float64)
+        self._run(builtin_max, np.maximum, "max.f64", np.float32, np.float64)
     def test_max_f8f4(self):
-        self._run(
-            builtin_max,
-            np.maximum,
-            'max.f64',
-            np.float64,
-            np.float32)
+        self._run(builtin_max, np.maximum, "max.f64", np.float64, np.float32)
     def test_max_f4f4(self):
-        self._run(
-            builtin_max,
-            np.maximum,
-            'max.f32',
-            np.float32,
-            np.float32)
+        self._run(builtin_max, np.maximum, "max.f32", np.float32, np.float32)
     def test_min_f8f8(self):
-        self._run(
-            builtin_min,
-            np.minimum,
-            'min.f64',
-            np.float64,
-            np.float64)
+        self._run(builtin_min, np.minimum, "min.f64", np.float64, np.float64)
     def test_min_f4f8(self):
-        self._run(
-            builtin_min,
-            np.minimum,
-            'min.f64',
-            np.float32,
-            np.float64)
+        self._run(builtin_min, np.minimum, "min.f64", np.float32, np.float64)
     def test_min_f8f4(self):
-        self._run(
-            builtin_min,
-            np.minimum,
-            'min.f64',
-            np.float64,
-            np.float32)
+        self._run(builtin_min, np.minimum, "min.f64", np.float64, np.float32)
     def test_min_f4f4(self):
-        self._run(
-            builtin_min,
-            np.minimum,
-            'min.f32',
-            np.float32,
-            np.float32)
+        self._run(builtin_min, np.minimum, "min.f32", np.float32, np.float32)
-if __name__ == '__main__':
+if __name__ == "__main__":
     unittest.main()

numba_cuda/numba/cuda/tests/cudapy/test_montecarlo.py CHANGED Viewed

@@ -5,11 +5,11 @@ from numba.cuda.testing import unittest, CUDATestCase
 class TestCudaMonteCarlo(CUDATestCase):
     def test_montecarlo(self):
-        """Just make sure we can compile this
-        """
+        """Just make sure we can compile this"""
         @cuda.jit(
-            'void(double[:], double[:], double, double, double, double[:])')
+            "void(double[:], double[:], double, double, double, double[:])"
+        )
         def step(last, paths, dt, c0, c1, normdist):
             i = cuda.grid(1)
             if i >= paths.shape[0]:
@@ -18,5 +18,5 @@ class TestCudaMonteCarlo(CUDATestCase):
             paths[i] = last[i] * math.exp(c0 * dt + c1 * noise)
-if __name__ == '__main__':
+if __name__ == "__main__":
     unittest.main()

numba_cuda/numba/cuda/tests/cudapy/test_multigpu.py CHANGED Viewed

@@ -47,7 +47,7 @@ class TestMultiGPUContext(CUDATestCase):
         copy_plus_1[1, N](A, B)
         check(A, B)
-    @skip_on_cudasim('Simulator does not support multiple threads')
+    @skip_on_cudasim("Simulator does not support multiple threads")
     def test_multithreaded(self):
         def work(gpu, dA, results, ridx):
             try:
@@ -64,9 +64,12 @@ class TestMultiGPUContext(CUDATestCase):
         nthreads = 10
         results = [None] * nthreads
-        threads = [threading.Thread(target=work, args=(cuda.gpus.current,
-                                                       dA, results, i))
-                   for i in range(nthreads)]
+        threads = [
+            threading.Thread(
+                target=work, args=(cuda.gpus.current, dA, results, i)
+            )
+            for i in range(nthreads)
+        ]
         for th in threads:
             th.start()
@@ -81,7 +84,6 @@ class TestMultiGPUContext(CUDATestCase):
     @unittest.skipIf(len(cuda.gpus) < 2, "need more than 1 gpus")
     def test_with_context(self):
         @cuda.jit
         def vector_add_scalar(arr, val):
             i = cuda.grid(1)
@@ -115,7 +117,7 @@ class TestMultiGPUContext(CUDATestCase):
         with cuda.gpus[0]:
             ctx = cuda.current_context()
             if not ctx.can_access_peer(1):
-                self.skipTest('Peer access between GPUs disabled')
+                self.skipTest("Peer access between GPUs disabled")
         # 1. Create a range in an array
         hostarr = np.arange(10, dtype=np.float32)
@@ -136,5 +138,5 @@ class TestMultiGPUContext(CUDATestCase):
             np.testing.assert_equal(arr2.copy_to_host(), hostarr)
-if __name__ == '__main__':
+if __name__ == "__main__":
     unittest.main()

numba-cuda 0.8.1__py3-none-any.whl → 0.10.0__py3-none-any.whl

numba-cuda 0.8.1__py3-none-any.whl → 0.10.0__py3-none-any.whl