PyPI - numba-cuda - Versions diffs - 0.17.0__py3-none-any.whl → 0.18.0__py3-none-any.whl - Mend

numba-cuda 0.17.0__py3-none-any.whl → 0.18.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62)

numba_cuda/VERSION +1 -1
numba_cuda/numba/cuda/__init__.py +0 -8
numba_cuda/numba/cuda/_internal/cuda_fp16.py +14225 -0
numba_cuda/numba/cuda/api_util.py +6 -0
numba_cuda/numba/cuda/cgutils.py +1291 -0
numba_cuda/numba/cuda/codegen.py +32 -14
numba_cuda/numba/cuda/compiler.py +113 -10
numba_cuda/numba/cuda/core/caching.py +741 -0
numba_cuda/numba/cuda/core/callconv.py +338 -0
numba_cuda/numba/cuda/core/codegen.py +168 -0
numba_cuda/numba/cuda/core/compiler.py +205 -0
numba_cuda/numba/cuda/core/typed_passes.py +139 -0
numba_cuda/numba/cuda/cudadecl.py +0 -268
numba_cuda/numba/cuda/cudadrv/devicearray.py +3 -0
numba_cuda/numba/cuda/cudadrv/driver.py +2 -1
numba_cuda/numba/cuda/cudadrv/nvvm.py +1 -1
numba_cuda/numba/cuda/cudaimpl.py +4 -178
numba_cuda/numba/cuda/debuginfo.py +469 -3
numba_cuda/numba/cuda/device_init.py +0 -1
numba_cuda/numba/cuda/dispatcher.py +309 -11
numba_cuda/numba/cuda/extending.py +2 -1
numba_cuda/numba/cuda/fp16.py +348 -0
numba_cuda/numba/cuda/intrinsics.py +1 -1
numba_cuda/numba/cuda/libdeviceimpl.py +2 -1
numba_cuda/numba/cuda/lowering.py +1833 -8
numba_cuda/numba/cuda/mathimpl.py +2 -90
numba_cuda/numba/cuda/nvvmutils.py +2 -1
numba_cuda/numba/cuda/printimpl.py +2 -1
numba_cuda/numba/cuda/serialize.py +264 -0
numba_cuda/numba/cuda/simulator/__init__.py +2 -0
numba_cuda/numba/cuda/simulator/dispatcher.py +7 -0
numba_cuda/numba/cuda/stubs.py +0 -308
numba_cuda/numba/cuda/target.py +13 -5
numba_cuda/numba/cuda/testing.py +156 -5
numba_cuda/numba/cuda/tests/complex_usecases.py +113 -0
numba_cuda/numba/cuda/tests/core/serialize_usecases.py +110 -0
numba_cuda/numba/cuda/tests/core/test_serialize.py +359 -0
numba_cuda/numba/cuda/tests/cudadrv/test_cuda_ndarray.py +33 -0
numba_cuda/numba/cuda/tests/cudadrv/test_runtime.py +2 -2
numba_cuda/numba/cuda/tests/cudadrv/test_streams.py +1 -0
numba_cuda/numba/cuda/tests/cudapy/extensions_usecases.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_caching.py +5 -10
numba_cuda/numba/cuda/tests/cudapy/test_complex.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_debuginfo.py +381 -0
numba_cuda/numba/cuda/tests/cudapy/test_enums.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_extending.py +1 -1
numba_cuda/numba/cuda/tests/cudapy/test_inspect.py +94 -24
numba_cuda/numba/cuda/tests/cudapy/test_intrinsics.py +37 -23
numba_cuda/numba/cuda/tests/cudapy/test_operator.py +43 -27
numba_cuda/numba/cuda/tests/cudapy/test_ufuncs.py +26 -9
numba_cuda/numba/cuda/tests/cudapy/test_warning.py +27 -2
numba_cuda/numba/cuda/tests/enum_usecases.py +56 -0
numba_cuda/numba/cuda/tests/nocuda/test_library_lookup.py +1 -2
numba_cuda/numba/cuda/tests/nocuda/test_nvvm.py +1 -1
numba_cuda/numba/cuda/utils.py +785 -0
numba_cuda/numba/cuda/vector_types.py +1 -1
{numba_cuda-0.17.0.dist-info → numba_cuda-0.18.0.dist-info}/METADATA +18 -4
{numba_cuda-0.17.0.dist-info → numba_cuda-0.18.0.dist-info}/RECORD +61 -48
numba_cuda/numba/cuda/cpp_function_wrappers.cu +0 -46
{numba_cuda-0.17.0.dist-info → numba_cuda-0.18.0.dist-info}/WHEEL +0 -0
{numba_cuda-0.17.0.dist-info → numba_cuda-0.18.0.dist-info}/licenses/LICENSE +0 -0
{numba_cuda-0.17.0.dist-info → numba_cuda-0.18.0.dist-info}/top_level.txt +0 -0

numba_cuda/numba/cuda/fp16.py ADDED Viewed

@@ -0,0 +1,348 @@
+import numba.core.types as types
+from numba.cuda._internal.cuda_fp16 import (
+    typing_registry,
+    target_registry,
+    __half,
+    __double2half,
+    __float2half,
+    __float2half_rd,
+    __float2half_rn,
+    __float2half_ru,
+    __float2half_rz,
+    __int2half_rd,
+    __int2half_rn,
+    __int2half_ru,
+    __int2half_rz,
+    __ll2half_rd,
+    __ll2half_rn,
+    __ll2half_ru,
+    __ll2half_rz,
+    __short2half_rd,
+    __short2half_rn,
+    __short2half_ru,
+    __short2half_rz,
+    __uint2half_rd,
+    __uint2half_rn,
+    __uint2half_ru,
+    __uint2half_rz,
+    __ull2half_rd,
+    __ull2half_rn,
+    __ull2half_ru,
+    __ull2half_rz,
+    __ushort2half_rd,
+    __ushort2half_rn,
+    __ushort2half_ru,
+    __ushort2half_rz,
+    __half2char_rz,
+    __half2float,
+    __half2int_rd,
+    __half2int_rn,
+    __half2int_ru,
+    __half2int_rz,
+    __half2ll_rd,
+    __half2ll_rn,
+    __half2ll_ru,
+    __half2ll_rz,
+    __half2short_rd,
+    __half2short_rn,
+    __half2short_ru,
+    __half2short_rz,
+    __half2uchar_rz,
+    __half2uint_rd,
+    __half2uint_rn,
+    __half2uint_ru,
+    __half2uint_rz,
+    __half2ull_rd,
+    __half2ull_rn,
+    __half2ull_ru,
+    __half2ull_rz,
+    __half2ushort_rd,
+    __half2ushort_rn,
+    __half2ushort_ru,
+    __half2ushort_rz,
+    __short_as_half,
+    __ushort_as_half,
+    __half_as_short,
+    __half_as_ushort,
+    __habs as habs,
+    __habs,
+    __hadd as hadd,
+    __hadd,
+    __hadd_rn,
+    __hadd_sat,
+    __hcmadd,
+    __hdiv as hdiv,
+    __hdiv,
+    __heq as heq,
+    __heq,
+    __hequ,
+    __hfma as hfma,
+    __hfma,
+    __hfma_relu,
+    __hfma_sat,
+    __hge as hge,
+    __hge,
+    __hgeu,
+    __hgt as hgt,
+    __hgt,
+    __hgtu,
+    __hisinf,
+    __hisnan,
+    __hle as hle,
+    __hle,
+    __hleu,
+    __hlt as hlt,
+    __hlt,
+    __hltu,
+    __hmax as hmax,
+    __hmax,
+    __hmax_nan,
+    __hmin as hmin,
+    __hmin,
+    __hmin_nan,
+    __hmul as hmul,
+    __hmul,
+    __hmul_rn,
+    __hmul_sat,
+    __hne as hne,
+    __hne,
+    __hneg as hneg,
+    __hneg,
+    __hneu,
+    __hsub as hsub,
+    __hsub,
+    __hsub_rn,
+    __hsub_sat,
+    atomicAdd,
+    hceil,
+    hcos,
+    hexp,
+    hexp10,
+    hexp2,
+    hfloor,
+    hlog,
+    hlog10,
+    hlog2,
+    hrcp,
+    hrint,
+    hrsqrt,
+    hsin,
+    hsqrt,
+    htanh,
+    htanh_approx,
+    htrunc,
+)
+from numba.extending import overload
+import math
+def _make_unary(a, func):
+    if isinstance(a, types.Float) and a.bitwidth == 16:
+        return lambda a: func(a)
+# Bind low++ bindings to math APIs
+@overload(math.trunc, target="cuda")
+def trunc_ol(a):
+    return _make_unary(a, htrunc)
+@overload(math.ceil, target="cuda")
+def ceil_ol(a):
+    return _make_unary(a, hceil)
+@overload(math.floor, target="cuda")
+def floor_ol(a):
+    return _make_unary(a, hfloor)
+@overload(math.fabs, target="cuda")
+def fabs_ol(a):
+    return _make_unary(a, habs)
+@overload(math.sqrt, target="cuda")
+def sqrt_ol(a):
+    return _make_unary(a, hsqrt)
+@overload(math.log, target="cuda")
+def log_ol(a):
+    return _make_unary(a, hlog)
+@overload(math.log2, target="cuda")
+def log2_ol(a):
+    return _make_unary(a, hlog2)
+@overload(math.log10, target="cuda")
+def log10_ol(a):
+    return _make_unary(a, hlog10)
+@overload(math.exp, target="cuda")
+def exp_ol(a):
+    return _make_unary(a, hexp)
+@overload(math.tanh, target="cuda")
+def tanh_ol(a):
+    return _make_unary(a, htanh)
+@overload(math.cos, target="cuda")
+def cos_ol(a):
+    return _make_unary(a, hcos)
+@overload(math.sin, target="cuda")
+def sin_ol(a):
+    return _make_unary(a, hsin)
+try:
+    from math import exp2
+    @overload(exp2, target="cuda")
+    def exp2_ol(a):
+        return _make_unary(a, hexp2)
+except ImportError:
+    pass
+__all__ = [
+    "typing_registry",
+    "target_registry",
+    "__half",
+    "__double2half",
+    "__float2half",
+    "__float2half_rd",
+    "__float2half_rn",
+    "__float2half_ru",
+    "__float2half_rz",
+    "__int2half_rd",
+    "__int2half_rn",
+    "__int2half_ru",
+    "__int2half_rz",
+    "__ll2half_rd",
+    "__ll2half_rn",
+    "__ll2half_ru",
+    "__ll2half_rz",
+    "__short2half_rd",
+    "__short2half_rn",
+    "__short2half_ru",
+    "__short2half_rz",
+    "__uint2half_rd",
+    "__uint2half_rn",
+    "__uint2half_ru",
+    "__uint2half_rz",
+    "__ull2half_rd",
+    "__ull2half_rn",
+    "__ull2half_ru",
+    "__ull2half_rz",
+    "__ushort2half_rd",
+    "__ushort2half_rn",
+    "__ushort2half_ru",
+    "__ushort2half_rz",
+    "__half2char_rz",
+    "__half2float",
+    "__half2int_rd",
+    "__half2int_rn",
+    "__half2int_ru",
+    "__half2int_rz",
+    "__half2ll_rd",
+    "__half2ll_rn",
+    "__half2ll_ru",
+    "__half2ll_rz",
+    "__half2short_rd",
+    "__half2short_rn",
+    "__half2short_ru",
+    "__half2short_rz",
+    "__half2uchar_rz",
+    "__half2uint_rd",
+    "__half2uint_rn",
+    "__half2uint_ru",
+    "__half2uint_rz",
+    "__half2ull_rd",
+    "__half2ull_rn",
+    "__half2ull_ru",
+    "__half2ull_rz",
+    "__half2ushort_rd",
+    "__half2ushort_rn",
+    "__half2ushort_ru",
+    "__half2ushort_rz",
+    "__short_as_half",
+    "__ushort_as_half",
+    "__half_as_short",
+    "__half_as_ushort",
+    "habs",
+    "__habs",
+    "hadd",
+    "__hadd",
+    "__hadd_rn",
+    "__hadd_sat",
+    "__hcmadd",
+    "hdiv",
+    "__hdiv",
+    "heq",
+    "__heq",
+    "__hequ",
+    "hfma",
+    "__hfma",
+    "__hfma_relu",
+    "__hfma_sat",
+    "hge",
+    "__hge",
+    "__hgeu",
+    "hgt",
+    "__hgt",
+    "__hgtu",
+    "__hisinf",
+    "__hisnan",
+    "hle",
+    "__hle",
+    "__hleu",
+    "hlt",
+    "__hlt",
+    "__hltu",
+    "hmax",
+    "__hmax",
+    "__hmax_nan",
+    "hmin",
+    "__hmin",
+    "__hmin_nan",
+    "hmul",
+    "__hmul",
+    "__hmul_rn",
+    "__hmul_sat",
+    "hne",
+    "__hne",
+    "hneg",
+    "__hneg",
+    "__hneu",
+    "hsub",
+    "__hsub",
+    "__hsub_rn",
+    "__hsub_sat",
+    "atomicAdd",
+    "hceil",
+    "hcos",
+    "hexp",
+    "hexp10",
+    "hexp2",
+    "hfloor",
+    "hlog",
+    "hlog10",
+    "hlog2",
+    "hrcp",
+    "hrint",
+    "hrsqrt",
+    "hsin",
+    "hsqrt",
+    "htanh",
+    "htanh_approx",
+    "htrunc",
+]

numba_cuda/numba/cuda/intrinsics.py CHANGED Viewed

@@ -1,7 +1,7 @@
 from llvmlite import ir
 from numba import cuda, types
-from numba.core import cgutils
+from numba.cuda import cgutils
 from numba.core.errors import RequireLiteralValue, TypingError
 from numba.core.typing import signature
 from numba.core.extending import overload_attribute, overload_method

numba_cuda/numba/cuda/libdeviceimpl.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from llvmlite import ir
-from numba.core import cgutils, types
+from numba.core import types
+from numba.cuda import cgutils
 from numba.core.imputils import Registry
 from numba.cuda import libdevice, libdevicefuncs

numba-cuda 0.17.0__py3-none-any.whl → 0.18.0__py3-none-any.whl

numba-cuda 0.17.0__py3-none-any.whl → 0.18.0__py3-none-any.whl