PyPI - pyopencl - Versions diffs - 2025.2.5__cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl - Mend

pyopencl 2025.2.5__cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of pyopencl might be problematic. Click here for more details.

Files changed (47)

pyopencl/.libs/libOpenCL-83a5a7fd.so.1.0.0 +0 -0
pyopencl/__init__.py +1995 -0
pyopencl/_cl.cpython-313-x86_64-linux-gnu.so +0 -0
pyopencl/_cl.pyi +2006 -0
pyopencl/_cluda.py +57 -0
pyopencl/_monkeypatch.py +1069 -0
pyopencl/_mymako.py +17 -0
pyopencl/algorithm.py +1454 -0
pyopencl/array.py +3441 -0
pyopencl/bitonic_sort.py +245 -0
pyopencl/bitonic_sort_templates.py +597 -0
pyopencl/cache.py +535 -0
pyopencl/capture_call.py +200 -0
pyopencl/characterize/__init__.py +463 -0
pyopencl/characterize/performance.py +240 -0
pyopencl/cl/pyopencl-airy.cl +324 -0
pyopencl/cl/pyopencl-bessel-j-complex.cl +238 -0
pyopencl/cl/pyopencl-bessel-j.cl +1084 -0
pyopencl/cl/pyopencl-bessel-y.cl +435 -0
pyopencl/cl/pyopencl-complex.h +303 -0
pyopencl/cl/pyopencl-eval-tbl.cl +120 -0
pyopencl/cl/pyopencl-hankel-complex.cl +444 -0
pyopencl/cl/pyopencl-random123/array.h +325 -0
pyopencl/cl/pyopencl-random123/openclfeatures.h +93 -0
pyopencl/cl/pyopencl-random123/philox.cl +486 -0
pyopencl/cl/pyopencl-random123/threefry.cl +864 -0
pyopencl/clmath.py +282 -0
pyopencl/clrandom.py +412 -0
pyopencl/cltypes.py +202 -0
pyopencl/compyte/.gitignore +21 -0
pyopencl/compyte/__init__.py +0 -0
pyopencl/compyte/array.py +241 -0
pyopencl/compyte/dtypes.py +316 -0
pyopencl/compyte/pyproject.toml +52 -0
pyopencl/elementwise.py +1178 -0
pyopencl/invoker.py +417 -0
pyopencl/ipython_ext.py +70 -0
pyopencl/py.typed +0 -0
pyopencl/reduction.py +815 -0
pyopencl/scan.py +1916 -0
pyopencl/tools.py +1565 -0
pyopencl/typing.py +61 -0
pyopencl/version.py +11 -0
pyopencl-2025.2.5.dist-info/METADATA +109 -0
pyopencl-2025.2.5.dist-info/RECORD +47 -0
pyopencl-2025.2.5.dist-info/WHEEL +6 -0
pyopencl-2025.2.5.dist-info/licenses/LICENSE +104 -0

pyopencl/cl/pyopencl-complex.h ADDED Viewed

@@ -0,0 +1,303 @@
+/*
+ * Copyright (c) 1999
+ * Silicon Graphics Computer Systems, Inc.
+ *
+ * Copyright (c) 1999
+ * Boris Fomitchev
+ *
+ * Copyright (c) 2012
+ * Andreas Kloeckner
+ *
+ * This material is provided "as is", with absolutely no warranty expressed
+ * or implied. Any use is at your own risk.
+ *
+ * Permission to use or copy this software for any purpose is hereby granted
+ * without fee, provided the above notices are retained on all copies.
+ * Permission to modify the code and to distribute modified code is granted,
+ * provided the above notices are retained, and a notice that the code was
+ * modified is included with the above copyright notice.
+ *
+ */
+// This file is available for inclusion in pyopencl kernels and provides
+// complex types 'cfloat_t' and 'cdouble_t', along with a number of special
+// functions as visible below, e.g. cdouble_log(z).
+//
+// Under the hood, each complex type is a union of two two-member structs,
+// so its components can be read as '.real'/'.imag' or as '.x'/'.y'.
+// They are not the built-in float2/double2 vector types: use the functions
+// defined below (cfloat_add, cfloat_mul, ...) for complex arithmetic.
+#pragma once
+#define PYOPENCL_DECLARE_COMPLEX_TYPE_INT(REAL_TP, REAL_3LTR, TPROOT, TP) \
+  /* Emits the TPROOT##_<op> inline functions for complex type TP whose components have type REAL_TP; REAL_3LTR##_MAX is the limit constant read by _tan and _tanh. */ \
+  inline REAL_TP TPROOT##_real(TP a) { return a.real; } \
+  inline REAL_TP TPROOT##_imag(TP a) { return a.imag; }        \
+  inline REAL_TP TPROOT##_abs(TP a) { return hypot(a.real, a.imag); }   \
+  inline REAL_TP TPROOT##_abs_squared(TP a) { return a.real * a.real + a.imag * a.imag; } \
+  /* Constructors: _new sets both components, _fromreal sets the imaginary part to 0. */ \
+  inline TP TPROOT##_new(REAL_TP real, REAL_TP imag)  \
+  { \
+    TP result; \
+    result.real = real; \
+    result.imag = imag; \
+    return result; \
+  } \
+  \
+  inline TP TPROOT##_fromreal(REAL_TP real)     \
+  { \
+    TP result; \
+    result.real = real; \
+    result.imag = 0; \
+    return result; \
+  } \
+  \
+  /* Negation (both components) and complex conjugate (imaginary part only). */ \
+  inline TP TPROOT##_neg(TP a) { return TPROOT##_new(-a.real, -a.imag); } \
+  inline TP TPROOT##_conj(TP a) { return TPROOT##_new(a.real, -a.imag); } \
+  /* Addition: complex + complex (_add), complex + real (_addr), real + complex (_radd). */ \
+  inline TP TPROOT##_add(TP a, TP b)            \
+  { \
+    return TPROOT##_new(a.real + b.real, a.imag + b.imag); \
+    ; /* empty statement after the return; never reached */ \
+  } \
+  inline TP TPROOT##_addr(TP a, REAL_TP b)      \
+  { \
+    return TPROOT##_new(b+a.real, a.imag); \
+  } \
+  inline TP TPROOT##_radd(REAL_TP a, TP b)      \
+  { \
+    return TPROOT##_new(a+b.real, b.imag); \
+  } \
+  /* Component-wise subtraction a - b. */ \
+  inline TP TPROOT##_sub(TP a, TP b)            \
+  { \
+    return TPROOT##_new(a.real - b.real, a.imag - b.imag); \
+    ; /* empty statement after the return; never reached */ \
+  } \
+  /* Multiply-add a*b + c, with three of the four products folded into fma() calls. */ \
+  inline TP TPROOT##_fma(TP a, TP b, TP c)           \
+  { \
+    return TPROOT##_new( \
+        fma(a.real, b.real, c.real) - a.imag*b.imag, \
+        fma(a.imag, b.real, fma(a.real, b.imag, c.imag))); \
+  } \
+  /* Complex product a*b. */ \
+  inline TP TPROOT##_mul(TP a, TP b)            \
+  { \
+    return TPROOT##_new( \
+        a.real*b.real - a.imag*b.imag, \
+        a.real*b.imag + a.imag*b.real); \
+  } \
+  /* complex * real: scales both components of a by b. */ \
+  inline TP TPROOT##_mulr(TP a, REAL_TP b)      \
+  { \
+    return TPROOT##_new(a.real*b, a.imag*b); \
+  } \
+  /* real * complex: scales both components of b by a. */ \
+  inline TP TPROOT##_rmul(REAL_TP a, TP b)      \
+  { \
+    return TPROOT##_new(a*b.real, a*b.imag); \
+  } \
+  /* real / complex (z1 / z2): the ratio is always formed with the larger-magnitude component of z2 as divisor. */ \
+  inline TP TPROOT##_rdivide(REAL_TP z1, TP z2) \
+  { \
+    if (fabs(z2.real) <= fabs(z2.imag)) { \
+      REAL_TP ratio = z2.real / z2.imag; \
+      REAL_TP denom = z2.imag * (1 + ratio * ratio); \
+      return TPROOT##_new((z1 * ratio) / denom, - z1 / denom); \
+    } \
+    else { \
+      REAL_TP ratio = z2.imag / z2.real; \
+      REAL_TP denom = z2.real * (1 + ratio * ratio); \
+      return TPROOT##_new(z1 / denom, - (z1 * ratio) / denom); \
+    } \
+  } \
+  /* complex / complex (z1 / z2): the branch picks the larger-magnitude component of z2 as divisor and sets a..d so one shared formula serves both cases. */ \
+  inline TP TPROOT##_divide(TP z1, TP z2)       \
+  { \
+    REAL_TP ratio, denom, a, b, c, d; \
+    \
+    if (fabs(z2.real) <= fabs(z2.imag)) { \
+      ratio = z2.real / z2.imag; \
+      denom = z2.imag; \
+      a = z1.imag; \
+      b = z1.real; \
+      c = -z1.real; \
+      d = z1.imag; \
+    } \
+    else { \
+      ratio = z2.imag / z2.real; \
+      denom = z2.real; \
+      a = z1.real; \
+      b = z1.imag; \
+      c = z1.imag; \
+      d = -z1.real; \
+    } \
+    denom *= (1 + ratio * ratio); \
+    return TPROOT##_new( \
+       (a + b * ratio) / denom, \
+       (c + d * ratio) / denom); \
+  } \
+  /* complex / real: divides both components of a by b. */ \
+  inline TP TPROOT##_divider(TP a, REAL_TP b)   \
+  { \
+    return TPROOT##_new(a.real/b, a.imag/b); \
+  } \
+  /* Complex a raised to complex b: x is the modulus and y the argument of exp(b * log(a)). */ \
+  inline TP TPROOT##_pow(TP a, TP b)            \
+  { \
+    REAL_TP logr = log(hypot(a.real, a.imag)); \
+    REAL_TP logi = atan2(a.imag, a.real); \
+    REAL_TP x = exp(logr * b.real - logi * b.imag); \
+    REAL_TP y = logr * b.imag + logi * b.real; \
+    \
+    REAL_TP cosy; \
+    REAL_TP siny = sincos(y, &cosy); /* OpenCL sincos returns the sine and stores the cosine through the pointer */ \
+    return TPROOT##_new(x*cosy, x*siny); \
+  } \
+  /* Complex a raised to real b, via the modulus and argument of a. */ \
+  inline TP TPROOT##_powr(TP a, REAL_TP b)      \
+  { \
+    REAL_TP logr = log(hypot(a.real, a.imag)); \
+    REAL_TP logi = atan2(a.imag, a.real); \
+    REAL_TP x = exp(logr * b); \
+    REAL_TP y = logi * b; \
+    \
+    REAL_TP cosy; \
+    REAL_TP siny = sincos(y, &cosy); \
+    \
+    return TPROOT##_new(x * cosy, x*siny); \
+  } \
+  /* Real a raised to complex b; log(a) is taken directly on the real base. */ \
+  inline TP TPROOT##_rpow(REAL_TP a, TP b)      \
+  { \
+    REAL_TP logr = log(a); \
+    REAL_TP x = exp(logr * b.real); \
+    REAL_TP y = logr * b.imag; \
+    \
+    REAL_TP cosy; \
+    REAL_TP siny = sincos(y, &cosy); \
+    return TPROOT##_new(x * cosy, x * siny); \
+  } \
+  /* Square root: zero magnitude gives (0, 0); otherwise one component comes from sqrt() and the other from im / (2 * that component), chosen by the sign of re. */ \
+  inline TP TPROOT##_sqrt(TP a)                 \
+  { \
+    REAL_TP re = a.real; \
+    REAL_TP im = a.imag; \
+    REAL_TP mag = hypot(re, im); \
+    TP result; \
+    \
+    if (mag == 0.f) { \
+      result.real = result.imag = 0.f; \
+    } else if (re > 0.f) { \
+      result.real = sqrt(0.5f * (mag + re)); \
+      result.imag = im/result.real/2.f; \
+    } else { \
+      result.imag = sqrt(0.5f * (mag - re)); \
+      if (im < 0.f) \
+        result.imag = - result.imag; \
+      result.real = im/result.imag/2.f; \
+    } \
+    return result; \
+  } \
+  /* exp(a) = exp(a.real) * (cos(a.imag) + i*sin(a.imag)). */ \
+  inline TP TPROOT##_exp(TP a) \
+  { \
+    REAL_TP expr = exp(a.real); \
+    REAL_TP cosi; \
+    REAL_TP sini = sincos(a.imag, &cosi); \
+    return TPROOT##_new(expr * cosi, expr * sini); \
+  } \
+  /* log(a): real part is log of the magnitude, imaginary part is atan2(a.imag, a.real). */ \
+  inline TP TPROOT##_log(TP a)                                                 \
+  { return TPROOT##_new(log(hypot(a.real, a.imag)), atan2(a.imag, a.real)); } \
+  /* sin(a) = sin(re)*cosh(im) + i*cos(re)*sinh(im). */ \
+  inline TP TPROOT##_sin(TP a) \
+  { \
+    REAL_TP cosr; \
+    REAL_TP sinr = sincos(a.real, &cosr); \
+    return TPROOT##_new(sinr*cosh(a.imag), cosr*sinh(a.imag)); \
+  } \
+  /* cos(a) = cos(re)*cosh(im) - i*sin(re)*sinh(im). */ \
+  inline TP TPROOT##_cos(TP a) \
+  { \
+    REAL_TP cosr; \
+    REAL_TP sinr = sincos(a.real, &cosr); \
+    return TPROOT##_new(cosr*cosh(a.imag), -sinr*sinh(a.imag)); \
+  } \
+  /* tan(a) = (sin(2*re) + i*sinh(2*im)) / (cos(2*re) + cosh(2*im)); returns (0, +-1) once |2*im| exceeds log(REAL_3LTR##_MAX). */ \
+  inline TP TPROOT##_tan(TP a) \
+  { \
+    REAL_TP re2 = 2.f * a.real; \
+    REAL_TP im2 = 2.f * a.imag; \
+    \
+    const REAL_TP limit = log(REAL_3LTR##_MAX); \
+    \
+    if (fabs(im2) > limit) \
+      return TPROOT##_new(0.f, (im2 > 0 ? 1.f : -1.f)); \
+    else \
+    { \
+      REAL_TP den = cos(re2) + cosh(im2); \
+      return TPROOT##_new(sin(re2) / den, sinh(im2) / den); \
+    } \
+  } \
+  /* sinh(a) = sinh(re)*cos(im) + i*cosh(re)*sin(im). */ \
+  inline TP TPROOT##_sinh(TP a) \
+  { \
+    REAL_TP cosi; \
+    REAL_TP sini = sincos(a.imag, &cosi); \
+    return TPROOT##_new(sinh(a.real)*cosi, cosh(a.real)*sini); \
+  } \
+  /* cosh(a) = cosh(re)*cos(im) + i*sinh(re)*sin(im). */ \
+  inline TP TPROOT##_cosh(TP a) \
+  { \
+    REAL_TP cosi; \
+    REAL_TP sini = sincos(a.imag, &cosi); \
+    return TPROOT##_new(cosh(a.real)*cosi, sinh(a.real)*sini); \
+  } \
+  /* tanh(a) = (sinh(2*re) + i*sin(2*im)) / (cosh(2*re) + cos(2*im)); returns (+-1, 0) once |2*re| exceeds log(REAL_3LTR##_MAX). */ \
+  inline TP TPROOT##_tanh(TP a) \
+  { \
+    REAL_TP re2 = 2.f * a.real; \
+    REAL_TP im2 = 2.f * a.imag; \
+    \
+    const REAL_TP limit = log(REAL_3LTR##_MAX); \
+    \
+    if (fabs(re2) > limit) \
+      return TPROOT##_new((re2 > 0 ? 1.f : -1.f), 0.f); \
+    else \
+    { \
+      REAL_TP den = cosh(re2) + cos(im2); \
+      return TPROOT##_new(sinh(re2) / den, sin(im2) / den); \
+    } \
+  } \
+// This is undocumented and may disappear at any time
+// PYOPENCL_COMPLEX_ALIGNMENT(TYPE) is the alignment requested for a complex
+// type built from TYPE: twice the component size when
+// PYOPENCL_COMPLEX_ENABLE_EXTENDED_ALIGNMENT evaluates to nonzero, the
+// component size otherwise. Both expansions are parenthesized so the macro
+// stays a single operand next to operators such as '/' or '%'.
+#if PYOPENCL_COMPLEX_ENABLE_EXTENDED_ALIGNMENT
+#define PYOPENCL_COMPLEX_ALIGNMENT(TYPE) (2*sizeof(TYPE))
+#else
+#define PYOPENCL_COMPLEX_ALIGNMENT(TYPE) (sizeof(TYPE))
+#endif
+#define PYOPENCL_DECLARE_COMPLEX_TYPE(BASE, BASE_3LTR) /* declares the union type c<BASE>_t and then its c<BASE>_<op> function family */ \
+  typedef union \
+  { /* the two unnamed structs overlay each other, so .x/.y and .real/.imag name the same two BASE values */ \
+    struct { BASE x, y; } \
+      __attribute__ ((aligned (PYOPENCL_COMPLEX_ALIGNMENT(BASE)))); \
+    struct { BASE real, imag; } \
+      __attribute__ ((aligned (PYOPENCL_COMPLEX_ALIGNMENT(BASE)))); \
+  } c##BASE##_t; \
+  /* BASE_3LTR is forwarded unchanged as the REAL_3LTR argument of the function-family macro */ \
+  PYOPENCL_DECLARE_COMPLEX_TYPE_INT(BASE, BASE_3LTR, c##BASE, c##BASE##_t)
+PYOPENCL_DECLARE_COMPLEX_TYPE(float, FLT); /* defines cfloat_t and the cfloat_<op> functions */
+#define cfloat_cast(a) cfloat_new((a).real, (a).imag) /* rebuilds a cfloat_t from any value with .real/.imag members; note that 'a' is evaluated twice */
+#ifdef PYOPENCL_DEFINE_CDOUBLE /* the double-precision variant is only declared on request */
+PYOPENCL_DECLARE_COMPLEX_TYPE(double, DBL); /* defines cdouble_t and the cdouble_<op> functions */
+#define cdouble_cast(a) cdouble_new((a).real, (a).imag) /* same as cfloat_cast, producing a cdouble_t; 'a' is evaluated twice */
+#endif /* PYOPENCL_DEFINE_CDOUBLE */
+#undef PYOPENCL_COMPLEX_ALIGNMENT /* the alignment helper is not left defined past this point */

pyopencl/cl/pyopencl-eval-tbl.cl ADDED Viewed

@@ -0,0 +1,120 @@
+//  Pieced together from Boost C++ and Cephes by
+//  Andreas Kloeckner (C) 2012
+//
+//  Pieces from:
+//
+//  Copyright (c) 2006 Xiaogang Zhang, John Maddock
+//  Use, modification and distribution are subject to the
+//  Boost Software License, Version 1.0. (See
+//  http://www.boost.org/LICENSE_1_0.txt)
+//
+// Cephes Math Library Release 2.8:  June, 2000
+// Copyright 1984, 1987, 1989, 1992, 2000 by Stephen L. Moshier
+// What you see here may be used freely, but it comes with no support or
+// guarantee.
+#pragma once
+typedef double special_func_scalar_type; /* scalar type used for the arguments, coefficients and results of the evaluators below */
+// {{{ cephes_polevl
+/*
+ * DESCRIPTION:
+ *
+ * Evaluates polynomial of degree N:
+ *
+ *                     2          N
+ * y  =  C  + C x + C x  +...+ C x
+ *        0    1     2          N
+ *
+ * Coefficients are stored in reverse order:
+ *
+ * coef[0] = C  , ..., coef[N] = C  .
+ *            N                   0
+ *
+ *  The function p1evl() assumes that the leading coefficient (the one
+ * multiplying x^N) is 1.0 and is omitted from the array.  Its calling
+ * arguments are otherwise the same as polevl().
+ *
+ */
+// Evaluates a polynomial of degree N at x by Horner's rule.
+//
+// coef points at N+1 coefficients stored highest power first: coef[0]
+// multiplies x^N and coef[N] is the constant term. Returns the polynomial
+// value.
+//
+// The loop is tested before each step, so N == 0 returns coef[0] without
+// reading past it. A do/while would execute once more in that case, read
+// coef[1], and then keep running with a negative counter.
+special_func_scalar_type cephes_polevl(special_func_scalar_type x, __constant const special_func_scalar_type *coef, int N)
+{
+  __constant const special_func_scalar_type *p = coef;
+  special_func_scalar_type ans = *p++;
+  int i;
+  for (i = N; i > 0; --i)
+    ans = ans * x  +  *p++;
+  return( ans );
+}
+// }}}
+// {{{ cephes_p1evl
+// Evaluates a polynomial of degree N at x whose leading coefficient is 1.
+//
+// coef points at the remaining N coefficients, highest power first; the
+// implied 1.0 multiplying x^N is not stored. N is expected to be at least 1,
+// because coef[0] is always read. Returns the polynomial value.
+//
+// The loop is tested before each step, so N == 1 returns x + coef[0] without
+// reading coef[1]. A do/while would execute once more in that case and then
+// keep running with a negative counter.
+special_func_scalar_type cephes_p1evl( special_func_scalar_type x, __constant const special_func_scalar_type *coef, int N )
+{
+  __constant const special_func_scalar_type *p = coef;
+  special_func_scalar_type ans = x + *p++;
+  int i;
+  for (i = N - 1; i > 0; --i)
+    ans = ans * x  + *p++;
+  return( ans );
+}
+// }}}
+// {{{ boost_evaluate_rational
+// Evaluates the rational function P(z) / Q(z).
+//
+// num and denom each hold count coefficients in ascending powers of z
+// (num[i] multiplies z^i); count must be at least 1 because num[count-1]
+// or num[0] is always read. Returns the quotient of the two polynomial
+// values.
+//
+// For z <= 1 both polynomials are evaluated by Horner's rule in z. For
+// z > 1 they are evaluated in 1/z with the coefficients taken in the
+// opposite order; that scales numerator and denominator by the same power
+// of z, which cancels in the quotient.
+//
+// Both loops use one signed index so the comparison against the signed
+// count never goes through an unsigned conversion.
+special_func_scalar_type boost_evaluate_rational_backend(__constant const special_func_scalar_type* num, __constant const special_func_scalar_type* denom, special_func_scalar_type z, int count)
+{
+   special_func_scalar_type s1, s2;
+   int i;
+   if(z <= 1)
+   {
+      s1 = num[count-1];
+      s2 = denom[count-1];
+      for(i = count - 2; i >= 0; --i)
+      {
+         s1 *= z;
+         s2 *= z;
+         s1 += num[i];
+         s2 += denom[i];
+      }
+   }
+   else
+   {
+      z = 1 / z;
+      s1 = num[0];
+      s2 = denom[0];
+      for(i = 1; i < count; ++i)
+      {
+         s1 *= z;
+         s2 *= z;
+         s1 += num[i];
+         s2 += denom[i];
+      }
+   }
+   return s1 / s2;
+}
+#define boost_evaluate_rational(num, denom, z) /* the coefficient count is derived from sizeof(num), so num has to be an array object at the call site, not a pointer */ \
+  boost_evaluate_rational_backend(num, denom, z, sizeof(num)/sizeof(special_func_scalar_type))
+// }}}
+// vim: fdm=marker