mkl-devel-dpcpp 2025.1.0__py2.py3-none-win_amd64.whl → 2025.3.0__py2.py3-none-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {mkl_devel_dpcpp-2025.1.0.data → mkl_devel_dpcpp-2025.3.0.data}/data/Library/lib/mkl_sycl.lib +0 -0
- {mkl_devel_dpcpp-2025.1.0.data → mkl_devel_dpcpp-2025.3.0.data}/data/Library/lib/mkl_sycl_blas_dll.lib +0 -0
- mkl_devel_dpcpp-2025.3.0.data/data/Library/lib/mkl_sycl_dft_dll.lib +0 -0
- {mkl_devel_dpcpp-2025.1.0.data → mkl_devel_dpcpp-2025.3.0.data}/data/Library/lib/mkl_sycl_dll.lib +0 -0
- mkl_devel_dpcpp-2025.3.0.data/data/Library/lib/mkl_sycl_lapack_dll.lib +0 -0
- {mkl_devel_dpcpp-2025.1.0.data → mkl_devel_dpcpp-2025.3.0.data}/data/Library/lib/mkl_sycl_rng_dll.lib +0 -0
- mkl_devel_dpcpp-2025.3.0.data/data/Library/lib/mkl_sycl_sparse_dll.lib +0 -0
- {mkl_devel_dpcpp-2025.1.0.dist-info → mkl_devel_dpcpp-2025.3.0.dist-info}/METADATA +5 -4
- mkl_devel_dpcpp-2025.3.0.dist-info/RECORD +15 -0
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/bfloat16.hpp +0 -26
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/blas/buffer.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/blas/buffer_decls.hpp +0 -880
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/blas/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/blas/types.hpp +0 -60
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/blas/usm.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/blas/usm_decls.hpp +0 -1240
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/blas.hpp +0 -34
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/dft/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/dft.hpp +0 -254
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/dfti.hpp +0 -22
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/exceptions.hpp +0 -110
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/experimental/data_fitting/interpolate.hpp +0 -67
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/experimental/data_fitting/spline_and_data_params.hpp +0 -68
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/experimental/data_fitting/splines.hpp +0 -177
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/experimental/data_fitting.hpp +0 -22
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/export.hpp +0 -25
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/lapack/concepts.hpp +0 -55
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/lapack/exceptions.hpp +0 -75
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/lapack/lapack.hpp +0 -1096
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/lapack/scratchpad.hpp +0 -107
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/lapack/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/lapack.hpp +0 -24
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/detail/engine_base.hpp +0 -48
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/bernoulli_impl.hpp +0 -89
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/beta_impl.hpp +0 -463
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/bits_impl.hpp +0 -71
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/distribution_base.hpp +0 -85
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/engine_base.hpp +0 -43
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/engine_helpers_base.hpp +0 -54
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/exponential_impl.hpp +0 -116
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/gamma_impl.hpp +0 -285
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/gaussian_impl.hpp +0 -270
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/geometric_impl.hpp +0 -99
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/lognormal_impl.hpp +0 -105
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/mcg31m1_helpers_impl.hpp +0 -117
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/mcg31m1_impl.hpp +0 -223
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/mcg59_helpers_impl.hpp +0 -118
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/mcg59_impl.hpp +0 -266
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/mrg32k3a_helpers_impl.hpp +0 -125
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/mrg32k3a_impl.hpp +0 -385
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/mrg32k3a_skip_ahead_matrix.hpp +0 -3668
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/philox4x32x10_helpers_impl.hpp +0 -141
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/philox4x32x10_impl.hpp +0 -552
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/poisson_impl.hpp +0 -328
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/types.hpp +0 -58
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/uniform_bits_impl.hpp +0 -51
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/uniform_impl.hpp +0 -287
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/detail/vm_wrappers.hpp +0 -183
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/distributions.hpp +0 -700
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/engine_helpers.hpp +0 -116
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/engines.hpp +0 -187
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/functions.hpp +0 -59
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device/types.hpp +0 -79
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/device.hpp +0 -29
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/distributions.hpp +0 -1913
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/engines.hpp +0 -788
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/functions.hpp +0 -163
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/rng.hpp +0 -23
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/spblas/sparse_auxiliary.hpp +0 -111
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/spblas/sparse_operations.hpp +0 -446
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/spblas/sparse_structures.hpp +0 -193
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/spblas/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/spblas.hpp +0 -33
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/stats/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/stats.hpp +0 -357
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/types.hpp +0 -321
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/buffer.hpp +0 -3529
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/decls.hpp +0 -280
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/detail/decls.hpp +0 -81
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/detail/dispatch.hpp +0 -1059
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/detail/ep.hpp +0 -861
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/detail/ha.hpp +0 -860
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/detail/la.hpp +0 -860
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/detail/rts.hpp +0 -4608
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/detail/scalar.hpp +0 -8963
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/device/vm.hpp +0 -460
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/span.hpp +0 -3813
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/spec.hpp +0 -42
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm/usm.hpp +0 -3581
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl/vm.hpp +0 -31
- mkl_devel_dpcpp-2025.1.0.data/data/Library/include/oneapi/mkl.hpp +0 -35
- mkl_devel_dpcpp-2025.1.0.data/data/Library/lib/mkl_sycl_dft_dll.lib +0 -0
- mkl_devel_dpcpp-2025.1.0.data/data/Library/lib/mkl_sycl_lapack_dll.lib +0 -0
- mkl_devel_dpcpp-2025.1.0.data/data/Library/lib/mkl_sycl_sparse_dll.lib +0 -0
- mkl_devel_dpcpp-2025.1.0.dist-info/RECORD +0 -99
- {mkl_devel_dpcpp-2025.1.0.data → mkl_devel_dpcpp-2025.3.0.data}/data/Library/lib/mkl_sycl_data_fitting_dll.lib +0 -0
- {mkl_devel_dpcpp-2025.1.0.data → mkl_devel_dpcpp-2025.3.0.data}/data/Library/lib/mkl_sycl_stats_dll.lib +0 -0
- {mkl_devel_dpcpp-2025.1.0.data → mkl_devel_dpcpp-2025.3.0.data}/data/Library/lib/mkl_sycl_vm_dll.lib +0 -0
- {mkl_devel_dpcpp-2025.1.0.dist-info → mkl_devel_dpcpp-2025.3.0.dist-info}/LICENSE.txt +0 -0
- {mkl_devel_dpcpp-2025.1.0.dist-info → mkl_devel_dpcpp-2025.3.0.dist-info}/WHEEL +0 -0
- {mkl_devel_dpcpp-2025.1.0.dist-info → mkl_devel_dpcpp-2025.3.0.dist-info}/top_level.txt +0 -0
|
@@ -1,880 +0,0 @@
|
|
|
1
|
-
/*******************************************************************************
|
|
2
|
-
* Copyright (C) 2018 Intel Corporation
|
|
3
|
-
*
|
|
4
|
-
* This software and the related documents are Intel copyrighted materials, and
|
|
5
|
-
* your use of them is governed by the express license under which they were
|
|
6
|
-
* provided to you (License). Unless the License provides otherwise, you may not
|
|
7
|
-
* use, modify, copy, publish, distribute, disclose or transmit this software or
|
|
8
|
-
* the related documents without Intel's prior written permission.
|
|
9
|
-
*
|
|
10
|
-
* This software and the related documents are provided as is, with no express
|
|
11
|
-
* or implied warranties, other than those that are expressly stated in the
|
|
12
|
-
* License.
|
|
13
|
-
*******************************************************************************/
|
|
14
|
-
|
|
15
|
-
// Level 3
|
|
16
|
-
|
|
17
|
-
#define ONEMKL_DECLARE_BUF_GEMM(Ta, Tb, Tc, Ts) \
|
|
18
|
-
DLL_EXPORT void gemm(sycl::queue &queue, transpose transa, transpose transb, \
|
|
19
|
-
std::int64_t m, std::int64_t n, std::int64_t k, \
|
|
20
|
-
Ts alpha, sycl::buffer<Ta, 1> &a, std::int64_t lda, \
|
|
21
|
-
sycl::buffer<Tb, 1> &b, std::int64_t ldb, \
|
|
22
|
-
Ts beta, sycl::buffer<Tc, 1> &c, std::int64_t ldc, \
|
|
23
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
24
|
-
|
|
25
|
-
ONEMKL_DECLARE_BUF_GEMM(float, float, float, float)
|
|
26
|
-
ONEMKL_DECLARE_BUF_GEMM(double, double, double, double)
|
|
27
|
-
ONEMKL_DECLARE_BUF_GEMM(std::complex<float>, std::complex<float>, std::complex<float>, std::complex<float>)
|
|
28
|
-
ONEMKL_DECLARE_BUF_GEMM(std::complex<double>, std::complex<double>, std::complex<double>, std::complex<double>)
|
|
29
|
-
ONEMKL_DECLARE_BUF_GEMM(sycl::half, sycl::half, sycl::half, sycl::half)
|
|
30
|
-
ONEMKL_DECLARE_BUF_GEMM(sycl::half, sycl::half, float, float)
|
|
31
|
-
ONEMKL_DECLARE_BUF_GEMM(bfloat16, bfloat16, bfloat16, float)
|
|
32
|
-
ONEMKL_DECLARE_BUF_GEMM(bfloat16, bfloat16, float, float)
|
|
33
|
-
ONEMKL_DECLARE_BUF_GEMM(std::int8_t, std::int8_t, std::int32_t, float)
|
|
34
|
-
ONEMKL_DECLARE_BUF_GEMM(std::int8_t, std::int8_t, float, float)
|
|
35
|
-
|
|
36
|
-
#undef ONEMKL_DECLARE_BUF_GEMM
|
|
37
|
-
|
|
38
|
-
#define ONEMKL_DECLARE_BUF_SYMM(T) \
|
|
39
|
-
DLL_EXPORT void symm(sycl::queue &queue, side left_right, uplo upper_lower, std::int64_t m, std::int64_t n, \
|
|
40
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
41
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, T beta, sycl::buffer<T, 1> &c, \
|
|
42
|
-
std::int64_t ldc, compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
43
|
-
|
|
44
|
-
ONEMKL_DECLARE_BUF_SYMM(float)
|
|
45
|
-
ONEMKL_DECLARE_BUF_SYMM(double)
|
|
46
|
-
ONEMKL_DECLARE_BUF_SYMM(std::complex<float>)
|
|
47
|
-
ONEMKL_DECLARE_BUF_SYMM(std::complex<double>)
|
|
48
|
-
|
|
49
|
-
#undef ONEMKL_DECLARE_BUF_SYMM
|
|
50
|
-
|
|
51
|
-
#define ONEMKL_DECLARE_BUF_HEMM(T) \
|
|
52
|
-
DLL_EXPORT void hemm(sycl::queue &queue, side left_right, uplo upper_lower, std::int64_t m, std::int64_t n, \
|
|
53
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
54
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, T beta, sycl::buffer<T, 1> &c, \
|
|
55
|
-
std::int64_t ldc, compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
56
|
-
|
|
57
|
-
ONEMKL_DECLARE_BUF_HEMM(std::complex<float>)
|
|
58
|
-
ONEMKL_DECLARE_BUF_HEMM(std::complex<double>)
|
|
59
|
-
|
|
60
|
-
#undef ONEMKL_DECLARE_BUF_HEMM
|
|
61
|
-
|
|
62
|
-
#define ONEMKL_DECLARE_BUF_SYRK(T) \
|
|
63
|
-
DLL_EXPORT void syrk(sycl::queue &queue, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, \
|
|
64
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
65
|
-
T beta, sycl::buffer<T, 1> &c, std::int64_t ldc, \
|
|
66
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
67
|
-
|
|
68
|
-
ONEMKL_DECLARE_BUF_SYRK(float)
|
|
69
|
-
ONEMKL_DECLARE_BUF_SYRK(double)
|
|
70
|
-
ONEMKL_DECLARE_BUF_SYRK(std::complex<float>)
|
|
71
|
-
ONEMKL_DECLARE_BUF_SYRK(std::complex<double>)
|
|
72
|
-
|
|
73
|
-
#undef ONEMKL_DECLARE_BUF_SYRK
|
|
74
|
-
|
|
75
|
-
#define ONEMKL_DECLARE_BUF_HERK(T, Treal) \
|
|
76
|
-
DLL_EXPORT void herk(sycl::queue &queue, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, \
|
|
77
|
-
Treal alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
78
|
-
Treal beta, sycl::buffer<T, 1> &c, std::int64_t ldc, \
|
|
79
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
80
|
-
|
|
81
|
-
ONEMKL_DECLARE_BUF_HERK(std::complex<float>, float)
|
|
82
|
-
ONEMKL_DECLARE_BUF_HERK(std::complex<double>, double)
|
|
83
|
-
|
|
84
|
-
#undef ONEMKL_DECLARE_BUF_HERK
|
|
85
|
-
|
|
86
|
-
#define ONEMKL_DECLARE_BUF_SYR2K(T) \
|
|
87
|
-
DLL_EXPORT void syr2k(sycl::queue &queue, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, \
|
|
88
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
89
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
90
|
-
T beta, sycl::buffer<T, 1> &c, std::int64_t ldc, \
|
|
91
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
92
|
-
|
|
93
|
-
ONEMKL_DECLARE_BUF_SYR2K(float)
|
|
94
|
-
ONEMKL_DECLARE_BUF_SYR2K(double)
|
|
95
|
-
ONEMKL_DECLARE_BUF_SYR2K(std::complex<float>)
|
|
96
|
-
ONEMKL_DECLARE_BUF_SYR2K(std::complex<double>)
|
|
97
|
-
|
|
98
|
-
#undef ONEMKL_DECLARE_BUF_SYR2K
|
|
99
|
-
|
|
100
|
-
#define ONEMKL_DECLARE_BUF_HER2K(T, Treal) \
|
|
101
|
-
DLL_EXPORT void her2k(sycl::queue &queue, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, \
|
|
102
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
103
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
104
|
-
Treal beta, sycl::buffer<T, 1> &c, std::int64_t ldc, \
|
|
105
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
106
|
-
|
|
107
|
-
ONEMKL_DECLARE_BUF_HER2K(std::complex<float>, float)
|
|
108
|
-
ONEMKL_DECLARE_BUF_HER2K(std::complex<double>, double)
|
|
109
|
-
|
|
110
|
-
#undef ONEMKL_DECLARE_BUF_HER2K
|
|
111
|
-
|
|
112
|
-
#define ONEMKL_DECLARE_BUF_TRMM(T) \
|
|
113
|
-
DLL_EXPORT void trmm(sycl::queue &queue, side left_right, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
114
|
-
std::int64_t m, std::int64_t n, \
|
|
115
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
116
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
117
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
118
|
-
|
|
119
|
-
ONEMKL_DECLARE_BUF_TRMM(float)
|
|
120
|
-
ONEMKL_DECLARE_BUF_TRMM(double)
|
|
121
|
-
ONEMKL_DECLARE_BUF_TRMM(std::complex<float>)
|
|
122
|
-
ONEMKL_DECLARE_BUF_TRMM(std::complex<double>)
|
|
123
|
-
|
|
124
|
-
#undef ONEMKL_DECLARE_BUF_TRMM
|
|
125
|
-
|
|
126
|
-
#define ONEMKL_DECLARE_BUF_TRMM_OOP(T) \
|
|
127
|
-
DLL_EXPORT void trmm(sycl::queue &queue, side left_right, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
128
|
-
std::int64_t m, std::int64_t n, \
|
|
129
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
130
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
131
|
-
T beta, sycl::buffer<T, 1> &c, std::int64_t ldc, \
|
|
132
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
133
|
-
|
|
134
|
-
ONEMKL_DECLARE_BUF_TRMM_OOP(float)
|
|
135
|
-
ONEMKL_DECLARE_BUF_TRMM_OOP(double)
|
|
136
|
-
ONEMKL_DECLARE_BUF_TRMM_OOP(std::complex<float>)
|
|
137
|
-
ONEMKL_DECLARE_BUF_TRMM_OOP(std::complex<double>)
|
|
138
|
-
|
|
139
|
-
#undef ONEMKL_DECLARE_BUF_TRMM_OOP
|
|
140
|
-
|
|
141
|
-
#define ONEMKL_DECLARE_BUF_TRSM(T) \
|
|
142
|
-
DLL_EXPORT void trsm(sycl::queue &queue, side left_right, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
143
|
-
std::int64_t m, std::int64_t n, \
|
|
144
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
145
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
146
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
147
|
-
|
|
148
|
-
ONEMKL_DECLARE_BUF_TRSM(float)
|
|
149
|
-
ONEMKL_DECLARE_BUF_TRSM(double)
|
|
150
|
-
ONEMKL_DECLARE_BUF_TRSM(std::complex<float>)
|
|
151
|
-
ONEMKL_DECLARE_BUF_TRSM(std::complex<double>)
|
|
152
|
-
|
|
153
|
-
#undef ONEMKL_DECLARE_BUF_TRSM
|
|
154
|
-
|
|
155
|
-
#define ONEMKL_DECLARE_BUF_TRSM_OOP(T) \
|
|
156
|
-
DLL_EXPORT void trsm(sycl::queue &queue, side left_right, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
157
|
-
std::int64_t m, std::int64_t n, \
|
|
158
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
159
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
160
|
-
T beta, sycl::buffer<T, 1> &c, std::int64_t ldc, \
|
|
161
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
162
|
-
|
|
163
|
-
ONEMKL_DECLARE_BUF_TRSM_OOP(float)
|
|
164
|
-
ONEMKL_DECLARE_BUF_TRSM_OOP(double)
|
|
165
|
-
ONEMKL_DECLARE_BUF_TRSM_OOP(std::complex<float>)
|
|
166
|
-
ONEMKL_DECLARE_BUF_TRSM_OOP(std::complex<double>)
|
|
167
|
-
|
|
168
|
-
#undef ONEMKL_DECLARE_BUF_TRSM_OOP
|
|
169
|
-
|
|
170
|
-
// Level 2
|
|
171
|
-
|
|
172
|
-
#define ONEMKL_DECLARE_BUF_DGMM(T) \
|
|
173
|
-
DLL_EXPORT void dgmm(sycl::queue &queue, side left_right, \
|
|
174
|
-
std::int64_t m, std::int64_t n, \
|
|
175
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
176
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
177
|
-
sycl::buffer<T, 1> &c, std::int64_t ldc);
|
|
178
|
-
|
|
179
|
-
ONEMKL_DECLARE_BUF_DGMM(float)
|
|
180
|
-
ONEMKL_DECLARE_BUF_DGMM(double)
|
|
181
|
-
ONEMKL_DECLARE_BUF_DGMM(std::complex<float>)
|
|
182
|
-
ONEMKL_DECLARE_BUF_DGMM(std::complex<double>)
|
|
183
|
-
|
|
184
|
-
#undef ONEMKL_DECLARE_BUF_DGMM
|
|
185
|
-
|
|
186
|
-
#define ONEMKL_DECLARE_BUF_GEMV(T) \
|
|
187
|
-
DLL_EXPORT void gemv(sycl::queue &queue, transpose trans, std::int64_t m, std::int64_t n, T alpha, \
|
|
188
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
189
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
190
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
191
|
-
|
|
192
|
-
ONEMKL_DECLARE_BUF_GEMV(float)
|
|
193
|
-
ONEMKL_DECLARE_BUF_GEMV(double)
|
|
194
|
-
ONEMKL_DECLARE_BUF_GEMV(std::complex<float>)
|
|
195
|
-
ONEMKL_DECLARE_BUF_GEMV(std::complex<double>)
|
|
196
|
-
|
|
197
|
-
#undef ONEMKL_DECLARE_BUF_GEMV
|
|
198
|
-
|
|
199
|
-
#define ONEMKL_DECLARE_BUF_GBMV(T) \
|
|
200
|
-
DLL_EXPORT void gbmv(sycl::queue &queue, transpose trans, std::int64_t m, std::int64_t n, std::int64_t kl, std::int64_t ku, T alpha, \
|
|
201
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
202
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
203
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
204
|
-
|
|
205
|
-
ONEMKL_DECLARE_BUF_GBMV(float)
|
|
206
|
-
ONEMKL_DECLARE_BUF_GBMV(double)
|
|
207
|
-
ONEMKL_DECLARE_BUF_GBMV(std::complex<float>)
|
|
208
|
-
ONEMKL_DECLARE_BUF_GBMV(std::complex<double>)
|
|
209
|
-
|
|
210
|
-
#undef ONEMKL_DECLARE_BUF_GBMV
|
|
211
|
-
|
|
212
|
-
#define ONEMKL_DECLARE_BUF_GER(T) \
|
|
213
|
-
DLL_EXPORT void ger(sycl::queue &queue, std::int64_t m, std::int64_t n, T alpha, \
|
|
214
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
215
|
-
sycl::buffer<T, 1> &a, std::int64_t lda);
|
|
216
|
-
|
|
217
|
-
ONEMKL_DECLARE_BUF_GER(float)
|
|
218
|
-
ONEMKL_DECLARE_BUF_GER(double)
|
|
219
|
-
|
|
220
|
-
#undef ONEMKL_DECLARE_BUF_GER
|
|
221
|
-
|
|
222
|
-
#define ONEMKL_DECLARE_BUF_GERC(T) \
|
|
223
|
-
DLL_EXPORT void gerc(sycl::queue &queue, std::int64_t m, std::int64_t n, T alpha, \
|
|
224
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
225
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
226
|
-
sycl::buffer<T, 1> &a, std::int64_t lda);
|
|
227
|
-
|
|
228
|
-
ONEMKL_DECLARE_BUF_GERC(std::complex<float>)
|
|
229
|
-
ONEMKL_DECLARE_BUF_GERC(std::complex<double>)
|
|
230
|
-
|
|
231
|
-
#undef ONEMKL_DECLARE_BUF_GERC
|
|
232
|
-
|
|
233
|
-
#define ONEMKL_DECLARE_BUF_GERU(T) \
|
|
234
|
-
DLL_EXPORT void geru(sycl::queue &queue, std::int64_t m, std::int64_t n, T alpha, \
|
|
235
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
236
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
237
|
-
sycl::buffer<T, 1> &a, std::int64_t lda);
|
|
238
|
-
|
|
239
|
-
ONEMKL_DECLARE_BUF_GERU(std::complex<float>)
|
|
240
|
-
ONEMKL_DECLARE_BUF_GERU(std::complex<double>)
|
|
241
|
-
|
|
242
|
-
#undef ONEMKL_DECLARE_BUF_GERU
|
|
243
|
-
|
|
244
|
-
#define ONEMKL_DECLARE_BUF_HBMV(T) \
|
|
245
|
-
DLL_EXPORT void hbmv(sycl::queue &queue, uplo upper_lower, std::int64_t n, std::int64_t k, T alpha, \
|
|
246
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
247
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
248
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
249
|
-
|
|
250
|
-
ONEMKL_DECLARE_BUF_HBMV(std::complex<float>)
|
|
251
|
-
ONEMKL_DECLARE_BUF_HBMV(std::complex<double>)
|
|
252
|
-
|
|
253
|
-
#undef ONEMKL_DECLARE_BUF_HBMV
|
|
254
|
-
|
|
255
|
-
#define ONEMKL_DECLARE_BUF_HEMV(T) \
|
|
256
|
-
DLL_EXPORT void hemv(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
257
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
258
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
259
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
260
|
-
|
|
261
|
-
ONEMKL_DECLARE_BUF_HEMV(std::complex<float>)
|
|
262
|
-
ONEMKL_DECLARE_BUF_HEMV(std::complex<double>)
|
|
263
|
-
|
|
264
|
-
#undef ONEMKL_DECLARE_BUF_HEMV
|
|
265
|
-
|
|
266
|
-
#define ONEMKL_DECLARE_BUF_HER(T, Treal) \
|
|
267
|
-
DLL_EXPORT void her(sycl::queue &queue, uplo upper_lower, std::int64_t n, Treal alpha, \
|
|
268
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
269
|
-
sycl::buffer<T, 1> &a, std::int64_t lda); \
|
|
270
|
-
|
|
271
|
-
ONEMKL_DECLARE_BUF_HER(std::complex<float>, float)
|
|
272
|
-
ONEMKL_DECLARE_BUF_HER(std::complex<double>, double)
|
|
273
|
-
|
|
274
|
-
#undef ONEMKL_DECLARE_BUF_HER
|
|
275
|
-
|
|
276
|
-
#define ONEMKL_DECLARE_BUF_HER2(T) \
|
|
277
|
-
DLL_EXPORT void her2(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
278
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
279
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
280
|
-
sycl::buffer<T, 1> &a, std::int64_t lda);
|
|
281
|
-
|
|
282
|
-
ONEMKL_DECLARE_BUF_HER2(std::complex<float>)
|
|
283
|
-
ONEMKL_DECLARE_BUF_HER2(std::complex<double>)
|
|
284
|
-
|
|
285
|
-
#undef ONEMKL_DECLARE_BUF_HER2
|
|
286
|
-
|
|
287
|
-
#define ONEMKL_DECLARE_BUF_HPMV(T) \
|
|
288
|
-
DLL_EXPORT void hpmv(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
289
|
-
sycl::buffer<T, 1> &a, \
|
|
290
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
291
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
292
|
-
|
|
293
|
-
ONEMKL_DECLARE_BUF_HPMV(std::complex<float>)
|
|
294
|
-
ONEMKL_DECLARE_BUF_HPMV(std::complex<double>)
|
|
295
|
-
|
|
296
|
-
#undef ONEMKL_DECLARE_BUF_HPMV
|
|
297
|
-
|
|
298
|
-
#define ONEMKL_DECLARE_BUF_HPR(T, Treal) \
|
|
299
|
-
DLL_EXPORT void hpr(sycl::queue &queue, uplo upper_lower, std::int64_t n, Treal alpha, \
|
|
300
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
301
|
-
sycl::buffer<T, 1> &a);
|
|
302
|
-
|
|
303
|
-
ONEMKL_DECLARE_BUF_HPR(std::complex<float>, float)
|
|
304
|
-
ONEMKL_DECLARE_BUF_HPR(std::complex<double>, double)
|
|
305
|
-
|
|
306
|
-
#undef ONEMKL_DECLARE_BUF_HPR
|
|
307
|
-
|
|
308
|
-
#define ONEMKL_DECLARE_BUF_HPR2(T) \
|
|
309
|
-
DLL_EXPORT void hpr2(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
310
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
311
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
312
|
-
sycl::buffer<T, 1> &a);
|
|
313
|
-
|
|
314
|
-
ONEMKL_DECLARE_BUF_HPR2(std::complex<float>)
|
|
315
|
-
ONEMKL_DECLARE_BUF_HPR2(std::complex<double>)
|
|
316
|
-
|
|
317
|
-
#undef ONEMKL_DECLARE_BUF_HPR2
|
|
318
|
-
|
|
319
|
-
#define ONEMKL_DECLARE_BUF_SBMV(T) \
|
|
320
|
-
DLL_EXPORT void sbmv(sycl::queue &queue, uplo upper_lower, std::int64_t n, std::int64_t k, T alpha, \
|
|
321
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
322
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
323
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
324
|
-
|
|
325
|
-
ONEMKL_DECLARE_BUF_SBMV(float)
|
|
326
|
-
ONEMKL_DECLARE_BUF_SBMV(double)
|
|
327
|
-
|
|
328
|
-
#undef ONEMKL_DECLARE_BUF_SBMV
|
|
329
|
-
|
|
330
|
-
#define ONEMKL_DECLARE_BUF_SYMV(T) \
|
|
331
|
-
DLL_EXPORT void symv(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
332
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
333
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
334
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
335
|
-
|
|
336
|
-
ONEMKL_DECLARE_BUF_SYMV(float)
|
|
337
|
-
ONEMKL_DECLARE_BUF_SYMV(double)
|
|
338
|
-
ONEMKL_DECLARE_BUF_SYMV(std::complex<float>)
|
|
339
|
-
ONEMKL_DECLARE_BUF_SYMV(std::complex<double>)
|
|
340
|
-
|
|
341
|
-
#undef ONEMKL_DECLARE_BUF_SYMV
|
|
342
|
-
|
|
343
|
-
#define ONEMKL_DECLARE_BUF_SYR(T) \
|
|
344
|
-
DLL_EXPORT void syr(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
345
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
346
|
-
sycl::buffer<T, 1> &a, std::int64_t lda);
|
|
347
|
-
|
|
348
|
-
ONEMKL_DECLARE_BUF_SYR(float)
|
|
349
|
-
ONEMKL_DECLARE_BUF_SYR(double)
|
|
350
|
-
ONEMKL_DECLARE_BUF_SYR(std::complex<float>)
|
|
351
|
-
ONEMKL_DECLARE_BUF_SYR(std::complex<double>)
|
|
352
|
-
|
|
353
|
-
#undef ONEMKL_DECLARE_BUF_SYR
|
|
354
|
-
|
|
355
|
-
#define ONEMKL_DECLARE_BUF_SYR2(T) \
|
|
356
|
-
DLL_EXPORT void syr2(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
357
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
358
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
359
|
-
sycl::buffer<T, 1> &a, std::int64_t lda);
|
|
360
|
-
|
|
361
|
-
ONEMKL_DECLARE_BUF_SYR2(float)
|
|
362
|
-
ONEMKL_DECLARE_BUF_SYR2(double)
|
|
363
|
-
ONEMKL_DECLARE_BUF_SYR2(std::complex<float>)
|
|
364
|
-
ONEMKL_DECLARE_BUF_SYR2(std::complex<double>)
|
|
365
|
-
|
|
366
|
-
#undef ONEMKL_DECLARE_BUF_SYR2
|
|
367
|
-
|
|
368
|
-
#define ONEMKL_DECLARE_BUF_SPMV(T) \
|
|
369
|
-
DLL_EXPORT void spmv(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
370
|
-
sycl::buffer<T, 1> &a, \
|
|
371
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, T beta, \
|
|
372
|
-
sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
373
|
-
|
|
374
|
-
ONEMKL_DECLARE_BUF_SPMV(float)
|
|
375
|
-
ONEMKL_DECLARE_BUF_SPMV(double)
|
|
376
|
-
|
|
377
|
-
#undef ONEMKL_DECLARE_BUF_SPMV
|
|
378
|
-
|
|
379
|
-
#define ONEMKL_DECLARE_BUF_SPR(T) \
|
|
380
|
-
DLL_EXPORT void spr(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
381
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
382
|
-
sycl::buffer<T, 1> &a);
|
|
383
|
-
|
|
384
|
-
ONEMKL_DECLARE_BUF_SPR(float)
|
|
385
|
-
ONEMKL_DECLARE_BUF_SPR(double)
|
|
386
|
-
|
|
387
|
-
#undef ONEMKL_DECLARE_BUF_SPR
|
|
388
|
-
|
|
389
|
-
#define ONEMKL_DECLARE_BUF_SPR2(T) \
|
|
390
|
-
DLL_EXPORT void spr2(sycl::queue &queue, uplo upper_lower, std::int64_t n, T alpha, \
|
|
391
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, \
|
|
392
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
393
|
-
sycl::buffer<T, 1> &a);
|
|
394
|
-
|
|
395
|
-
ONEMKL_DECLARE_BUF_SPR2(float)
|
|
396
|
-
ONEMKL_DECLARE_BUF_SPR2(double)
|
|
397
|
-
|
|
398
|
-
#undef ONEMKL_DECLARE_BUF_SPR2
|
|
399
|
-
|
|
400
|
-
#define ONEMKL_DECLARE_BUF_TBMV(T) \
|
|
401
|
-
DLL_EXPORT void tbmv(sycl::queue &queue, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
402
|
-
std::int64_t n, std::int64_t k, \
|
|
403
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
404
|
-
sycl::buffer<T, 1> &x, std::int64_t incx);
|
|
405
|
-
|
|
406
|
-
ONEMKL_DECLARE_BUF_TBMV(float)
|
|
407
|
-
ONEMKL_DECLARE_BUF_TBMV(double)
|
|
408
|
-
ONEMKL_DECLARE_BUF_TBMV(std::complex<float>)
|
|
409
|
-
ONEMKL_DECLARE_BUF_TBMV(std::complex<double>)
|
|
410
|
-
|
|
411
|
-
#undef ONEMKL_DECLARE_BUF_TBMV
|
|
412
|
-
|
|
413
|
-
#define ONEMKL_DECLARE_BUF_TBSV(T) \
|
|
414
|
-
DLL_EXPORT void tbsv(sycl::queue &queue, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
415
|
-
std::int64_t n, std::int64_t k, \
|
|
416
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
417
|
-
sycl::buffer<T, 1> &x, std::int64_t incx);
|
|
418
|
-
|
|
419
|
-
ONEMKL_DECLARE_BUF_TBSV(float)
|
|
420
|
-
ONEMKL_DECLARE_BUF_TBSV(double)
|
|
421
|
-
ONEMKL_DECLARE_BUF_TBSV(std::complex<float>)
|
|
422
|
-
ONEMKL_DECLARE_BUF_TBSV(std::complex<double>)
|
|
423
|
-
|
|
424
|
-
#undef ONEMKL_DECLARE_BUF_TBSV
|
|
425
|
-
|
|
426
|
-
#define ONEMKL_DECLARE_BUF_TPMV(T) \
|
|
427
|
-
DLL_EXPORT void tpmv(sycl::queue &queue, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
428
|
-
std::int64_t n, \
|
|
429
|
-
sycl::buffer<T, 1> &a, \
|
|
430
|
-
sycl::buffer<T, 1> &x, std::int64_t incx);
|
|
431
|
-
|
|
432
|
-
ONEMKL_DECLARE_BUF_TPMV(float)
|
|
433
|
-
ONEMKL_DECLARE_BUF_TPMV(double)
|
|
434
|
-
ONEMKL_DECLARE_BUF_TPMV(std::complex<float>)
|
|
435
|
-
ONEMKL_DECLARE_BUF_TPMV(std::complex<double>)
|
|
436
|
-
|
|
437
|
-
#undef ONEMKL_DECLARE_BUF_TPMV
|
|
438
|
-
|
|
439
|
-
#define ONEMKL_DECLARE_BUF_TPSV(T) \
|
|
440
|
-
DLL_EXPORT void tpsv(sycl::queue &queue, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
441
|
-
std::int64_t n, \
|
|
442
|
-
sycl::buffer<T, 1> &a, \
|
|
443
|
-
sycl::buffer<T, 1> &x, std::int64_t incx);
|
|
444
|
-
|
|
445
|
-
ONEMKL_DECLARE_BUF_TPSV(float)
|
|
446
|
-
ONEMKL_DECLARE_BUF_TPSV(double)
|
|
447
|
-
ONEMKL_DECLARE_BUF_TPSV(std::complex<float>)
|
|
448
|
-
ONEMKL_DECLARE_BUF_TPSV(std::complex<double>)
|
|
449
|
-
|
|
450
|
-
#undef ONEMKL_DECLARE_BUF_TPSV
|
|
451
|
-
|
|
452
|
-
#define ONEMKL_DECLARE_BUF_TRMV(T) \
|
|
453
|
-
DLL_EXPORT void trmv(sycl::queue &queue, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
454
|
-
std::int64_t n, \
|
|
455
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
456
|
-
sycl::buffer<T, 1> &x, std::int64_t incx);
|
|
457
|
-
|
|
458
|
-
ONEMKL_DECLARE_BUF_TRMV(float)
|
|
459
|
-
ONEMKL_DECLARE_BUF_TRMV(double)
|
|
460
|
-
ONEMKL_DECLARE_BUF_TRMV(std::complex<float>)
|
|
461
|
-
ONEMKL_DECLARE_BUF_TRMV(std::complex<double>)
|
|
462
|
-
|
|
463
|
-
#undef ONEMKL_DECLARE_BUF_TRMV
|
|
464
|
-
|
|
465
|
-
#define ONEMKL_DECLARE_BUF_TRSV(T) \
|
|
466
|
-
DLL_EXPORT void trsv(sycl::queue &queue, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
467
|
-
std::int64_t n, \
|
|
468
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
469
|
-
sycl::buffer<T, 1> &x, std::int64_t incx);
|
|
470
|
-
|
|
471
|
-
ONEMKL_DECLARE_BUF_TRSV(float)
|
|
472
|
-
ONEMKL_DECLARE_BUF_TRSV(double)
|
|
473
|
-
ONEMKL_DECLARE_BUF_TRSV(std::complex<float>)
|
|
474
|
-
ONEMKL_DECLARE_BUF_TRSV(std::complex<double>)
|
|
475
|
-
|
|
476
|
-
#undef ONEMKL_DECLARE_BUF_TRSV
|
|
477
|
-
|
|
478
|
-
// Level 1
|
|
479
|
-
|
|
480
|
-
#define ONEMKL_DECLARE_BUF_DOTC(T) \
|
|
481
|
-
DLL_EXPORT void dotc(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, \
|
|
482
|
-
std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
483
|
-
sycl::buffer<T, 1> &result);
|
|
484
|
-
|
|
485
|
-
ONEMKL_DECLARE_BUF_DOTC(std::complex<float>)
|
|
486
|
-
ONEMKL_DECLARE_BUF_DOTC(std::complex<double>)
|
|
487
|
-
|
|
488
|
-
#undef ONEMKL_DECLARE_BUF_DOTC
|
|
489
|
-
|
|
490
|
-
#define ONEMKL_DECLARE_BUF_DOTU(T) \
|
|
491
|
-
DLL_EXPORT void dotu(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, \
|
|
492
|
-
std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy, \
|
|
493
|
-
sycl::buffer<T, 1> &result);
|
|
494
|
-
|
|
495
|
-
ONEMKL_DECLARE_BUF_DOTU(std::complex<float>)
|
|
496
|
-
ONEMKL_DECLARE_BUF_DOTU(std::complex<double>)
|
|
497
|
-
|
|
498
|
-
#undef ONEMKL_DECLARE_BUF_DOTU
|
|
499
|
-
|
|
500
|
-
#define ONEMKL_DECLARE_BUF_IAMAX(Tf, Ti) \
|
|
501
|
-
DLL_EXPORT void iamax(sycl::queue &queue, std::int64_t n, sycl::buffer<Tf, 1> &x, std::int64_t incx, \
|
|
502
|
-
sycl::buffer<Ti, 1> &result, index_base base=index_base::zero);
|
|
503
|
-
|
|
504
|
-
ONEMKL_DECLARE_BUF_IAMAX(float, std::int64_t)
|
|
505
|
-
ONEMKL_DECLARE_BUF_IAMAX(float, std::int32_t)
|
|
506
|
-
ONEMKL_DECLARE_BUF_IAMAX(double, std::int64_t)
|
|
507
|
-
ONEMKL_DECLARE_BUF_IAMAX(double, std::int32_t)
|
|
508
|
-
ONEMKL_DECLARE_BUF_IAMAX(std::complex<float>, std::int64_t)
|
|
509
|
-
ONEMKL_DECLARE_BUF_IAMAX(std::complex<float>, std::int32_t)
|
|
510
|
-
ONEMKL_DECLARE_BUF_IAMAX(std::complex<double>, std::int64_t)
|
|
511
|
-
ONEMKL_DECLARE_BUF_IAMAX(std::complex<double>, std::int32_t)
|
|
512
|
-
|
|
513
|
-
#undef ONEMKL_DECLARE_BUF_IAMAX
|
|
514
|
-
|
|
515
|
-
#define ONEMKL_DECLARE_BUF_IAMIN(Tf, Ti) \
|
|
516
|
-
DLL_EXPORT void iamin(sycl::queue &queue, std::int64_t n, sycl::buffer<Tf, 1> &x, std::int64_t incx, \
|
|
517
|
-
sycl::buffer<Ti, 1> &result, index_base base=index_base::zero);
|
|
518
|
-
|
|
519
|
-
ONEMKL_DECLARE_BUF_IAMIN(float, std::int64_t)
|
|
520
|
-
ONEMKL_DECLARE_BUF_IAMIN(float, std::int32_t)
|
|
521
|
-
ONEMKL_DECLARE_BUF_IAMIN(double, std::int64_t)
|
|
522
|
-
ONEMKL_DECLARE_BUF_IAMIN(double, std::int32_t)
|
|
523
|
-
ONEMKL_DECLARE_BUF_IAMIN(std::complex<float>, std::int64_t)
|
|
524
|
-
ONEMKL_DECLARE_BUF_IAMIN(std::complex<float>, std::int32_t)
|
|
525
|
-
ONEMKL_DECLARE_BUF_IAMIN(std::complex<double>, std::int64_t)
|
|
526
|
-
ONEMKL_DECLARE_BUF_IAMIN(std::complex<double>, std::int32_t)
|
|
527
|
-
|
|
528
|
-
#undef ONEMKL_DECLARE_BUF_IAMIN
|
|
529
|
-
|
|
530
|
-
#define ONEMKL_DECLARE_BUF_ASUM(T, Tres) \
|
|
531
|
-
DLL_EXPORT void asum(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<Tres, 1> &result);
|
|
532
|
-
|
|
533
|
-
ONEMKL_DECLARE_BUF_ASUM(float, float)
|
|
534
|
-
ONEMKL_DECLARE_BUF_ASUM(double, double)
|
|
535
|
-
ONEMKL_DECLARE_BUF_ASUM(std::complex<float>, float)
|
|
536
|
-
ONEMKL_DECLARE_BUF_ASUM(std::complex<double>, double)
|
|
537
|
-
|
|
538
|
-
#undef ONEMKL_DECLARE_BUF_ASUM
|
|
539
|
-
|
|
540
|
-
#define ONEMKL_DECLARE_BUF_AXPY(T) \
|
|
541
|
-
DLL_EXPORT void axpy(sycl::queue &queue, std::int64_t n, T alpha, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
542
|
-
|
|
543
|
-
ONEMKL_DECLARE_BUF_AXPY(sycl::half)
|
|
544
|
-
ONEMKL_DECLARE_BUF_AXPY(bfloat16)
|
|
545
|
-
ONEMKL_DECLARE_BUF_AXPY(float)
|
|
546
|
-
ONEMKL_DECLARE_BUF_AXPY(double)
|
|
547
|
-
ONEMKL_DECLARE_BUF_AXPY(std::complex<float>)
|
|
548
|
-
ONEMKL_DECLARE_BUF_AXPY(std::complex<double>)
|
|
549
|
-
|
|
550
|
-
#undef ONEMKL_DECLARE_BUF_AXPY
|
|
551
|
-
|
|
552
|
-
#define ONEMKL_DECLARE_BUF_AXPBY(T) \
|
|
553
|
-
DLL_EXPORT void axpby(sycl::queue &queue, std::int64_t n, T alpha, sycl::buffer<T, 1> &x, std::int64_t incx, T beta, sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
554
|
-
|
|
555
|
-
ONEMKL_DECLARE_BUF_AXPBY(float)
|
|
556
|
-
ONEMKL_DECLARE_BUF_AXPBY(double)
|
|
557
|
-
ONEMKL_DECLARE_BUF_AXPBY(std::complex<float>)
|
|
558
|
-
ONEMKL_DECLARE_BUF_AXPBY(std::complex<double>)
|
|
559
|
-
|
|
560
|
-
#undef ONEMKL_DECLARE_BUF_AXPBY
|
|
561
|
-
|
|
562
|
-
#define ONEMKL_DECLARE_BUF_COPY(T) \
|
|
563
|
-
DLL_EXPORT void copy(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
564
|
-
|
|
565
|
-
ONEMKL_DECLARE_BUF_COPY(float)
|
|
566
|
-
ONEMKL_DECLARE_BUF_COPY(double)
|
|
567
|
-
ONEMKL_DECLARE_BUF_COPY(std::complex<float>)
|
|
568
|
-
ONEMKL_DECLARE_BUF_COPY(std::complex<double>)
|
|
569
|
-
|
|
570
|
-
#undef ONEMKL_DECLARE_BUF_COPY
|
|
571
|
-
|
|
572
|
-
#define ONEMKL_DECLARE_BUF_DOT(T, Tres) \
|
|
573
|
-
DLL_EXPORT void dot(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy, sycl::buffer<Tres, 1> &result);
|
|
574
|
-
|
|
575
|
-
ONEMKL_DECLARE_BUF_DOT(sycl::half, sycl::half)
|
|
576
|
-
ONEMKL_DECLARE_BUF_DOT(bfloat16, bfloat16)
|
|
577
|
-
ONEMKL_DECLARE_BUF_DOT(float, float)
|
|
578
|
-
ONEMKL_DECLARE_BUF_DOT(double, double)
|
|
579
|
-
ONEMKL_DECLARE_BUF_DOT(float, double)
|
|
580
|
-
|
|
581
|
-
#undef ONEMKL_DECLARE_BUF_DOT
|
|
582
|
-
|
|
583
|
-
#define ONEMKL_DECLARE_BUF_SDSDOT(T) \
|
|
584
|
-
DLL_EXPORT void sdsdot(sycl::queue &queue, std::int64_t n, T sb, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy, sycl::buffer<T, 1> &result);
|
|
585
|
-
|
|
586
|
-
ONEMKL_DECLARE_BUF_SDSDOT(float)
|
|
587
|
-
|
|
588
|
-
#undef ONEMKL_DECLARE_BUF_SDSDOT
|
|
589
|
-
|
|
590
|
-
#define ONEMKL_DECLARE_BUF_NRM2(T, Tres) \
|
|
591
|
-
DLL_EXPORT void nrm2(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<Tres, 1> &result);
|
|
592
|
-
|
|
593
|
-
ONEMKL_DECLARE_BUF_NRM2(sycl::half, sycl::half)
|
|
594
|
-
ONEMKL_DECLARE_BUF_NRM2(bfloat16, bfloat16)
|
|
595
|
-
ONEMKL_DECLARE_BUF_NRM2(float, float)
|
|
596
|
-
ONEMKL_DECLARE_BUF_NRM2(double, double)
|
|
597
|
-
ONEMKL_DECLARE_BUF_NRM2(std::complex<float>, float)
|
|
598
|
-
ONEMKL_DECLARE_BUF_NRM2(std::complex<double>, double)
|
|
599
|
-
|
|
600
|
-
#undef ONEMKL_DECLARE_BUF_NRM2
|
|
601
|
-
|
|
602
|
-
#define ONEMKL_DECLARE_BUF_ROT(T, Tc, Ts) \
|
|
603
|
-
DLL_EXPORT void rot(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy, Tc c, Ts s);
|
|
604
|
-
|
|
605
|
-
ONEMKL_DECLARE_BUF_ROT(sycl::half, sycl::half, sycl::half)
|
|
606
|
-
ONEMKL_DECLARE_BUF_ROT(bfloat16, bfloat16, bfloat16)
|
|
607
|
-
ONEMKL_DECLARE_BUF_ROT(float, float, float)
|
|
608
|
-
ONEMKL_DECLARE_BUF_ROT(double, double, double)
|
|
609
|
-
ONEMKL_DECLARE_BUF_ROT(std::complex<float>, float, float)
|
|
610
|
-
ONEMKL_DECLARE_BUF_ROT(std::complex<float>, float, std::complex<float>)
|
|
611
|
-
ONEMKL_DECLARE_BUF_ROT(std::complex<double>, double, double)
|
|
612
|
-
ONEMKL_DECLARE_BUF_ROT(std::complex<double>, double, std::complex<double>)
|
|
613
|
-
|
|
614
|
-
#undef ONEMKL_DECLARE_BUF_ROT
|
|
615
|
-
|
|
616
|
-
#define ONEMKL_DECLARE_BUF_ROTG(T, Tc) \
|
|
617
|
-
DLL_EXPORT void rotg(sycl::queue &queue, sycl::buffer<T, 1> &a, sycl::buffer<T, 1> &b, sycl::buffer<Tc, 1> &c, sycl::buffer<T, 1> &s);
|
|
618
|
-
|
|
619
|
-
ONEMKL_DECLARE_BUF_ROTG(float, float)
|
|
620
|
-
ONEMKL_DECLARE_BUF_ROTG(double, double)
|
|
621
|
-
ONEMKL_DECLARE_BUF_ROTG(std::complex<float>, float)
|
|
622
|
-
ONEMKL_DECLARE_BUF_ROTG(std::complex<double>, double)
|
|
623
|
-
|
|
624
|
-
#undef ONEMKL_DECLARE_BUF_ROTG
|
|
625
|
-
|
|
626
|
-
#define ONEMKL_DECLARE_BUF_ROTM(T) \
|
|
627
|
-
DLL_EXPORT void rotm(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy, sycl::buffer<T, 1> &param);
|
|
628
|
-
|
|
629
|
-
ONEMKL_DECLARE_BUF_ROTM(float)
|
|
630
|
-
ONEMKL_DECLARE_BUF_ROTM(double)
|
|
631
|
-
|
|
632
|
-
#undef ONEMKL_DECLARE_BUF_ROTM
|
|
633
|
-
|
|
634
|
-
#define ONEMKL_DECLARE_BUF_ROTMG(T) \
|
|
635
|
-
DLL_EXPORT void rotmg(sycl::queue &queue, sycl::buffer<T, 1> &d1, sycl::buffer<T, 1> &d2, sycl::buffer<T, 1> &x1, T y1, sycl::buffer<T, 1> &param);
|
|
636
|
-
|
|
637
|
-
ONEMKL_DECLARE_BUF_ROTMG(float)
|
|
638
|
-
ONEMKL_DECLARE_BUF_ROTMG(double)
|
|
639
|
-
|
|
640
|
-
#undef ONEMKL_DECLARE_BUF_ROTMG
|
|
641
|
-
|
|
642
|
-
#define ONEMKL_DECLARE_BUF_SCAL(T, Ts) \
|
|
643
|
-
DLL_EXPORT void scal(sycl::queue &queue, std::int64_t n, Ts alpha, sycl::buffer<T, 1> &x, std::int64_t incx);
|
|
644
|
-
|
|
645
|
-
ONEMKL_DECLARE_BUF_SCAL(sycl::half, sycl::half)
|
|
646
|
-
ONEMKL_DECLARE_BUF_SCAL(bfloat16, bfloat16)
|
|
647
|
-
ONEMKL_DECLARE_BUF_SCAL(float, float)
|
|
648
|
-
ONEMKL_DECLARE_BUF_SCAL(double, double)
|
|
649
|
-
ONEMKL_DECLARE_BUF_SCAL(std::complex<float>, std::complex<float>)
|
|
650
|
-
ONEMKL_DECLARE_BUF_SCAL(std::complex<double>, std::complex<double>)
|
|
651
|
-
ONEMKL_DECLARE_BUF_SCAL(std::complex<float>, float)
|
|
652
|
-
ONEMKL_DECLARE_BUF_SCAL(std::complex<double>, double)
|
|
653
|
-
|
|
654
|
-
#undef ONEMKL_DECLARE_BUF_SCAL
|
|
655
|
-
|
|
656
|
-
#define ONEMKL_DECLARE_BUF_SWAP(T) \
|
|
657
|
-
DLL_EXPORT void swap(sycl::queue &queue, std::int64_t n, sycl::buffer<T, 1> &x, std::int64_t incx, sycl::buffer<T, 1> &y, std::int64_t incy);
|
|
658
|
-
|
|
659
|
-
ONEMKL_DECLARE_BUF_SWAP(float)
|
|
660
|
-
ONEMKL_DECLARE_BUF_SWAP(double)
|
|
661
|
-
ONEMKL_DECLARE_BUF_SWAP(std::complex<float>)
|
|
662
|
-
ONEMKL_DECLARE_BUF_SWAP(std::complex<double>)
|
|
663
|
-
|
|
664
|
-
#undef ONEMKL_DECLARE_BUF_SWAP
|
|
665
|
-
|
|
666
|
-
// Batch API
|
|
667
|
-
|
|
668
|
-
#define ONEMKL_DECLARE_BUF_GEMM_BATCH(Ta, Tb, Tc, Ts) \
|
|
669
|
-
DLL_EXPORT void gemm_batch(sycl::queue &queue, transpose transa, transpose transb, \
|
|
670
|
-
std::int64_t m, std::int64_t n, std::int64_t k, \
|
|
671
|
-
Ts alpha, sycl::buffer<Ta, 1> &a, std::int64_t lda, std::int64_t stride_a, \
|
|
672
|
-
sycl::buffer<Tb, 1> &b, std::int64_t ldb, std::int64_t stride_b, \
|
|
673
|
-
Ts beta, sycl::buffer<Tc, 1> &c, std::int64_t ldc, std::int64_t stride_c, \
|
|
674
|
-
std::int64_t batch_size, compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
675
|
-
|
|
676
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(float, float, float, float)
|
|
677
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(double, double, double, double)
|
|
678
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(std::complex<float>, std::complex<float>, std::complex<float>, std::complex<float>)
|
|
679
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(std::complex<double>, std::complex<double>, std::complex<double>, std::complex<double>)
|
|
680
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(sycl::half, sycl::half, sycl::half, sycl::half)
|
|
681
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(sycl::half, sycl::half, float, float)
|
|
682
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(bfloat16, bfloat16, bfloat16, float)
|
|
683
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(bfloat16, bfloat16, float, float)
|
|
684
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(std::int8_t, std::int8_t, std::int32_t, float)
|
|
685
|
-
ONEMKL_DECLARE_BUF_GEMM_BATCH(std::int8_t, std::int8_t, float, float)
|
|
686
|
-
|
|
687
|
-
#undef ONEMKL_DECLARE_BUF_GEMM_BATCH
|
|
688
|
-
|
|
689
|
-
#define ONEMKL_DECLARE_BUF_SYRK_BATCH(T) \
|
|
690
|
-
DLL_EXPORT void syrk_batch(sycl::queue &queue, \
|
|
691
|
-
uplo upper_lower, transpose trans, int64_t n, int64_t k, \
|
|
692
|
-
T alpha, sycl::buffer<T,1> &a, int64_t lda, int64_t stride_a, \
|
|
693
|
-
T beta, sycl::buffer<T,1> &c, int64_t ldc, int64_t stride_c, \
|
|
694
|
-
int64_t batch_size, compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
695
|
-
|
|
696
|
-
ONEMKL_DECLARE_BUF_SYRK_BATCH(float)
|
|
697
|
-
ONEMKL_DECLARE_BUF_SYRK_BATCH(double)
|
|
698
|
-
ONEMKL_DECLARE_BUF_SYRK_BATCH(std::complex<float>)
|
|
699
|
-
ONEMKL_DECLARE_BUF_SYRK_BATCH(std::complex<double>)
|
|
700
|
-
|
|
701
|
-
#undef ONEMKL_DECLARE_BUF_SYRK_BATCH
|
|
702
|
-
|
|
703
|
-
#define ONEMKL_DECLARE_BUF_TRSM_BATCH(T) \
|
|
704
|
-
DLL_EXPORT void trsm_batch(sycl::queue &queue, side left_right, uplo upper_lower, transpose trans, diag unit_diag, \
|
|
705
|
-
std::int64_t m, std::int64_t n, \
|
|
706
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, std::int64_t stride_a, \
|
|
707
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, std::int64_t stride_b, \
|
|
708
|
-
std::int64_t batch_size, compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
709
|
-
|
|
710
|
-
ONEMKL_DECLARE_BUF_TRSM_BATCH(float)
|
|
711
|
-
ONEMKL_DECLARE_BUF_TRSM_BATCH(double)
|
|
712
|
-
ONEMKL_DECLARE_BUF_TRSM_BATCH(std::complex<float>)
|
|
713
|
-
ONEMKL_DECLARE_BUF_TRSM_BATCH(std::complex<double>)
|
|
714
|
-
|
|
715
|
-
#undef ONEMKL_DECLARE_BUF_TRSM_BATCH
|
|
716
|
-
|
|
717
|
-
#define ONEMKL_DECLARE_BUF_GEMV_BATCH(T) \
|
|
718
|
-
DLL_EXPORT void gemv_batch(sycl::queue &queue, transpose trans, \
|
|
719
|
-
std::int64_t m, std::int64_t n, T alpha, \
|
|
720
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, std::int64_t stridea, \
|
|
721
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, std::int64_t stridex, T beta, \
|
|
722
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size);
|
|
723
|
-
|
|
724
|
-
ONEMKL_DECLARE_BUF_GEMV_BATCH(float)
|
|
725
|
-
ONEMKL_DECLARE_BUF_GEMV_BATCH(double)
|
|
726
|
-
ONEMKL_DECLARE_BUF_GEMV_BATCH(std::complex<float>)
|
|
727
|
-
ONEMKL_DECLARE_BUF_GEMV_BATCH(std::complex<double>)
|
|
728
|
-
|
|
729
|
-
#undef ONEMKL_DECLARE_BUF_GEMV_BATCH
|
|
730
|
-
|
|
731
|
-
#define ONEMKL_DECLARE_BUF_DGMM_BATCH(T) \
|
|
732
|
-
DLL_EXPORT void dgmm_batch(sycl::queue &queue, side left_right, \
|
|
733
|
-
std::int64_t m, std::int64_t n, \
|
|
734
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, std::int64_t stridea, \
|
|
735
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, std::int64_t stridex, \
|
|
736
|
-
sycl::buffer<T, 1> &c, std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size);
|
|
737
|
-
|
|
738
|
-
ONEMKL_DECLARE_BUF_DGMM_BATCH(float)
|
|
739
|
-
ONEMKL_DECLARE_BUF_DGMM_BATCH(double)
|
|
740
|
-
ONEMKL_DECLARE_BUF_DGMM_BATCH(std::complex<float>)
|
|
741
|
-
ONEMKL_DECLARE_BUF_DGMM_BATCH(std::complex<double>)
|
|
742
|
-
|
|
743
|
-
#undef ONEMKL_DECLARE_BUF_DGMM_BATCH
|
|
744
|
-
|
|
745
|
-
#define ONEMKL_DECLARE_BUF_AXPY_BATCH(T) \
|
|
746
|
-
DLL_EXPORT void axpy_batch(sycl::queue &queue, std::int64_t n, T alpha, \
|
|
747
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, std::int64_t stridex, \
|
|
748
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size);
|
|
749
|
-
|
|
750
|
-
ONEMKL_DECLARE_BUF_AXPY_BATCH(float)
|
|
751
|
-
ONEMKL_DECLARE_BUF_AXPY_BATCH(double)
|
|
752
|
-
ONEMKL_DECLARE_BUF_AXPY_BATCH(std::complex<float>)
|
|
753
|
-
ONEMKL_DECLARE_BUF_AXPY_BATCH(std::complex<double>)
|
|
754
|
-
|
|
755
|
-
#undef ONEMKL_DECLARE_BUF_AXPY_BATCH
|
|
756
|
-
|
|
757
|
-
#define ONEMKL_DECLARE_BUF_COPY_BATCH(T) \
|
|
758
|
-
DLL_EXPORT void copy_batch(sycl::queue &queue, std::int64_t n, \
|
|
759
|
-
sycl::buffer<T, 1> &x, std::int64_t incx, std::int64_t stridex, \
|
|
760
|
-
sycl::buffer<T, 1> &y, std::int64_t incy, std::int64_t stridey, \
|
|
761
|
-
std::int64_t batch_size);
|
|
762
|
-
|
|
763
|
-
ONEMKL_DECLARE_BUF_COPY_BATCH(float)
|
|
764
|
-
ONEMKL_DECLARE_BUF_COPY_BATCH(double)
|
|
765
|
-
ONEMKL_DECLARE_BUF_COPY_BATCH(std::complex<float>)
|
|
766
|
-
ONEMKL_DECLARE_BUF_COPY_BATCH(std::complex<double>)
|
|
767
|
-
|
|
768
|
-
#undef ONEMKL_DECLARE_BUF_COPY_BATCH
|
|
769
|
-
|
|
770
|
-
// BLAS like
|
|
771
|
-
|
|
772
|
-
#define ONEMKL_DECLARE_BUF_GEMMT(T) \
|
|
773
|
-
DLL_EXPORT void gemmt(sycl::queue &queue, uplo upper_lower, transpose transa, transpose transb, \
|
|
774
|
-
std::int64_t n, std::int64_t k, T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
775
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
776
|
-
T beta, sycl::buffer<T, 1> &c, std::int64_t ldc, \
|
|
777
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
778
|
-
|
|
779
|
-
ONEMKL_DECLARE_BUF_GEMMT(float)
|
|
780
|
-
ONEMKL_DECLARE_BUF_GEMMT(double)
|
|
781
|
-
ONEMKL_DECLARE_BUF_GEMMT(std::complex<float>)
|
|
782
|
-
ONEMKL_DECLARE_BUF_GEMMT(std::complex<double>)
|
|
783
|
-
|
|
784
|
-
#undef ONEMKL_DECLARE_BUF_GEMMT
|
|
785
|
-
|
|
786
|
-
#define ONEMKL_DECLARE_BUF_GEMM_BIAS(Ta, Tb) \
|
|
787
|
-
DLL_EXPORT void gemm_bias(sycl::queue &queue, transpose transa, transpose transb, offset offsetc, \
|
|
788
|
-
std::int64_t m, std::int64_t n, std::int64_t k, float alpha, \
|
|
789
|
-
sycl::buffer<Ta, 1> &a, std::int64_t lda, Ta ao, \
|
|
790
|
-
sycl::buffer<Tb, 1> &b, std::int64_t ldb, Tb bo, \
|
|
791
|
-
float beta, sycl::buffer<std::int32_t, 1> &c, std::int64_t ldc, sycl::buffer<std::int32_t, 1> &co, \
|
|
792
|
-
compute_mode mode = MKL_BLAS_COMPUTE_MODE);
|
|
793
|
-
|
|
794
|
-
ONEMKL_DECLARE_BUF_GEMM_BIAS(std::int8_t, std::int8_t)
|
|
795
|
-
ONEMKL_DECLARE_BUF_GEMM_BIAS(std::int8_t, std::uint8_t)
|
|
796
|
-
ONEMKL_DECLARE_BUF_GEMM_BIAS(std::uint8_t, std::int8_t)
|
|
797
|
-
ONEMKL_DECLARE_BUF_GEMM_BIAS(std::uint8_t, std::uint8_t)
|
|
798
|
-
|
|
799
|
-
#undef ONEMKL_DECLARE_BUF_GEMM_BIAS
|
|
800
|
-
|
|
801
|
-
#define ONEMKL_DECLARE_BUF_IMATCOPY(T) \
|
|
802
|
-
DLL_EXPORT void imatcopy(sycl::queue &queue, transpose trans, \
|
|
803
|
-
std::int64_t m, std::int64_t n, \
|
|
804
|
-
T alpha, sycl::buffer<T, 1> &ab, \
|
|
805
|
-
std::int64_t lda, std::int64_t ldb);
|
|
806
|
-
|
|
807
|
-
ONEMKL_DECLARE_BUF_IMATCOPY(float)
|
|
808
|
-
ONEMKL_DECLARE_BUF_IMATCOPY(double)
|
|
809
|
-
ONEMKL_DECLARE_BUF_IMATCOPY(std::complex<float>)
|
|
810
|
-
ONEMKL_DECLARE_BUF_IMATCOPY(std::complex<double>)
|
|
811
|
-
|
|
812
|
-
#undef ONEMKL_DECLARE_BUF_IMATCOPY
|
|
813
|
-
|
|
814
|
-
#define ONEMKL_DECLARE_BUF_OMATCOPY(T) \
|
|
815
|
-
DLL_EXPORT void omatcopy(sycl::queue &queue, transpose trans, \
|
|
816
|
-
std::int64_t m, std::int64_t n, \
|
|
817
|
-
T alpha, sycl::buffer<T, 1> &a, \
|
|
818
|
-
std::int64_t lda, sycl::buffer<T, 1> &b, std::int64_t ldb);
|
|
819
|
-
|
|
820
|
-
ONEMKL_DECLARE_BUF_OMATCOPY(float)
|
|
821
|
-
ONEMKL_DECLARE_BUF_OMATCOPY(double)
|
|
822
|
-
ONEMKL_DECLARE_BUF_OMATCOPY(std::complex<float>)
|
|
823
|
-
ONEMKL_DECLARE_BUF_OMATCOPY(std::complex<double>)
|
|
824
|
-
|
|
825
|
-
#undef ONEMKL_DECLARE_BUF_OMATCOPY
|
|
826
|
-
|
|
827
|
-
#define ONEMKL_DECLARE_BUF_OMATADD(T) \
|
|
828
|
-
DLL_EXPORT void omatadd(sycl::queue &queue, transpose transa, transpose transb, \
|
|
829
|
-
std::int64_t m, std::int64_t n, \
|
|
830
|
-
T alpha, sycl::buffer<T, 1> &a, std::int64_t lda, \
|
|
831
|
-
T beta, sycl::buffer<T, 1> &b, std::int64_t ldb, \
|
|
832
|
-
sycl::buffer<T, 1> &c, std::int64_t ldc);
|
|
833
|
-
|
|
834
|
-
ONEMKL_DECLARE_BUF_OMATADD(float)
|
|
835
|
-
ONEMKL_DECLARE_BUF_OMATADD(double)
|
|
836
|
-
ONEMKL_DECLARE_BUF_OMATADD(std::complex<float>)
|
|
837
|
-
ONEMKL_DECLARE_BUF_OMATADD(std::complex<double>)
|
|
838
|
-
|
|
839
|
-
#undef ONEMKL_DECLARE_BUF_OMATADD
|
|
840
|
-
|
|
841
|
-
#define ONEMKL_DECLARE_BUF_IMATCOPY_BATCH(T) \
|
|
842
|
-
DLL_EXPORT void imatcopy_batch(sycl::queue &queue, transpose trans, \
|
|
843
|
-
std::int64_t m, std::int64_t n, T alpha, sycl::buffer<T, 1> &ab, std::int64_t lda, \
|
|
844
|
-
std::int64_t ldb, std::int64_t stride, std::int64_t batch_size);
|
|
845
|
-
|
|
846
|
-
ONEMKL_DECLARE_BUF_IMATCOPY_BATCH(float)
|
|
847
|
-
ONEMKL_DECLARE_BUF_IMATCOPY_BATCH(double)
|
|
848
|
-
ONEMKL_DECLARE_BUF_IMATCOPY_BATCH(std::complex<float>)
|
|
849
|
-
ONEMKL_DECLARE_BUF_IMATCOPY_BATCH(std::complex<double>)
|
|
850
|
-
|
|
851
|
-
#undef ONEMKL_DECLARE_BUF_IMATCOPY_BATCH
|
|
852
|
-
|
|
853
|
-
#define ONEMKL_DECLARE_BUF_OMATCOPY_BATCH(T) \
|
|
854
|
-
DLL_EXPORT void omatcopy_batch(sycl::queue &queue, transpose trans, \
|
|
855
|
-
std::int64_t m, std::int64_t n, T alpha, \
|
|
856
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, std::int64_t stride_a, \
|
|
857
|
-
sycl::buffer<T, 1> &b, std::int64_t ldb, std::int64_t stride_b, \
|
|
858
|
-
std::int64_t batch_size);
|
|
859
|
-
|
|
860
|
-
ONEMKL_DECLARE_BUF_OMATCOPY_BATCH(float)
|
|
861
|
-
ONEMKL_DECLARE_BUF_OMATCOPY_BATCH(double)
|
|
862
|
-
ONEMKL_DECLARE_BUF_OMATCOPY_BATCH(std::complex<float>)
|
|
863
|
-
ONEMKL_DECLARE_BUF_OMATCOPY_BATCH(std::complex<double>)
|
|
864
|
-
|
|
865
|
-
#undef ONEMKL_DECLARE_BUF_OMATCOPY_BATCH
|
|
866
|
-
|
|
867
|
-
#define ONEMKL_DECLARE_BUF_OMATADD_BATCH(T) \
|
|
868
|
-
DLL_EXPORT void omatadd_batch(sycl::queue &queue, transpose transa, transpose transb, \
|
|
869
|
-
std::int64_t m, std::int64_t n, T alpha, \
|
|
870
|
-
sycl::buffer<T, 1> &a, std::int64_t lda, std::int64_t stride_a, \
|
|
871
|
-
T beta, sycl::buffer<T, 1> &b, std::int64_t ldb, std::int64_t stride_b, \
|
|
872
|
-
sycl::buffer<T, 1> &c, std::int64_t ldc, std::int64_t stride_c, \
|
|
873
|
-
std::int64_t batch_size);
|
|
874
|
-
|
|
875
|
-
ONEMKL_DECLARE_BUF_OMATADD_BATCH(float)
|
|
876
|
-
ONEMKL_DECLARE_BUF_OMATADD_BATCH(double)
|
|
877
|
-
ONEMKL_DECLARE_BUF_OMATADD_BATCH(std::complex<float>)
|
|
878
|
-
ONEMKL_DECLARE_BUF_OMATADD_BATCH(std::complex<double>)
|
|
879
|
-
|
|
880
|
-
#undef ONEMKL_DECLARE_BUF_OMATADD_BATCH
|