@smake/eigen 1.0.2 → 1.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (435)
  1. package/README.md +1 -1
  2. package/eigen/Eigen/AccelerateSupport +52 -0
  3. package/eigen/Eigen/Cholesky +18 -21
  4. package/eigen/Eigen/CholmodSupport +28 -28
  5. package/eigen/Eigen/Core +235 -326
  6. package/eigen/Eigen/Eigenvalues +16 -14
  7. package/eigen/Eigen/Geometry +21 -24
  8. package/eigen/Eigen/Householder +9 -8
  9. package/eigen/Eigen/IterativeLinearSolvers +8 -4
  10. package/eigen/Eigen/Jacobi +14 -14
  11. package/eigen/Eigen/KLUSupport +43 -0
  12. package/eigen/Eigen/LU +16 -20
  13. package/eigen/Eigen/MetisSupport +12 -12
  14. package/eigen/Eigen/OrderingMethods +54 -54
  15. package/eigen/Eigen/PaStiXSupport +23 -20
  16. package/eigen/Eigen/PardisoSupport +17 -14
  17. package/eigen/Eigen/QR +18 -21
  18. package/eigen/Eigen/QtAlignedMalloc +5 -13
  19. package/eigen/Eigen/SPQRSupport +21 -14
  20. package/eigen/Eigen/SVD +23 -18
  21. package/eigen/Eigen/Sparse +1 -4
  22. package/eigen/Eigen/SparseCholesky +18 -23
  23. package/eigen/Eigen/SparseCore +18 -17
  24. package/eigen/Eigen/SparseLU +12 -8
  25. package/eigen/Eigen/SparseQR +16 -14
  26. package/eigen/Eigen/StdDeque +5 -2
  27. package/eigen/Eigen/StdList +5 -2
  28. package/eigen/Eigen/StdVector +5 -2
  29. package/eigen/Eigen/SuperLUSupport +30 -24
  30. package/eigen/Eigen/ThreadPool +80 -0
  31. package/eigen/Eigen/UmfPackSupport +19 -17
  32. package/eigen/Eigen/Version +14 -0
  33. package/eigen/Eigen/src/AccelerateSupport/AccelerateSupport.h +423 -0
  34. package/eigen/Eigen/src/AccelerateSupport/InternalHeaderCheck.h +3 -0
  35. package/eigen/Eigen/src/Cholesky/InternalHeaderCheck.h +3 -0
  36. package/eigen/Eigen/src/Cholesky/LDLT.h +377 -401
  37. package/eigen/Eigen/src/Cholesky/LLT.h +332 -360
  38. package/eigen/Eigen/src/Cholesky/LLT_LAPACKE.h +81 -56
  39. package/eigen/Eigen/src/CholmodSupport/CholmodSupport.h +620 -521
  40. package/eigen/Eigen/src/CholmodSupport/InternalHeaderCheck.h +3 -0
  41. package/eigen/Eigen/src/Core/ArithmeticSequence.h +239 -0
  42. package/eigen/Eigen/src/Core/Array.h +341 -294
  43. package/eigen/Eigen/src/Core/ArrayBase.h +190 -203
  44. package/eigen/Eigen/src/Core/ArrayWrapper.h +127 -171
  45. package/eigen/Eigen/src/Core/Assign.h +30 -40
  46. package/eigen/Eigen/src/Core/AssignEvaluator.h +711 -589
  47. package/eigen/Eigen/src/Core/Assign_MKL.h +130 -125
  48. package/eigen/Eigen/src/Core/BandMatrix.h +268 -283
  49. package/eigen/Eigen/src/Core/Block.h +375 -398
  50. package/eigen/Eigen/src/Core/CommaInitializer.h +86 -97
  51. package/eigen/Eigen/src/Core/ConditionEstimator.h +51 -53
  52. package/eigen/Eigen/src/Core/CoreEvaluators.h +1356 -1026
  53. package/eigen/Eigen/src/Core/CoreIterators.h +73 -59
  54. package/eigen/Eigen/src/Core/CwiseBinaryOp.h +114 -132
  55. package/eigen/Eigen/src/Core/CwiseNullaryOp.h +726 -617
  56. package/eigen/Eigen/src/Core/CwiseTernaryOp.h +77 -103
  57. package/eigen/Eigen/src/Core/CwiseUnaryOp.h +56 -68
  58. package/eigen/Eigen/src/Core/CwiseUnaryView.h +132 -95
  59. package/eigen/Eigen/src/Core/DenseBase.h +632 -571
  60. package/eigen/Eigen/src/Core/DenseCoeffsBase.h +511 -624
  61. package/eigen/Eigen/src/Core/DenseStorage.h +512 -509
  62. package/eigen/Eigen/src/Core/DeviceWrapper.h +153 -0
  63. package/eigen/Eigen/src/Core/Diagonal.h +169 -210
  64. package/eigen/Eigen/src/Core/DiagonalMatrix.h +351 -274
  65. package/eigen/Eigen/src/Core/DiagonalProduct.h +12 -10
  66. package/eigen/Eigen/src/Core/Dot.h +172 -222
  67. package/eigen/Eigen/src/Core/EigenBase.h +75 -85
  68. package/eigen/Eigen/src/Core/Fill.h +138 -0
  69. package/eigen/Eigen/src/Core/FindCoeff.h +464 -0
  70. package/eigen/Eigen/src/Core/ForceAlignedAccess.h +90 -109
  71. package/eigen/Eigen/src/Core/Fuzzy.h +82 -105
  72. package/eigen/Eigen/src/Core/GeneralProduct.h +327 -263
  73. package/eigen/Eigen/src/Core/GenericPacketMath.h +1472 -360
  74. package/eigen/Eigen/src/Core/GlobalFunctions.h +194 -151
  75. package/eigen/Eigen/src/Core/IO.h +147 -139
  76. package/eigen/Eigen/src/Core/IndexedView.h +321 -0
  77. package/eigen/Eigen/src/Core/InnerProduct.h +260 -0
  78. package/eigen/Eigen/src/Core/InternalHeaderCheck.h +3 -0
  79. package/eigen/Eigen/src/Core/Inverse.h +56 -66
  80. package/eigen/Eigen/src/Core/Map.h +124 -142
  81. package/eigen/Eigen/src/Core/MapBase.h +256 -281
  82. package/eigen/Eigen/src/Core/MathFunctions.h +1620 -938
  83. package/eigen/Eigen/src/Core/MathFunctionsImpl.h +233 -71
  84. package/eigen/Eigen/src/Core/Matrix.h +491 -416
  85. package/eigen/Eigen/src/Core/MatrixBase.h +468 -453
  86. package/eigen/Eigen/src/Core/NestByValue.h +66 -85
  87. package/eigen/Eigen/src/Core/NoAlias.h +79 -85
  88. package/eigen/Eigen/src/Core/NumTraits.h +235 -148
  89. package/eigen/Eigen/src/Core/PartialReduxEvaluator.h +253 -0
  90. package/eigen/Eigen/src/Core/PermutationMatrix.h +461 -511
  91. package/eigen/Eigen/src/Core/PlainObjectBase.h +871 -894
  92. package/eigen/Eigen/src/Core/Product.h +260 -139
  93. package/eigen/Eigen/src/Core/ProductEvaluators.h +863 -714
  94. package/eigen/Eigen/src/Core/Random.h +161 -136
  95. package/eigen/Eigen/src/Core/RandomImpl.h +262 -0
  96. package/eigen/Eigen/src/Core/RealView.h +250 -0
  97. package/eigen/Eigen/src/Core/Redux.h +366 -336
  98. package/eigen/Eigen/src/Core/Ref.h +308 -209
  99. package/eigen/Eigen/src/Core/Replicate.h +94 -106
  100. package/eigen/Eigen/src/Core/Reshaped.h +398 -0
  101. package/eigen/Eigen/src/Core/ReturnByValue.h +49 -55
  102. package/eigen/Eigen/src/Core/Reverse.h +136 -145
  103. package/eigen/Eigen/src/Core/Select.h +70 -140
  104. package/eigen/Eigen/src/Core/SelfAdjointView.h +262 -285
  105. package/eigen/Eigen/src/Core/SelfCwiseBinaryOp.h +23 -20
  106. package/eigen/Eigen/src/Core/SkewSymmetricMatrix3.h +382 -0
  107. package/eigen/Eigen/src/Core/Solve.h +97 -111
  108. package/eigen/Eigen/src/Core/SolveTriangular.h +131 -129
  109. package/eigen/Eigen/src/Core/SolverBase.h +138 -101
  110. package/eigen/Eigen/src/Core/StableNorm.h +156 -160
  111. package/eigen/Eigen/src/Core/StlIterators.h +619 -0
  112. package/eigen/Eigen/src/Core/Stride.h +91 -88
  113. package/eigen/Eigen/src/Core/Swap.h +70 -38
  114. package/eigen/Eigen/src/Core/Transpose.h +295 -273
  115. package/eigen/Eigen/src/Core/Transpositions.h +272 -317
  116. package/eigen/Eigen/src/Core/TriangularMatrix.h +670 -755
  117. package/eigen/Eigen/src/Core/VectorBlock.h +59 -72
  118. package/eigen/Eigen/src/Core/VectorwiseOp.h +668 -630
  119. package/eigen/Eigen/src/Core/Visitor.h +480 -216
  120. package/eigen/Eigen/src/Core/arch/AVX/Complex.h +407 -293
  121. package/eigen/Eigen/src/Core/arch/AVX/MathFunctions.h +79 -388
  122. package/eigen/Eigen/src/Core/arch/AVX/PacketMath.h +2935 -491
  123. package/eigen/Eigen/src/Core/arch/AVX/Reductions.h +353 -0
  124. package/eigen/Eigen/src/Core/arch/AVX/TypeCasting.h +279 -22
  125. package/eigen/Eigen/src/Core/arch/AVX512/Complex.h +472 -0
  126. package/eigen/Eigen/src/Core/arch/AVX512/GemmKernel.h +1245 -0
  127. package/eigen/Eigen/src/Core/arch/AVX512/MathFunctions.h +85 -333
  128. package/eigen/Eigen/src/Core/arch/AVX512/MathFunctionsFP16.h +75 -0
  129. package/eigen/Eigen/src/Core/arch/AVX512/PacketMath.h +2490 -649
  130. package/eigen/Eigen/src/Core/arch/AVX512/PacketMathFP16.h +1413 -0
  131. package/eigen/Eigen/src/Core/arch/AVX512/Reductions.h +297 -0
  132. package/eigen/Eigen/src/Core/arch/AVX512/TrsmKernel.h +1167 -0
  133. package/eigen/Eigen/src/Core/arch/AVX512/TrsmUnrolls.inc +1219 -0
  134. package/eigen/Eigen/src/Core/arch/AVX512/TypeCasting.h +277 -0
  135. package/eigen/Eigen/src/Core/arch/AVX512/TypeCastingFP16.h +130 -0
  136. package/eigen/Eigen/src/Core/arch/AltiVec/Complex.h +521 -298
  137. package/eigen/Eigen/src/Core/arch/AltiVec/MathFunctions.h +39 -280
  138. package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProduct.h +3686 -0
  139. package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductCommon.h +205 -0
  140. package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMA.h +901 -0
  141. package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMAbfloat16.h +742 -0
  142. package/eigen/Eigen/src/Core/arch/AltiVec/MatrixVectorProduct.inc +2818 -0
  143. package/eigen/Eigen/src/Core/arch/AltiVec/PacketMath.h +3391 -723
  144. package/eigen/Eigen/src/Core/arch/AltiVec/TypeCasting.h +153 -0
  145. package/eigen/Eigen/src/Core/arch/Default/BFloat16.h +866 -0
  146. package/eigen/Eigen/src/Core/arch/Default/ConjHelper.h +113 -14
  147. package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctions.h +2634 -0
  148. package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctionsFwd.h +227 -0
  149. package/eigen/Eigen/src/Core/arch/Default/Half.h +1091 -0
  150. package/eigen/Eigen/src/Core/arch/Default/Settings.h +11 -13
  151. package/eigen/Eigen/src/Core/arch/GPU/Complex.h +244 -0
  152. package/eigen/Eigen/src/Core/arch/GPU/MathFunctions.h +104 -0
  153. package/eigen/Eigen/src/Core/arch/GPU/PacketMath.h +1712 -0
  154. package/eigen/Eigen/src/Core/arch/GPU/Tuple.h +268 -0
  155. package/eigen/Eigen/src/Core/arch/GPU/TypeCasting.h +77 -0
  156. package/eigen/Eigen/src/Core/arch/HIP/hcc/math_constants.h +23 -0
  157. package/eigen/Eigen/src/Core/arch/HVX/PacketMath.h +1088 -0
  158. package/eigen/Eigen/src/Core/arch/LSX/Complex.h +520 -0
  159. package/eigen/Eigen/src/Core/arch/LSX/GeneralBlockPanelKernel.h +23 -0
  160. package/eigen/Eigen/src/Core/arch/LSX/MathFunctions.h +43 -0
  161. package/eigen/Eigen/src/Core/arch/LSX/PacketMath.h +2866 -0
  162. package/eigen/Eigen/src/Core/arch/LSX/TypeCasting.h +526 -0
  163. package/eigen/Eigen/src/Core/arch/MSA/Complex.h +620 -0
  164. package/eigen/Eigen/src/Core/arch/MSA/MathFunctions.h +379 -0
  165. package/eigen/Eigen/src/Core/arch/MSA/PacketMath.h +1237 -0
  166. package/eigen/Eigen/src/Core/arch/NEON/Complex.h +531 -289
  167. package/eigen/Eigen/src/Core/arch/NEON/GeneralBlockPanelKernel.h +243 -0
  168. package/eigen/Eigen/src/Core/arch/NEON/MathFunctions.h +50 -73
  169. package/eigen/Eigen/src/Core/arch/NEON/PacketMath.h +5915 -579
  170. package/eigen/Eigen/src/Core/arch/NEON/TypeCasting.h +1642 -0
  171. package/eigen/Eigen/src/Core/arch/NEON/UnaryFunctors.h +57 -0
  172. package/eigen/Eigen/src/Core/arch/SSE/Complex.h +366 -334
  173. package/eigen/Eigen/src/Core/arch/SSE/MathFunctions.h +40 -514
  174. package/eigen/Eigen/src/Core/arch/SSE/PacketMath.h +2164 -675
  175. package/eigen/Eigen/src/Core/arch/SSE/Reductions.h +324 -0
  176. package/eigen/Eigen/src/Core/arch/SSE/TypeCasting.h +188 -35
  177. package/eigen/Eigen/src/Core/arch/SVE/MathFunctions.h +48 -0
  178. package/eigen/Eigen/src/Core/arch/SVE/PacketMath.h +674 -0
  179. package/eigen/Eigen/src/Core/arch/SVE/TypeCasting.h +52 -0
  180. package/eigen/Eigen/src/Core/arch/SYCL/InteropHeaders.h +227 -0
  181. package/eigen/Eigen/src/Core/arch/SYCL/MathFunctions.h +303 -0
  182. package/eigen/Eigen/src/Core/arch/SYCL/PacketMath.h +576 -0
  183. package/eigen/Eigen/src/Core/arch/SYCL/TypeCasting.h +83 -0
  184. package/eigen/Eigen/src/Core/arch/ZVector/Complex.h +434 -261
  185. package/eigen/Eigen/src/Core/arch/ZVector/MathFunctions.h +160 -53
  186. package/eigen/Eigen/src/Core/arch/ZVector/PacketMath.h +1073 -605
  187. package/eigen/Eigen/src/Core/functors/AssignmentFunctors.h +123 -117
  188. package/eigen/Eigen/src/Core/functors/BinaryFunctors.h +594 -322
  189. package/eigen/Eigen/src/Core/functors/NullaryFunctors.h +204 -118
  190. package/eigen/Eigen/src/Core/functors/StlFunctors.h +110 -97
  191. package/eigen/Eigen/src/Core/functors/TernaryFunctors.h +34 -7
  192. package/eigen/Eigen/src/Core/functors/UnaryFunctors.h +1158 -530
  193. package/eigen/Eigen/src/Core/products/GeneralBlockPanelKernel.h +2329 -1333
  194. package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix.h +328 -364
  195. package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular.h +191 -178
  196. package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular_BLAS.h +85 -82
  197. package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix_BLAS.h +154 -73
  198. package/eigen/Eigen/src/Core/products/GeneralMatrixVector.h +396 -542
  199. package/eigen/Eigen/src/Core/products/GeneralMatrixVector_BLAS.h +80 -77
  200. package/eigen/Eigen/src/Core/products/Parallelizer.h +208 -92
  201. package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix.h +331 -375
  202. package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix_BLAS.h +206 -224
  203. package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector.h +139 -146
  204. package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector_BLAS.h +58 -61
  205. package/eigen/Eigen/src/Core/products/SelfadjointProduct.h +71 -71
  206. package/eigen/Eigen/src/Core/products/SelfadjointRank2Update.h +48 -46
  207. package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix.h +294 -369
  208. package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix_BLAS.h +246 -238
  209. package/eigen/Eigen/src/Core/products/TriangularMatrixVector.h +244 -247
  210. package/eigen/Eigen/src/Core/products/TriangularMatrixVector_BLAS.h +212 -192
  211. package/eigen/Eigen/src/Core/products/TriangularSolverMatrix.h +328 -275
  212. package/eigen/Eigen/src/Core/products/TriangularSolverMatrix_BLAS.h +108 -109
  213. package/eigen/Eigen/src/Core/products/TriangularSolverVector.h +70 -93
  214. package/eigen/Eigen/src/Core/util/Assert.h +158 -0
  215. package/eigen/Eigen/src/Core/util/BlasUtil.h +413 -290
  216. package/eigen/Eigen/src/Core/util/ConfigureVectorization.h +543 -0
  217. package/eigen/Eigen/src/Core/util/Constants.h +314 -263
  218. package/eigen/Eigen/src/Core/util/DisableStupidWarnings.h +130 -78
  219. package/eigen/Eigen/src/Core/util/EmulateArray.h +270 -0
  220. package/eigen/Eigen/src/Core/util/ForwardDeclarations.h +450 -224
  221. package/eigen/Eigen/src/Core/util/GpuHipCudaDefines.inc +101 -0
  222. package/eigen/Eigen/src/Core/util/GpuHipCudaUndefines.inc +45 -0
  223. package/eigen/Eigen/src/Core/util/IndexedViewHelper.h +487 -0
  224. package/eigen/Eigen/src/Core/util/IntegralConstant.h +279 -0
  225. package/eigen/Eigen/src/Core/util/MKL_support.h +39 -30
  226. package/eigen/Eigen/src/Core/util/Macros.h +939 -646
  227. package/eigen/Eigen/src/Core/util/MaxSizeVector.h +139 -0
  228. package/eigen/Eigen/src/Core/util/Memory.h +1042 -650
  229. package/eigen/Eigen/src/Core/util/Meta.h +618 -426
  230. package/eigen/Eigen/src/Core/util/MoreMeta.h +638 -0
  231. package/eigen/Eigen/src/Core/util/ReenableStupidWarnings.h +32 -19
  232. package/eigen/Eigen/src/Core/util/ReshapedHelper.h +51 -0
  233. package/eigen/Eigen/src/Core/util/Serializer.h +209 -0
  234. package/eigen/Eigen/src/Core/util/StaticAssert.h +51 -164
  235. package/eigen/Eigen/src/Core/util/SymbolicIndex.h +445 -0
  236. package/eigen/Eigen/src/Core/util/XprHelper.h +793 -538
  237. package/eigen/Eigen/src/Eigenvalues/ComplexEigenSolver.h +246 -277
  238. package/eigen/Eigen/src/Eigenvalues/ComplexSchur.h +299 -319
  239. package/eigen/Eigen/src/Eigenvalues/ComplexSchur_LAPACKE.h +52 -48
  240. package/eigen/Eigen/src/Eigenvalues/EigenSolver.h +413 -456
  241. package/eigen/Eigen/src/Eigenvalues/GeneralizedEigenSolver.h +309 -325
  242. package/eigen/Eigen/src/Eigenvalues/GeneralizedSelfAdjointEigenSolver.h +157 -171
  243. package/eigen/Eigen/src/Eigenvalues/HessenbergDecomposition.h +292 -310
  244. package/eigen/Eigen/src/Eigenvalues/InternalHeaderCheck.h +3 -0
  245. package/eigen/Eigen/src/Eigenvalues/MatrixBaseEigenvalues.h +91 -107
  246. package/eigen/Eigen/src/Eigenvalues/RealQZ.h +539 -606
  247. package/eigen/Eigen/src/Eigenvalues/RealSchur.h +348 -382
  248. package/eigen/Eigen/src/Eigenvalues/RealSchur_LAPACKE.h +41 -35
  249. package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h +579 -600
  250. package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver_LAPACKE.h +47 -44
  251. package/eigen/Eigen/src/Eigenvalues/Tridiagonalization.h +434 -461
  252. package/eigen/Eigen/src/Geometry/AlignedBox.h +307 -214
  253. package/eigen/Eigen/src/Geometry/AngleAxis.h +135 -137
  254. package/eigen/Eigen/src/Geometry/EulerAngles.h +163 -74
  255. package/eigen/Eigen/src/Geometry/Homogeneous.h +289 -333
  256. package/eigen/Eigen/src/Geometry/Hyperplane.h +152 -161
  257. package/eigen/Eigen/src/Geometry/InternalHeaderCheck.h +3 -0
  258. package/eigen/Eigen/src/Geometry/OrthoMethods.h +168 -145
  259. package/eigen/Eigen/src/Geometry/ParametrizedLine.h +141 -104
  260. package/eigen/Eigen/src/Geometry/Quaternion.h +595 -497
  261. package/eigen/Eigen/src/Geometry/Rotation2D.h +110 -108
  262. package/eigen/Eigen/src/Geometry/RotationBase.h +148 -145
  263. package/eigen/Eigen/src/Geometry/Scaling.h +115 -90
  264. package/eigen/Eigen/src/Geometry/Transform.h +896 -953
  265. package/eigen/Eigen/src/Geometry/Translation.h +100 -98
  266. package/eigen/Eigen/src/Geometry/Umeyama.h +79 -84
  267. package/eigen/Eigen/src/Geometry/arch/Geometry_SIMD.h +154 -0
  268. package/eigen/Eigen/src/Householder/BlockHouseholder.h +54 -42
  269. package/eigen/Eigen/src/Householder/Householder.h +104 -122
  270. package/eigen/Eigen/src/Householder/HouseholderSequence.h +416 -382
  271. package/eigen/Eigen/src/Householder/InternalHeaderCheck.h +3 -0
  272. package/eigen/Eigen/src/IterativeLinearSolvers/BasicPreconditioners.h +153 -166
  273. package/eigen/Eigen/src/IterativeLinearSolvers/BiCGSTAB.h +127 -138
  274. package/eigen/Eigen/src/IterativeLinearSolvers/ConjugateGradient.h +95 -124
  275. package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteCholesky.h +269 -267
  276. package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteLUT.h +246 -259
  277. package/eigen/Eigen/src/IterativeLinearSolvers/InternalHeaderCheck.h +3 -0
  278. package/eigen/Eigen/src/IterativeLinearSolvers/IterativeSolverBase.h +218 -217
  279. package/eigen/Eigen/src/IterativeLinearSolvers/LeastSquareConjugateGradient.h +80 -103
  280. package/eigen/Eigen/src/IterativeLinearSolvers/SolveWithGuess.h +59 -63
  281. package/eigen/Eigen/src/Jacobi/InternalHeaderCheck.h +3 -0
  282. package/eigen/Eigen/src/Jacobi/Jacobi.h +256 -291
  283. package/eigen/Eigen/src/KLUSupport/InternalHeaderCheck.h +3 -0
  284. package/eigen/Eigen/src/KLUSupport/KLUSupport.h +339 -0
  285. package/eigen/Eigen/src/LU/Determinant.h +60 -63
  286. package/eigen/Eigen/src/LU/FullPivLU.h +561 -626
  287. package/eigen/Eigen/src/LU/InternalHeaderCheck.h +3 -0
  288. package/eigen/Eigen/src/LU/InverseImpl.h +213 -275
  289. package/eigen/Eigen/src/LU/PartialPivLU.h +407 -435
  290. package/eigen/Eigen/src/LU/PartialPivLU_LAPACKE.h +54 -40
  291. package/eigen/Eigen/src/LU/arch/InverseSize4.h +353 -0
  292. package/eigen/Eigen/src/MetisSupport/InternalHeaderCheck.h +3 -0
  293. package/eigen/Eigen/src/MetisSupport/MetisSupport.h +81 -93
  294. package/eigen/Eigen/src/OrderingMethods/Amd.h +250 -282
  295. package/eigen/Eigen/src/OrderingMethods/Eigen_Colamd.h +950 -1103
  296. package/eigen/Eigen/src/OrderingMethods/InternalHeaderCheck.h +3 -0
  297. package/eigen/Eigen/src/OrderingMethods/Ordering.h +111 -122
  298. package/eigen/Eigen/src/PaStiXSupport/InternalHeaderCheck.h +3 -0
  299. package/eigen/Eigen/src/PaStiXSupport/PaStiXSupport.h +524 -570
  300. package/eigen/Eigen/src/PardisoSupport/InternalHeaderCheck.h +3 -0
  301. package/eigen/Eigen/src/PardisoSupport/PardisoSupport.h +385 -429
  302. package/eigen/Eigen/src/QR/ColPivHouseholderQR.h +494 -473
  303. package/eigen/Eigen/src/QR/ColPivHouseholderQR_LAPACKE.h +120 -56
  304. package/eigen/Eigen/src/QR/CompleteOrthogonalDecomposition.h +223 -137
  305. package/eigen/Eigen/src/QR/FullPivHouseholderQR.h +517 -460
  306. package/eigen/Eigen/src/QR/HouseholderQR.h +412 -278
  307. package/eigen/Eigen/src/QR/HouseholderQR_LAPACKE.h +32 -23
  308. package/eigen/Eigen/src/QR/InternalHeaderCheck.h +3 -0
  309. package/eigen/Eigen/src/SPQRSupport/InternalHeaderCheck.h +3 -0
  310. package/eigen/Eigen/src/SPQRSupport/SuiteSparseQRSupport.h +263 -261
  311. package/eigen/Eigen/src/SVD/BDCSVD.h +872 -679
  312. package/eigen/Eigen/src/SVD/BDCSVD_LAPACKE.h +174 -0
  313. package/eigen/Eigen/src/SVD/InternalHeaderCheck.h +3 -0
  314. package/eigen/Eigen/src/SVD/JacobiSVD.h +585 -543
  315. package/eigen/Eigen/src/SVD/JacobiSVD_LAPACKE.h +85 -49
  316. package/eigen/Eigen/src/SVD/SVDBase.h +281 -160
  317. package/eigen/Eigen/src/SVD/UpperBidiagonalization.h +202 -237
  318. package/eigen/Eigen/src/SparseCholesky/InternalHeaderCheck.h +3 -0
  319. package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky.h +769 -590
  320. package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky_impl.h +318 -129
  321. package/eigen/Eigen/src/SparseCore/AmbiVector.h +202 -251
  322. package/eigen/Eigen/src/SparseCore/CompressedStorage.h +184 -236
  323. package/eigen/Eigen/src/SparseCore/ConservativeSparseSparseProduct.h +140 -184
  324. package/eigen/Eigen/src/SparseCore/InternalHeaderCheck.h +3 -0
  325. package/eigen/Eigen/src/SparseCore/SparseAssign.h +174 -111
  326. package/eigen/Eigen/src/SparseCore/SparseBlock.h +408 -477
  327. package/eigen/Eigen/src/SparseCore/SparseColEtree.h +100 -112
  328. package/eigen/Eigen/src/SparseCore/SparseCompressedBase.h +531 -280
  329. package/eigen/Eigen/src/SparseCore/SparseCwiseBinaryOp.h +559 -347
  330. package/eigen/Eigen/src/SparseCore/SparseCwiseUnaryOp.h +100 -108
  331. package/eigen/Eigen/src/SparseCore/SparseDenseProduct.h +185 -191
  332. package/eigen/Eigen/src/SparseCore/SparseDiagonalProduct.h +71 -71
  333. package/eigen/Eigen/src/SparseCore/SparseDot.h +49 -47
  334. package/eigen/Eigen/src/SparseCore/SparseFuzzy.h +13 -11
  335. package/eigen/Eigen/src/SparseCore/SparseMap.h +243 -253
  336. package/eigen/Eigen/src/SparseCore/SparseMatrix.h +1614 -1142
  337. package/eigen/Eigen/src/SparseCore/SparseMatrixBase.h +403 -357
  338. package/eigen/Eigen/src/SparseCore/SparsePermutation.h +186 -115
  339. package/eigen/Eigen/src/SparseCore/SparseProduct.h +100 -91
  340. package/eigen/Eigen/src/SparseCore/SparseRedux.h +22 -24
  341. package/eigen/Eigen/src/SparseCore/SparseRef.h +268 -295
  342. package/eigen/Eigen/src/SparseCore/SparseSelfAdjointView.h +371 -414
  343. package/eigen/Eigen/src/SparseCore/SparseSolverBase.h +78 -87
  344. package/eigen/Eigen/src/SparseCore/SparseSparseProductWithPruning.h +81 -95
  345. package/eigen/Eigen/src/SparseCore/SparseTranspose.h +62 -71
  346. package/eigen/Eigen/src/SparseCore/SparseTriangularView.h +132 -144
  347. package/eigen/Eigen/src/SparseCore/SparseUtil.h +146 -115
  348. package/eigen/Eigen/src/SparseCore/SparseVector.h +426 -372
  349. package/eigen/Eigen/src/SparseCore/SparseView.h +164 -193
  350. package/eigen/Eigen/src/SparseCore/TriangularSolver.h +129 -170
  351. package/eigen/Eigen/src/SparseLU/InternalHeaderCheck.h +3 -0
  352. package/eigen/Eigen/src/SparseLU/SparseLU.h +814 -618
  353. package/eigen/Eigen/src/SparseLU/SparseLUImpl.h +61 -48
  354. package/eigen/Eigen/src/SparseLU/SparseLU_Memory.h +102 -118
  355. package/eigen/Eigen/src/SparseLU/SparseLU_Structs.h +38 -35
  356. package/eigen/Eigen/src/SparseLU/SparseLU_SupernodalMatrix.h +273 -255
  357. package/eigen/Eigen/src/SparseLU/SparseLU_Utils.h +44 -49
  358. package/eigen/Eigen/src/SparseLU/SparseLU_column_bmod.h +104 -108
  359. package/eigen/Eigen/src/SparseLU/SparseLU_column_dfs.h +90 -101
  360. package/eigen/Eigen/src/SparseLU/SparseLU_copy_to_ucol.h +57 -58
  361. package/eigen/Eigen/src/SparseLU/SparseLU_heap_relax_snode.h +43 -55
  362. package/eigen/Eigen/src/SparseLU/SparseLU_kernel_bmod.h +74 -71
  363. package/eigen/Eigen/src/SparseLU/SparseLU_panel_bmod.h +125 -133
  364. package/eigen/Eigen/src/SparseLU/SparseLU_panel_dfs.h +136 -159
  365. package/eigen/Eigen/src/SparseLU/SparseLU_pivotL.h +51 -52
  366. package/eigen/Eigen/src/SparseLU/SparseLU_pruneL.h +67 -73
  367. package/eigen/Eigen/src/SparseLU/SparseLU_relax_snode.h +24 -26
  368. package/eigen/Eigen/src/SparseQR/InternalHeaderCheck.h +3 -0
  369. package/eigen/Eigen/src/SparseQR/SparseQR.h +451 -490
  370. package/eigen/Eigen/src/StlSupport/StdDeque.h +28 -105
  371. package/eigen/Eigen/src/StlSupport/StdList.h +28 -84
  372. package/eigen/Eigen/src/StlSupport/StdVector.h +28 -108
  373. package/eigen/Eigen/src/StlSupport/details.h +48 -50
  374. package/eigen/Eigen/src/SuperLUSupport/InternalHeaderCheck.h +3 -0
  375. package/eigen/Eigen/src/SuperLUSupport/SuperLUSupport.h +634 -732
  376. package/eigen/Eigen/src/ThreadPool/Barrier.h +70 -0
  377. package/eigen/Eigen/src/ThreadPool/CoreThreadPoolDevice.h +336 -0
  378. package/eigen/Eigen/src/ThreadPool/EventCount.h +241 -0
  379. package/eigen/Eigen/src/ThreadPool/ForkJoin.h +140 -0
  380. package/eigen/Eigen/src/ThreadPool/InternalHeaderCheck.h +4 -0
  381. package/eigen/Eigen/src/ThreadPool/NonBlockingThreadPool.h +587 -0
  382. package/eigen/Eigen/src/ThreadPool/RunQueue.h +230 -0
  383. package/eigen/Eigen/src/ThreadPool/ThreadCancel.h +21 -0
  384. package/eigen/Eigen/src/ThreadPool/ThreadEnvironment.h +43 -0
  385. package/eigen/Eigen/src/ThreadPool/ThreadLocal.h +289 -0
  386. package/eigen/Eigen/src/ThreadPool/ThreadPoolInterface.h +50 -0
  387. package/eigen/Eigen/src/ThreadPool/ThreadYield.h +16 -0
  388. package/eigen/Eigen/src/UmfPackSupport/InternalHeaderCheck.h +3 -0
  389. package/eigen/Eigen/src/UmfPackSupport/UmfPackSupport.h +480 -380
  390. package/eigen/Eigen/src/misc/Image.h +41 -43
  391. package/eigen/Eigen/src/misc/InternalHeaderCheck.h +3 -0
  392. package/eigen/Eigen/src/misc/Kernel.h +39 -41
  393. package/eigen/Eigen/src/misc/RealSvd2x2.h +19 -21
  394. package/eigen/Eigen/src/misc/blas.h +83 -426
  395. package/eigen/Eigen/src/misc/lapacke.h +9976 -16182
  396. package/eigen/Eigen/src/misc/lapacke_helpers.h +163 -0
  397. package/eigen/Eigen/src/misc/lapacke_mangling.h +4 -5
  398. package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.inc +344 -0
  399. package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.inc +544 -0
  400. package/eigen/Eigen/src/plugins/BlockMethods.inc +1370 -0
  401. package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.inc +116 -0
  402. package/eigen/Eigen/src/plugins/CommonCwiseUnaryOps.inc +167 -0
  403. package/eigen/Eigen/src/plugins/IndexedViewMethods.inc +192 -0
  404. package/eigen/Eigen/src/plugins/InternalHeaderCheck.inc +3 -0
  405. package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.inc +331 -0
  406. package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.inc +118 -0
  407. package/eigen/Eigen/src/plugins/ReshapedMethods.inc +133 -0
  408. package/lib/LibEigen.d.ts +4 -0
  409. package/lib/LibEigen.js +14 -0
  410. package/lib/index.d.ts +1 -1
  411. package/lib/index.js +7 -3
  412. package/package.json +2 -10
  413. package/eigen/Eigen/CMakeLists.txt +0 -19
  414. package/eigen/Eigen/src/Core/BooleanRedux.h +0 -164
  415. package/eigen/Eigen/src/Core/arch/CUDA/Complex.h +0 -103
  416. package/eigen/Eigen/src/Core/arch/CUDA/Half.h +0 -675
  417. package/eigen/Eigen/src/Core/arch/CUDA/MathFunctions.h +0 -91
  418. package/eigen/Eigen/src/Core/arch/CUDA/PacketMath.h +0 -333
  419. package/eigen/Eigen/src/Core/arch/CUDA/PacketMathHalf.h +0 -1124
  420. package/eigen/Eigen/src/Core/arch/CUDA/TypeCasting.h +0 -212
  421. package/eigen/Eigen/src/Core/util/NonMPL2.h +0 -3
  422. package/eigen/Eigen/src/Geometry/arch/Geometry_SSE.h +0 -161
  423. package/eigen/Eigen/src/LU/arch/Inverse_SSE.h +0 -338
  424. package/eigen/Eigen/src/SparseCore/MappedSparseMatrix.h +0 -67
  425. package/eigen/Eigen/src/SparseLU/SparseLU_gemm_kernel.h +0 -280
  426. package/eigen/Eigen/src/misc/lapack.h +0 -152
  427. package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.h +0 -332
  428. package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.h +0 -552
  429. package/eigen/Eigen/src/plugins/BlockMethods.h +0 -1058
  430. package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.h +0 -115
  431. package/eigen/Eigen/src/plugins/CommonCwiseUnaryOps.h +0 -163
  432. package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.h +0 -152
  433. package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.h +0 -85
  434. package/lib/eigen.d.ts +0 -2
  435. package/lib/eigen.js +0 -15
@@ -0,0 +1,52 @@
1
+ // This file is part of Eigen, a lightweight C++ template library
2
+ // for linear algebra.
3
+ //
4
+ // Copyright (C) 2020, Arm Limited and Contributors
5
+ //
6
+ // This Source Code Form is subject to the terms of the Mozilla
7
+ // Public License v. 2.0. If a copy of the MPL was not distributed
8
+ // with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
9
+
10
+ #ifndef EIGEN_TYPE_CASTING_SVE_H
11
+ #define EIGEN_TYPE_CASTING_SVE_H
12
+
13
+ // IWYU pragma: private
14
+ #include "../../InternalHeaderCheck.h"
15
+
16
+ namespace Eigen {
17
+ namespace internal {
18
+
19
+ template <>  // Explicit specialization of type_casting_traits for the (float, numext::int32_t) type pair.
20
+ struct type_casting_traits<float, numext::int32_t> {
21
+ enum { VectorizedCast = 1, SrcCoeffRatio = 1, TgtCoeffRatio = 1 };  // all three trait constants are set to 1 for this pair
22
+ };
23
+
24
+ template <>  // Explicit specialization of type_casting_traits for the (numext::int32_t, float) type pair.
25
+ struct type_casting_traits<numext::int32_t, float> {
26
+ enum { VectorizedCast = 1, SrcCoeffRatio = 1, TgtCoeffRatio = 1 };  // same constants as the (float, numext::int32_t) specialization
27
+ };
28
+
29
+ template <>  // Specialization of pcast taking a PacketXi and returning a PacketXf.
30
+ EIGEN_STRONG_INLINE PacketXf pcast<PacketXi, PacketXf>(const PacketXi& a) {
31
+ return svcvt_f32_s32_x(svptrue_b32(), a);  // forwards to svcvt_f32_s32_x; svptrue_b32() is presumably an all-lanes-active predicate (confirm against the Arm ACLE)
32
+ }
33
+
34
+ template <>  // Specialization of pcast taking a PacketXf and returning a PacketXi.
35
+ EIGEN_STRONG_INLINE PacketXi pcast<PacketXf, PacketXi>(const PacketXf& a) {
36
+ return svcvt_s32_f32_x(svptrue_b32(), a);  // forwards to svcvt_s32_f32_x; NOTE(review): rounding/saturation behaviour is defined by the intrinsic, not visible here
37
+ }
38
+
39
+ template <>  // Specialization of preinterpret taking a PacketXi and returning a PacketXf.
40
+ EIGEN_STRONG_INLINE PacketXf preinterpret<PacketXf, PacketXi>(const PacketXi& a) {
41
+ return svreinterpret_f32_s32(a);  // forwards to svreinterpret_f32_s32; presumably a bit-pattern reinterpretation with no value conversion (confirm against the Arm ACLE)
42
+ }
43
+
44
+ template <>  // Specialization of preinterpret taking a PacketXf and returning a PacketXi.
45
+ EIGEN_STRONG_INLINE PacketXi preinterpret<PacketXi, PacketXf>(const PacketXf& a) {
46
+ return svreinterpret_s32_f32(a);  // forwards to svreinterpret_s32_f32; presumably the inverse reinterpretation of svreinterpret_f32_s32 (confirm against the Arm ACLE)
47
+ }
48
+
49
+ } // namespace internal
50
+ } // namespace Eigen
51
+
52
+ #endif // EIGEN_TYPE_CASTING_SVE_H
@@ -0,0 +1,227 @@
1
+ // This file is part of Eigen, a lightweight C++ template library
2
+ // for linear algebra.
3
+ //
4
+ // Mehdi Goli Codeplay Software Ltd.
5
+ // Ralph Potter Codeplay Software Ltd.
6
+ // Luke Iwanski Codeplay Software Ltd.
7
+ // Contact: <eigen@codeplay.com>
8
+ //
9
+ // This Source Code Form is subject to the terms of the Mozilla
10
+ // Public License v. 2.0. If a copy of the MPL was not distributed
11
+ // with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
12
+
13
+ /*****************************************************************
14
+ * InteropHeaders.h
15
+ *
16
+ * \brief:
17
+ * InteropHeaders
18
+ *
19
+ *****************************************************************/
20
+
21
+ #ifndef EIGEN_INTEROP_HEADERS_SYCL_H
22
+ #define EIGEN_INTEROP_HEADERS_SYCL_H
23
+
24
+ // IWYU pragma: private
25
+ #include "../../InternalHeaderCheck.h"
26
+
27
+ namespace Eigen {
28
+
29
+ #if !defined(EIGEN_DONT_VECTORIZE_SYCL)
30
+
31
+ namespace internal {
32
+ // Traits base shared by the SYCL packet types: extends default_packet_traits, takes `size` from `lengths` and HasBlend from `has_blend`; the special functions (HasLGamma ... HasBetaInc) are set to 0.
33
+ template <int has_blend, int lengths>
34
+ struct sycl_packet_traits : default_packet_traits {
35
+ enum {
36
+ Vectorizable = 1,
37
+ AlignedOnScalar = 1,
38
+ size = lengths,
39
+ HasDiv = 1,
40
+ HasLog = 1,
41
+ HasExp = 1,
42
+ HasSqrt = 1,
43
+ HasRsqrt = 1,
44
+ HasSin = 1,
45
+ HasCos = 1,
46
+ HasTan = 1,
47
+ HasASin = 1,
48
+ HasACos = 1,
49
+ HasATan = 1,
50
+ HasSinh = 1,
51
+ HasCosh = 1,
52
+ HasTanh = 1,
53
+ HasLGamma = 0,
54
+ HasDiGamma = 0,
55
+ HasZeta = 0,
56
+ HasPolygamma = 0,
57
+ HasErf = 0,
58
+ HasErfc = 0,
59
+ HasNdtri = 0,
60
+ HasIGamma = 0,
61
+ HasIGammac = 0,
62
+ HasBetaInc = 0,
63
+ HasBlend = has_blend,
64
+ // HasCmp indicates whether packet comparison is supported;
65
+ // pcmp_eq, pcmp_lt and pcmp_le must be defined for it to be true.
66
+ HasCmp = 1,
67
+ HasMax = 1,
68
+ HasMin = 1,
69
+ HasMul = 1,
70
+ HasAdd = 1,
71
+ HasFloor = 1,
72
+ HasRound = 1,
73
+ HasRint = 1,
74
+ HasLog1p = 1,
75
+ HasExpm1 = 1,
76
+ HasCeil = 1,
77
+ };
78
+ };
79
+
80
+ #ifdef SYCL_DEVICE_ONLY
81
+ #define SYCL_PACKET_TRAITS(packet_type, has_blend, unpacket_type, lengths) \
82
+ template <> \
83
+ struct packet_traits<unpacket_type> : sycl_packet_traits<has_blend, lengths> { \
84
+ typedef packet_type type; \
85
+ typedef packet_type half; \
86
+ };
87
+ // packet_traits per scalar (and its const variant): Eigen::half -> cl_half8 (8), float -> cl_float4 (4), double -> cl_double2 (2, has_blend = 0); `half` is the same type as `type`.
88
+ SYCL_PACKET_TRAITS(cl::sycl::cl_half8, 1, Eigen::half, 8)
89
+ SYCL_PACKET_TRAITS(cl::sycl::cl_half8, 1, const Eigen::half, 8)
90
+ SYCL_PACKET_TRAITS(cl::sycl::cl_float4, 1, float, 4)
91
+ SYCL_PACKET_TRAITS(cl::sycl::cl_float4, 1, const float, 4)
92
+ SYCL_PACKET_TRAITS(cl::sycl::cl_double2, 0, double, 2)
93
+ SYCL_PACKET_TRAITS(cl::sycl::cl_double2, 0, const double, 2)
94
+ #undef SYCL_PACKET_TRAITS
95
+
96
+ // These definitions are only available when targeting a GPU (SYCL_DEVICE_ONLY),
97
+ // so they cannot conflict with the packet_traits used on the host side (SSE, AVX, ...).
98
+ // SYCL_ARITHMETIC specializes is_arithmetic<> with value = true for each SYCL vector type.
99
+ #define SYCL_ARITHMETIC(packet_type) \
100
+ template <> \
101
+ struct is_arithmetic<packet_type> { \
102
+ enum { value = true }; \
103
+ };
104
+ SYCL_ARITHMETIC(cl::sycl::cl_half8)
105
+ SYCL_ARITHMETIC(cl::sycl::cl_float4)
106
+ SYCL_ARITHMETIC(cl::sycl::cl_double2)
107
+ #undef SYCL_ARITHMETIC
108
+ // unpacket_traits for each SYCL vector type: scalar type, lane count (`size`), vectorizable = true, alignment = Aligned16; `half` is the packet type itself.
109
+ #define SYCL_UNPACKET_TRAITS(packet_type, unpacket_type, lengths) \
110
+ template <> \
111
+ struct unpacket_traits<packet_type> { \
112
+ typedef unpacket_type type; \
113
+ enum { size = lengths, vectorizable = true, alignment = Aligned16 }; \
114
+ typedef packet_type half; \
115
+ };
116
+ SYCL_UNPACKET_TRAITS(cl::sycl::cl_half8, Eigen::half, 8)
117
+ SYCL_UNPACKET_TRAITS(cl::sycl::cl_float4, float, 4)
118
+ SYCL_UNPACKET_TRAITS(cl::sycl::cl_double2, double, 2)
119
+
120
+ #undef SYCL_UNPACKET_TRAITS
121
+ #endif
122
+
123
+ } // end namespace internal
124
+
125
+ #endif
126
+
127
+ namespace TensorSycl {
128
+ namespace internal {
129
+ // PacketWrapper<PacketReturnType, PacketSize>: static helpers scalarize(), convert_to_packet_type() and set_packet() for a packet type of the given size.
130
+ template <typename PacketReturnType, int PacketSize>
131
+ struct PacketWrapper;
132
+ // Host-only primary template (compiled when SYCL_DEVICE_ONLY is not defined); it should never get called on the device. scalarize() and set_packet() assert and abort.
133
+ #ifndef SYCL_DEVICE_ONLY
134
+ template <typename PacketReturnType, int PacketSize>
135
+ struct PacketWrapper {
136
+ typedef typename ::Eigen::internal::unpacket_traits<PacketReturnType>::type Scalar;
137
+ template <typename Index>
138
+ EIGEN_DEVICE_FUNC static Scalar scalarize(Index, PacketReturnType &) {
139
+ eigen_assert(false && "THERE IS NO PACKETIZE VERSION FOR THE CHOSEN TYPE");
140
+ abort();
141
+ }
142
+ EIGEN_DEVICE_FUNC static PacketReturnType convert_to_packet_type(Scalar in, Scalar) {
143
+ return ::Eigen::internal::template plset<PacketReturnType>(in);
144
+ }
145
+ EIGEN_DEVICE_FUNC static void set_packet(PacketReturnType, Scalar *) {
146
+ eigen_assert(false && "THERE IS NO PACKETIZE VERSION FOR THE CHOSEN TYPE");
147
+ abort();
148
+ }
149
+ };
150
+ // Device-side specialization for 4-element packets (in the SYCL_DEVICE_ONLY branch below): elements are read through x(), y(), z() and w().
151
+ #elif defined(SYCL_DEVICE_ONLY)
152
+ template <typename PacketReturnType>
153
+ struct PacketWrapper<PacketReturnType, 4> {
154
+ typedef typename ::Eigen::internal::unpacket_traits<PacketReturnType>::type Scalar;
155
+ template <typename Index>
156
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static Scalar scalarize(Index index, PacketReturnType &in) {
157
+ switch (index) {
158
+ case 0:
159
+ return in.x();
160
+ case 1:
161
+ return in.y();
162
+ case 2:
163
+ return in.z();
164
+ case 3:
165
+ return in.w();
166
+ default:
167
+ // The index must be between 0 and 3. There is no abort function in a SYCL kernel, so we cannot use abort here.
168
+ // Control is never expected to reach this point.
169
+ __builtin_unreachable();
170
+ }
171
+ __builtin_unreachable();
172
+ }
173
+ // Builds PacketReturnType(in, other, other, other): `in` followed by three copies of `other`.
174
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static PacketReturnType convert_to_packet_type(Scalar in, Scalar other) {
175
+ return PacketReturnType(in, other, other, other);
176
+ }
177
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static void set_packet(PacketReturnType &lhs, Scalar *rhs) {
178
+ lhs = PacketReturnType(rhs[0], rhs[1], rhs[2], rhs[3]);
179
+ }
180
+ };
181
+ // Specialization for single-element packets: scalarize() ignores the index and returns `in`, convert_to_packet_type() ignores its second argument, set_packet() assigns rhs[0].
182
+ template <typename PacketReturnType>
183
+ struct PacketWrapper<PacketReturnType, 1> {
184
+ typedef typename ::Eigen::internal::unpacket_traits<PacketReturnType>::type Scalar;
185
+ template <typename Index>
186
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static Scalar scalarize(Index, PacketReturnType &in) {
187
+ return in;
188
+ }
189
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static PacketReturnType convert_to_packet_type(Scalar in, Scalar) {
190
+ return PacketReturnType(in);
191
+ }
192
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static void set_packet(PacketReturnType &lhs, Scalar *rhs) { lhs = rhs[0]; }
193
+ };
194
+ // Specialization for 2-element packets: elements are read through x() and y().
195
+ template <typename PacketReturnType>
196
+ struct PacketWrapper<PacketReturnType, 2> {
197
+ typedef typename ::Eigen::internal::unpacket_traits<PacketReturnType>::type Scalar;
198
+ template <typename Index>
199
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static Scalar scalarize(Index index, PacketReturnType &in) {
200
+ switch (index) {
201
+ case 0:
202
+ return in.x();
203
+ case 1:
204
+ return in.y();
205
+ default:
206
+ // The index must be between 0 and 1. There is no abort function in a SYCL kernel, so we cannot use abort here.
207
+ // Control is never expected to reach this point.
208
+ __builtin_unreachable();
209
+ }
210
+ __builtin_unreachable();
211
+ }
212
+ // Builds PacketReturnType(in, other): `in` followed by `other`.
213
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static PacketReturnType convert_to_packet_type(Scalar in, Scalar other) {
214
+ return PacketReturnType(in, other);
215
+ }
216
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE static void set_packet(PacketReturnType &lhs, Scalar *rhs) {
217
+ lhs = PacketReturnType(rhs[0], rhs[1]);
218
+ }
219
+ };
220
+
221
+ #endif
222
+
223
+ } // end namespace internal
224
+ } // end namespace TensorSycl
225
+ } // end namespace Eigen
226
+
227
+ #endif // EIGEN_INTEROP_HEADERS_SYCL_H
@@ -0,0 +1,303 @@
1
+ // This file is part of Eigen, a lightweight C++ template library
2
+ // for linear algebra.
3
+ //
4
+ // Mehdi Goli Codeplay Software Ltd.
5
+ // Ralph Potter Codeplay Software Ltd.
6
+ // Luke Iwanski Codeplay Software Ltd.
7
+ // Contact: <eigen@codeplay.com>
8
+ //
9
+ // This Source Code Form is subject to the terms of the Mozilla
10
+ // Public License v. 2.0. If a copy of the MPL was not distributed
11
+ // with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
12
+
13
+ /*****************************************************************
14
+ * MathFunctions.h
15
+ *
16
+ * \brief:
17
+ * MathFunctions
18
+ *
19
+ *****************************************************************/
20
+
21
+ #ifndef EIGEN_MATH_FUNCTIONS_SYCL_H
22
+ #define EIGEN_MATH_FUNCTIONS_SYCL_H
23
+ // IWYU pragma: private
24
+ #include "../../InternalHeaderCheck.h"
25
+
26
+ namespace Eigen {
27
+
28
+ namespace internal {
29
+
30
+ // Make sure this is only available when targeting a GPU: we don't want to
31
+ // introduce conflicts between these packet_traits definitions and the ones
32
+ // we'll use on the host side (SSE, AVX, ...)
33
+ #if defined(SYCL_DEVICE_ONLY)
34
+ #define SYCL_PLOG(packet_type) \
35
+ template <> \
36
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type plog<packet_type>(const packet_type& a) { \
37
+ return cl::sycl::log(a); \
38
+ }
39
+ // plog specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::log.
40
+ SYCL_PLOG(cl::sycl::cl_half8)
41
+ SYCL_PLOG(cl::sycl::cl_float4)
42
+ SYCL_PLOG(cl::sycl::cl_double2)
43
+ #undef SYCL_PLOG
44
+ // plog1p specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::log1p.
45
+ #define SYCL_PLOG1P(packet_type) \
46
+ template <> \
47
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type plog1p<packet_type>(const packet_type& a) { \
48
+ return cl::sycl::log1p(a); \
49
+ }
50
+
51
+ SYCL_PLOG1P(cl::sycl::cl_half8)
52
+ SYCL_PLOG1P(cl::sycl::cl_float4)
53
+ SYCL_PLOG1P(cl::sycl::cl_double2)
54
+ #undef SYCL_PLOG1P
55
+ // plog10 specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::log10.
56
+ #define SYCL_PLOG10(packet_type) \
57
+ template <> \
58
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type plog10<packet_type>(const packet_type& a) { \
59
+ return cl::sycl::log10(a); \
60
+ }
61
+
62
+ SYCL_PLOG10(cl::sycl::cl_half8)
63
+ SYCL_PLOG10(cl::sycl::cl_float4)
64
+ SYCL_PLOG10(cl::sycl::cl_double2)
65
+ #undef SYCL_PLOG10
66
+ // pexp specializations forwarding to cl::sycl::exp; instantiated for the vector packets and also for the scalar cl_half and cl_float types.
67
+ #define SYCL_PEXP(packet_type) \
68
+ template <> \
69
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pexp<packet_type>(const packet_type& a) { \
70
+ return cl::sycl::exp(a); \
71
+ }
72
+
73
+ SYCL_PEXP(cl::sycl::cl_half8)
74
+ SYCL_PEXP(cl::sycl::cl_half)
75
+ SYCL_PEXP(cl::sycl::cl_float4)
76
+ SYCL_PEXP(cl::sycl::cl_float)
77
+ SYCL_PEXP(cl::sycl::cl_double2)
78
+ #undef SYCL_PEXP
79
+ // pexpm1 specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::expm1.
80
+ #define SYCL_PEXPM1(packet_type) \
81
+ template <> \
82
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pexpm1<packet_type>(const packet_type& a) { \
83
+ return cl::sycl::expm1(a); \
84
+ }
85
+
86
+ SYCL_PEXPM1(cl::sycl::cl_half8)
87
+ SYCL_PEXPM1(cl::sycl::cl_float4)
88
+ SYCL_PEXPM1(cl::sycl::cl_double2)
89
+ #undef SYCL_PEXPM1
90
+ // psqrt specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::sqrt.
91
+ #define SYCL_PSQRT(packet_type) \
92
+ template <> \
93
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type psqrt<packet_type>(const packet_type& a) { \
94
+ return cl::sycl::sqrt(a); \
95
+ }
96
+
97
+ SYCL_PSQRT(cl::sycl::cl_half8)
98
+ SYCL_PSQRT(cl::sycl::cl_float4)
99
+ SYCL_PSQRT(cl::sycl::cl_double2)
100
+ #undef SYCL_PSQRT
101
+ // prsqrt specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::rsqrt.
102
+ #define SYCL_PRSQRT(packet_type) \
103
+ template <> \
104
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type prsqrt<packet_type>(const packet_type& a) { \
105
+ return cl::sycl::rsqrt(a); \
106
+ }
107
+
108
+ SYCL_PRSQRT(cl::sycl::cl_half8)
109
+ SYCL_PRSQRT(cl::sycl::cl_float4)
110
+ SYCL_PRSQRT(cl::sycl::cl_double2)
111
+ #undef SYCL_PRSQRT
112
+
113
+ /** \internal \returns the sine of \a a (coeff-wise) */
114
+ #define SYCL_PSIN(packet_type) \
115
+ template <> \
116
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type psin<packet_type>(const packet_type& a) { \
117
+ return cl::sycl::sin(a); \
118
+ }
119
+
120
+ SYCL_PSIN(cl::sycl::cl_half8)
121
+ SYCL_PSIN(cl::sycl::cl_float4)
122
+ SYCL_PSIN(cl::sycl::cl_double2)
123
+ #undef SYCL_PSIN
124
+
125
+ /** \internal \returns the cosine of \a a (coeff-wise) */
126
+ #define SYCL_PCOS(packet_type) \
127
+ template <> \
128
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pcos<packet_type>(const packet_type& a) { \
129
+ return cl::sycl::cos(a); \
130
+ }
131
+
132
+ SYCL_PCOS(cl::sycl::cl_half8)
133
+ SYCL_PCOS(cl::sycl::cl_float4)
134
+ SYCL_PCOS(cl::sycl::cl_double2)
135
+ #undef SYCL_PCOS
136
+
137
+ /** \internal \returns the tangent of \a a (coeff-wise) */
138
+ #define SYCL_PTAN(packet_type) \
139
+ template <> \
140
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type ptan<packet_type>(const packet_type& a) { \
141
+ return cl::sycl::tan(a); \
142
+ }
143
+
144
+ SYCL_PTAN(cl::sycl::cl_half8)
145
+ SYCL_PTAN(cl::sycl::cl_float4)
146
+ SYCL_PTAN(cl::sycl::cl_double2)
147
+ #undef SYCL_PTAN
148
+
149
+ /** \internal \returns the arc sine of \a a (coeff-wise) */
150
+ #define SYCL_PASIN(packet_type) \
151
+ template <> \
152
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pasin<packet_type>(const packet_type& a) { \
153
+ return cl::sycl::asin(a); \
154
+ }
155
+
156
+ SYCL_PASIN(cl::sycl::cl_half8)
157
+ SYCL_PASIN(cl::sycl::cl_float4)
158
+ SYCL_PASIN(cl::sycl::cl_double2)
159
+ #undef SYCL_PASIN
160
+
161
+ /** \internal \returns the arc cosine of \a a (coeff-wise) */
162
+ #define SYCL_PACOS(packet_type) \
163
+ template <> \
164
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pacos<packet_type>(const packet_type& a) { \
165
+ return cl::sycl::acos(a); \
166
+ }
167
+
168
+ SYCL_PACOS(cl::sycl::cl_half8)
169
+ SYCL_PACOS(cl::sycl::cl_float4)
170
+ SYCL_PACOS(cl::sycl::cl_double2)
171
+ #undef SYCL_PACOS
172
+
173
+ /** \internal \returns the arc tangent of \a a (coeff-wise) */
174
+ #define SYCL_PATAN(packet_type) \
175
+ template <> \
176
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type patan<packet_type>(const packet_type& a) { \
177
+ return cl::sycl::atan(a); \
178
+ }
179
+
180
+ SYCL_PATAN(cl::sycl::cl_half8)
181
+ SYCL_PATAN(cl::sycl::cl_float4)
182
+ SYCL_PATAN(cl::sycl::cl_double2)
183
+ #undef SYCL_PATAN
184
+
185
+ /** \internal \returns the hyperbolic sine of \a a (coeff-wise), computed with cl::sycl::sinh */
186
+ #define SYCL_PSINH(packet_type) \
187
+ template <> \
188
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type psinh<packet_type>(const packet_type& a) { \
189
+ return cl::sycl::sinh(a); \
190
+ }
191
+
192
+ SYCL_PSINH(cl::sycl::cl_half8)
193
+ SYCL_PSINH(cl::sycl::cl_float4)
194
+ SYCL_PSINH(cl::sycl::cl_double2)
195
+ #undef SYCL_PSINH
196
+
197
+ /** \internal \returns the hyperbolic cosine of \a a (coeff-wise), computed with cl::sycl::cosh */
198
+ #define SYCL_PCOSH(packet_type) \
199
+ template <> \
200
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pcosh<packet_type>(const packet_type& a) { \
201
+ return cl::sycl::cosh(a); \
202
+ }
203
+
204
+ SYCL_PCOSH(cl::sycl::cl_half8)
205
+ SYCL_PCOSH(cl::sycl::cl_float4)
206
+ SYCL_PCOSH(cl::sycl::cl_double2)
207
+ #undef SYCL_PCOSH
208
+
209
+ /** \internal \returns the hyperbolic tangent of \a a (coeff-wise), computed with cl::sycl::tanh */
210
+ #define SYCL_PTANH(packet_type) \
211
+ template <> \
212
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type ptanh<packet_type>(const packet_type& a) { \
213
+ return cl::sycl::tanh(a); \
214
+ }
215
+
216
+ SYCL_PTANH(cl::sycl::cl_half8)
217
+ SYCL_PTANH(cl::sycl::cl_float4)
218
+ SYCL_PTANH(cl::sycl::cl_double2)
219
+ #undef SYCL_PTANH
220
+ // pceil specializations forwarding to cl::sycl::ceil. cl_half8 is the packet type registered for Eigen::half (with HasCeil = 1), so it gets a specialization like every other op here; the scalar cl_half one is kept for compatibility.
221
+ #define SYCL_PCEIL(packet_type) \
222
+ template <> \
223
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pceil<packet_type>(const packet_type& a) { \
224
+ return cl::sycl::ceil(a); \
225
+ }
226
+ SYCL_PCEIL(cl::sycl::cl_half8)
227
+ SYCL_PCEIL(cl::sycl::cl_half)
228
+ SYCL_PCEIL(cl::sycl::cl_float4)
229
+ SYCL_PCEIL(cl::sycl::cl_double2)
230
+ #undef SYCL_PCEIL
231
+ // pround specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::round.
232
+ #define SYCL_PROUND(packet_type) \
233
+ template <> \
234
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pround<packet_type>(const packet_type& a) { \
235
+ return cl::sycl::round(a); \
236
+ }
237
+
238
+ SYCL_PROUND(cl::sycl::cl_half8)
239
+ SYCL_PROUND(cl::sycl::cl_float4)
240
+ SYCL_PROUND(cl::sycl::cl_double2)
241
+ #undef SYCL_PROUND
242
+ // `print` here is the packet rint operation (not output printing): each specialization forwards to cl::sycl::rint.
243
+ #define SYCL_PRINT(packet_type) \
244
+ template <> \
245
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type print<packet_type>(const packet_type& a) { \
246
+ return cl::sycl::rint(a); \
247
+ }
248
+
249
+ SYCL_PRINT(cl::sycl::cl_half8)
250
+ SYCL_PRINT(cl::sycl::cl_float4)
251
+ SYCL_PRINT(cl::sycl::cl_double2)
252
+ #undef SYCL_PRINT
253
+ // pfloor specializations for the cl_half8, cl_float4 and cl_double2 packets; each forwards to cl::sycl::floor.
254
+ #define SYCL_FLOOR(packet_type) \
255
+ template <> \
256
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pfloor<packet_type>(const packet_type& a) { \
257
+ return cl::sycl::floor(a); \
258
+ }
259
+
260
+ SYCL_FLOOR(cl::sycl::cl_half8)
261
+ SYCL_FLOOR(cl::sycl::cl_float4)
262
+ SYCL_FLOOR(cl::sycl::cl_double2)
263
+ #undef SYCL_FLOOR
264
+ // pmin specializations: the macro returns the `expr` supplied per type, which is cl::sycl::fmin(a, b) for all three packets.
265
+ #define SYCL_PMIN(packet_type, expr) \
266
+ template <> \
267
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pmin<packet_type>(const packet_type& a, const packet_type& b) { \
268
+ return expr; \
269
+ }
270
+
271
+ SYCL_PMIN(cl::sycl::cl_half8, cl::sycl::fmin(a, b))
272
+ SYCL_PMIN(cl::sycl::cl_float4, cl::sycl::fmin(a, b))
273
+ SYCL_PMIN(cl::sycl::cl_double2, cl::sycl::fmin(a, b))
274
+ #undef SYCL_PMIN
275
+ // pmax specializations: the macro returns the `expr` supplied per type, which is cl::sycl::fmax(a, b) for all three packets.
276
+ #define SYCL_PMAX(packet_type, expr) \
277
+ template <> \
278
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pmax<packet_type>(const packet_type& a, const packet_type& b) { \
279
+ return expr; \
280
+ }
281
+
282
+ SYCL_PMAX(cl::sycl::cl_half8, cl::sycl::fmax(a, b))
283
+ SYCL_PMAX(cl::sycl::cl_float4, cl::sycl::fmax(a, b))
284
+ SYCL_PMAX(cl::sycl::cl_double2, cl::sycl::fmax(a, b))
285
+ #undef SYCL_PMAX
286
+ // pldexp specializations: `exponent` is converted to cl_int elements (rounding_mode::automatic) and passed with `a` to cl::sycl::ldexp.
287
+ #define SYCL_PLDEXP(packet_type) \
288
+ template <> \
289
+ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE packet_type pldexp(const packet_type& a, const packet_type& exponent) { \
290
+ return cl::sycl::ldexp(a, exponent.template convert<cl::sycl::cl_int, cl::sycl::rounding_mode::automatic>()); \
291
+ }
292
+
293
+ SYCL_PLDEXP(cl::sycl::cl_half8)
294
+ SYCL_PLDEXP(cl::sycl::cl_float4)
295
+ SYCL_PLDEXP(cl::sycl::cl_double2)
296
+ #undef SYCL_PLDEXP
297
+
298
+ #endif
299
+ } // end namespace internal
300
+
301
+ } // end namespace Eigen
302
+
303
+ #endif // EIGEN_MATH_FUNCTIONS_SYCL_H