@smake/eigen 1.1.0 → 1.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/eigen/Eigen/AccelerateSupport +52 -0
- package/eigen/Eigen/Cholesky +18 -20
- package/eigen/Eigen/CholmodSupport +28 -28
- package/eigen/Eigen/Core +187 -120
- package/eigen/Eigen/Eigenvalues +16 -13
- package/eigen/Eigen/Geometry +18 -18
- package/eigen/Eigen/Householder +9 -7
- package/eigen/Eigen/IterativeLinearSolvers +8 -4
- package/eigen/Eigen/Jacobi +14 -13
- package/eigen/Eigen/KLUSupport +23 -21
- package/eigen/Eigen/LU +15 -16
- package/eigen/Eigen/MetisSupport +12 -12
- package/eigen/Eigen/OrderingMethods +54 -51
- package/eigen/Eigen/PaStiXSupport +23 -21
- package/eigen/Eigen/PardisoSupport +17 -14
- package/eigen/Eigen/QR +18 -20
- package/eigen/Eigen/QtAlignedMalloc +5 -12
- package/eigen/Eigen/SPQRSupport +21 -14
- package/eigen/Eigen/SVD +23 -17
- package/eigen/Eigen/Sparse +1 -2
- package/eigen/Eigen/SparseCholesky +18 -15
- package/eigen/Eigen/SparseCore +18 -17
- package/eigen/Eigen/SparseLU +9 -9
- package/eigen/Eigen/SparseQR +16 -14
- package/eigen/Eigen/StdDeque +5 -2
- package/eigen/Eigen/StdList +5 -2
- package/eigen/Eigen/StdVector +5 -2
- package/eigen/Eigen/SuperLUSupport +30 -24
- package/eigen/Eigen/ThreadPool +80 -0
- package/eigen/Eigen/UmfPackSupport +19 -17
- package/eigen/Eigen/Version +14 -0
- package/eigen/Eigen/src/AccelerateSupport/AccelerateSupport.h +423 -0
- package/eigen/Eigen/src/AccelerateSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Cholesky/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Cholesky/LDLT.h +366 -405
- package/eigen/Eigen/src/Cholesky/LLT.h +323 -367
- package/eigen/Eigen/src/Cholesky/LLT_LAPACKE.h +81 -56
- package/eigen/Eigen/src/CholmodSupport/CholmodSupport.h +585 -529
- package/eigen/Eigen/src/CholmodSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Core/ArithmeticSequence.h +143 -317
- package/eigen/Eigen/src/Core/Array.h +329 -370
- package/eigen/Eigen/src/Core/ArrayBase.h +190 -203
- package/eigen/Eigen/src/Core/ArrayWrapper.h +126 -170
- package/eigen/Eigen/src/Core/Assign.h +30 -40
- package/eigen/Eigen/src/Core/AssignEvaluator.h +651 -604
- package/eigen/Eigen/src/Core/Assign_MKL.h +125 -120
- package/eigen/Eigen/src/Core/BandMatrix.h +267 -282
- package/eigen/Eigen/src/Core/Block.h +371 -390
- package/eigen/Eigen/src/Core/CommaInitializer.h +85 -100
- package/eigen/Eigen/src/Core/ConditionEstimator.h +51 -53
- package/eigen/Eigen/src/Core/CoreEvaluators.h +1214 -937
- package/eigen/Eigen/src/Core/CoreIterators.h +72 -63
- package/eigen/Eigen/src/Core/CwiseBinaryOp.h +112 -129
- package/eigen/Eigen/src/Core/CwiseNullaryOp.h +676 -702
- package/eigen/Eigen/src/Core/CwiseTernaryOp.h +77 -103
- package/eigen/Eigen/src/Core/CwiseUnaryOp.h +55 -67
- package/eigen/Eigen/src/Core/CwiseUnaryView.h +127 -92
- package/eigen/Eigen/src/Core/DenseBase.h +630 -658
- package/eigen/Eigen/src/Core/DenseCoeffsBase.h +511 -628
- package/eigen/Eigen/src/Core/DenseStorage.h +511 -590
- package/eigen/Eigen/src/Core/DeviceWrapper.h +153 -0
- package/eigen/Eigen/src/Core/Diagonal.h +168 -207
- package/eigen/Eigen/src/Core/DiagonalMatrix.h +346 -317
- package/eigen/Eigen/src/Core/DiagonalProduct.h +12 -10
- package/eigen/Eigen/src/Core/Dot.h +167 -217
- package/eigen/Eigen/src/Core/EigenBase.h +74 -85
- package/eigen/Eigen/src/Core/Fill.h +138 -0
- package/eigen/Eigen/src/Core/FindCoeff.h +464 -0
- package/eigen/Eigen/src/Core/ForceAlignedAccess.h +90 -113
- package/eigen/Eigen/src/Core/Fuzzy.h +82 -105
- package/eigen/Eigen/src/Core/GeneralProduct.h +315 -261
- package/eigen/Eigen/src/Core/GenericPacketMath.h +1182 -520
- package/eigen/Eigen/src/Core/GlobalFunctions.h +193 -157
- package/eigen/Eigen/src/Core/IO.h +131 -156
- package/eigen/Eigen/src/Core/IndexedView.h +209 -125
- package/eigen/Eigen/src/Core/InnerProduct.h +260 -0
- package/eigen/Eigen/src/Core/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Core/Inverse.h +50 -59
- package/eigen/Eigen/src/Core/Map.h +123 -141
- package/eigen/Eigen/src/Core/MapBase.h +255 -282
- package/eigen/Eigen/src/Core/MathFunctions.h +1247 -1201
- package/eigen/Eigen/src/Core/MathFunctionsImpl.h +162 -99
- package/eigen/Eigen/src/Core/Matrix.h +463 -494
- package/eigen/Eigen/src/Core/MatrixBase.h +468 -470
- package/eigen/Eigen/src/Core/NestByValue.h +58 -52
- package/eigen/Eigen/src/Core/NoAlias.h +79 -86
- package/eigen/Eigen/src/Core/NumTraits.h +206 -206
- package/eigen/Eigen/src/Core/PartialReduxEvaluator.h +163 -142
- package/eigen/Eigen/src/Core/PermutationMatrix.h +461 -511
- package/eigen/Eigen/src/Core/PlainObjectBase.h +858 -972
- package/eigen/Eigen/src/Core/Product.h +246 -130
- package/eigen/Eigen/src/Core/ProductEvaluators.h +779 -671
- package/eigen/Eigen/src/Core/Random.h +153 -164
- package/eigen/Eigen/src/Core/RandomImpl.h +262 -0
- package/eigen/Eigen/src/Core/RealView.h +250 -0
- package/eigen/Eigen/src/Core/Redux.h +334 -314
- package/eigen/Eigen/src/Core/Ref.h +259 -257
- package/eigen/Eigen/src/Core/Replicate.h +92 -104
- package/eigen/Eigen/src/Core/Reshaped.h +215 -271
- package/eigen/Eigen/src/Core/ReturnByValue.h +47 -55
- package/eigen/Eigen/src/Core/Reverse.h +133 -148
- package/eigen/Eigen/src/Core/Select.h +68 -140
- package/eigen/Eigen/src/Core/SelfAdjointView.h +254 -290
- package/eigen/Eigen/src/Core/SelfCwiseBinaryOp.h +23 -20
- package/eigen/Eigen/src/Core/SkewSymmetricMatrix3.h +382 -0
- package/eigen/Eigen/src/Core/Solve.h +88 -102
- package/eigen/Eigen/src/Core/SolveTriangular.h +126 -124
- package/eigen/Eigen/src/Core/SolverBase.h +132 -133
- package/eigen/Eigen/src/Core/StableNorm.h +113 -147
- package/eigen/Eigen/src/Core/StlIterators.h +404 -248
- package/eigen/Eigen/src/Core/Stride.h +90 -92
- package/eigen/Eigen/src/Core/Swap.h +70 -39
- package/eigen/Eigen/src/Core/Transpose.h +258 -295
- package/eigen/Eigen/src/Core/Transpositions.h +270 -333
- package/eigen/Eigen/src/Core/TriangularMatrix.h +642 -743
- package/eigen/Eigen/src/Core/VectorBlock.h +59 -72
- package/eigen/Eigen/src/Core/VectorwiseOp.h +653 -704
- package/eigen/Eigen/src/Core/Visitor.h +464 -308
- package/eigen/Eigen/src/Core/arch/AVX/Complex.h +380 -187
- package/eigen/Eigen/src/Core/arch/AVX/MathFunctions.h +65 -163
- package/eigen/Eigen/src/Core/arch/AVX/PacketMath.h +2145 -638
- package/eigen/Eigen/src/Core/arch/AVX/Reductions.h +353 -0
- package/eigen/Eigen/src/Core/arch/AVX/TypeCasting.h +253 -60
- package/eigen/Eigen/src/Core/arch/AVX512/Complex.h +278 -228
- package/eigen/Eigen/src/Core/arch/AVX512/GemmKernel.h +1245 -0
- package/eigen/Eigen/src/Core/arch/AVX512/MathFunctions.h +48 -269
- package/eigen/Eigen/src/Core/arch/AVX512/MathFunctionsFP16.h +75 -0
- package/eigen/Eigen/src/Core/arch/AVX512/PacketMath.h +1597 -754
- package/eigen/Eigen/src/Core/arch/AVX512/PacketMathFP16.h +1413 -0
- package/eigen/Eigen/src/Core/arch/AVX512/Reductions.h +297 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TrsmKernel.h +1167 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TrsmUnrolls.inc +1219 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TypeCasting.h +229 -41
- package/eigen/Eigen/src/Core/arch/AVX512/TypeCastingFP16.h +130 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/Complex.h +420 -184
- package/eigen/Eigen/src/Core/arch/AltiVec/MathFunctions.h +40 -49
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProduct.h +2962 -2213
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductCommon.h +196 -212
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMA.h +713 -441
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMAbfloat16.h +742 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixVectorProduct.inc +2818 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/PacketMath.h +2380 -1362
- package/eigen/Eigen/src/Core/arch/AltiVec/TypeCasting.h +153 -0
- package/eigen/Eigen/src/Core/arch/Default/BFloat16.h +390 -224
- package/eigen/Eigen/src/Core/arch/Default/ConjHelper.h +78 -67
- package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctions.h +1784 -799
- package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctionsFwd.h +167 -50
- package/eigen/Eigen/src/Core/arch/Default/Half.h +528 -379
- package/eigen/Eigen/src/Core/arch/Default/Settings.h +10 -12
- package/eigen/Eigen/src/Core/arch/GPU/Complex.h +244 -0
- package/eigen/Eigen/src/Core/arch/GPU/MathFunctions.h +41 -40
- package/eigen/Eigen/src/Core/arch/GPU/PacketMath.h +550 -523
- package/eigen/Eigen/src/Core/arch/GPU/Tuple.h +268 -0
- package/eigen/Eigen/src/Core/arch/GPU/TypeCasting.h +27 -30
- package/eigen/Eigen/src/Core/arch/HIP/hcc/math_constants.h +8 -8
- package/eigen/Eigen/src/Core/arch/HVX/PacketMath.h +1088 -0
- package/eigen/Eigen/src/Core/arch/LSX/Complex.h +520 -0
- package/eigen/Eigen/src/Core/arch/LSX/GeneralBlockPanelKernel.h +23 -0
- package/eigen/Eigen/src/Core/arch/LSX/MathFunctions.h +43 -0
- package/eigen/Eigen/src/Core/arch/LSX/PacketMath.h +2866 -0
- package/eigen/Eigen/src/Core/arch/LSX/TypeCasting.h +526 -0
- package/eigen/Eigen/src/Core/arch/MSA/Complex.h +54 -82
- package/eigen/Eigen/src/Core/arch/MSA/MathFunctions.h +84 -92
- package/eigen/Eigen/src/Core/arch/MSA/PacketMath.h +51 -47
- package/eigen/Eigen/src/Core/arch/NEON/Complex.h +454 -306
- package/eigen/Eigen/src/Core/arch/NEON/GeneralBlockPanelKernel.h +175 -115
- package/eigen/Eigen/src/Core/arch/NEON/MathFunctions.h +23 -30
- package/eigen/Eigen/src/Core/arch/NEON/PacketMath.h +4366 -2857
- package/eigen/Eigen/src/Core/arch/NEON/TypeCasting.h +616 -393
- package/eigen/Eigen/src/Core/arch/NEON/UnaryFunctors.h +57 -0
- package/eigen/Eigen/src/Core/arch/SSE/Complex.h +350 -198
- package/eigen/Eigen/src/Core/arch/SSE/MathFunctions.h +38 -149
- package/eigen/Eigen/src/Core/arch/SSE/PacketMath.h +1791 -912
- package/eigen/Eigen/src/Core/arch/SSE/Reductions.h +324 -0
- package/eigen/Eigen/src/Core/arch/SSE/TypeCasting.h +128 -40
- package/eigen/Eigen/src/Core/arch/SVE/MathFunctions.h +10 -6
- package/eigen/Eigen/src/Core/arch/SVE/PacketMath.h +156 -234
- package/eigen/Eigen/src/Core/arch/SVE/TypeCasting.h +6 -3
- package/eigen/Eigen/src/Core/arch/SYCL/InteropHeaders.h +27 -32
- package/eigen/Eigen/src/Core/arch/SYCL/MathFunctions.h +119 -117
- package/eigen/Eigen/src/Core/arch/SYCL/PacketMath.h +325 -419
- package/eigen/Eigen/src/Core/arch/SYCL/TypeCasting.h +15 -17
- package/eigen/Eigen/src/Core/arch/ZVector/Complex.h +325 -181
- package/eigen/Eigen/src/Core/arch/ZVector/MathFunctions.h +94 -83
- package/eigen/Eigen/src/Core/arch/ZVector/PacketMath.h +811 -458
- package/eigen/Eigen/src/Core/functors/AssignmentFunctors.h +121 -124
- package/eigen/Eigen/src/Core/functors/BinaryFunctors.h +576 -370
- package/eigen/Eigen/src/Core/functors/NullaryFunctors.h +194 -109
- package/eigen/Eigen/src/Core/functors/StlFunctors.h +95 -112
- package/eigen/Eigen/src/Core/functors/TernaryFunctors.h +34 -7
- package/eigen/Eigen/src/Core/functors/UnaryFunctors.h +1038 -749
- package/eigen/Eigen/src/Core/products/GeneralBlockPanelKernel.h +1883 -1375
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix.h +312 -370
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular.h +189 -176
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular_BLAS.h +84 -81
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix_BLAS.h +154 -73
- package/eigen/Eigen/src/Core/products/GeneralMatrixVector.h +292 -337
- package/eigen/Eigen/src/Core/products/GeneralMatrixVector_BLAS.h +80 -77
- package/eigen/Eigen/src/Core/products/Parallelizer.h +207 -105
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix.h +327 -388
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix_BLAS.h +206 -224
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector.h +138 -147
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector_BLAS.h +58 -61
- package/eigen/Eigen/src/Core/products/SelfadjointProduct.h +71 -71
- package/eigen/Eigen/src/Core/products/SelfadjointRank2Update.h +48 -47
- package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix.h +294 -369
- package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix_BLAS.h +246 -238
- package/eigen/Eigen/src/Core/products/TriangularMatrixVector.h +244 -247
- package/eigen/Eigen/src/Core/products/TriangularMatrixVector_BLAS.h +212 -192
- package/eigen/Eigen/src/Core/products/TriangularSolverMatrix.h +328 -277
- package/eigen/Eigen/src/Core/products/TriangularSolverMatrix_BLAS.h +108 -109
- package/eigen/Eigen/src/Core/products/TriangularSolverVector.h +68 -94
- package/eigen/Eigen/src/Core/util/Assert.h +158 -0
- package/eigen/Eigen/src/Core/util/BlasUtil.h +342 -303
- package/eigen/Eigen/src/Core/util/ConfigureVectorization.h +348 -317
- package/eigen/Eigen/src/Core/util/Constants.h +297 -262
- package/eigen/Eigen/src/Core/util/DisableStupidWarnings.h +130 -90
- package/eigen/Eigen/src/Core/util/EmulateArray.h +270 -0
- package/eigen/Eigen/src/Core/util/ForwardDeclarations.h +449 -247
- package/eigen/Eigen/src/Core/util/GpuHipCudaDefines.inc +101 -0
- package/eigen/Eigen/src/Core/util/GpuHipCudaUndefines.inc +45 -0
- package/eigen/Eigen/src/Core/util/IndexedViewHelper.h +417 -116
- package/eigen/Eigen/src/Core/util/IntegralConstant.h +211 -204
- package/eigen/Eigen/src/Core/util/MKL_support.h +39 -37
- package/eigen/Eigen/src/Core/util/Macros.h +655 -773
- package/eigen/Eigen/src/Core/util/MaxSizeVector.h +139 -0
- package/eigen/Eigen/src/Core/util/Memory.h +970 -748
- package/eigen/Eigen/src/Core/util/Meta.h +581 -633
- package/eigen/Eigen/src/Core/util/MoreMeta.h +638 -0
- package/eigen/Eigen/src/Core/util/ReenableStupidWarnings.h +32 -19
- package/eigen/Eigen/src/Core/util/ReshapedHelper.h +17 -17
- package/eigen/Eigen/src/Core/util/Serializer.h +209 -0
- package/eigen/Eigen/src/Core/util/StaticAssert.h +50 -166
- package/eigen/Eigen/src/Core/util/SymbolicIndex.h +377 -225
- package/eigen/Eigen/src/Core/util/XprHelper.h +784 -547
- package/eigen/Eigen/src/Eigenvalues/ComplexEigenSolver.h +246 -277
- package/eigen/Eigen/src/Eigenvalues/ComplexSchur.h +299 -319
- package/eigen/Eigen/src/Eigenvalues/ComplexSchur_LAPACKE.h +52 -48
- package/eigen/Eigen/src/Eigenvalues/EigenSolver.h +413 -456
- package/eigen/Eigen/src/Eigenvalues/GeneralizedEigenSolver.h +309 -325
- package/eigen/Eigen/src/Eigenvalues/GeneralizedSelfAdjointEigenSolver.h +157 -171
- package/eigen/Eigen/src/Eigenvalues/HessenbergDecomposition.h +292 -310
- package/eigen/Eigen/src/Eigenvalues/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Eigenvalues/MatrixBaseEigenvalues.h +89 -105
- package/eigen/Eigen/src/Eigenvalues/RealQZ.h +537 -607
- package/eigen/Eigen/src/Eigenvalues/RealSchur.h +342 -381
- package/eigen/Eigen/src/Eigenvalues/RealSchur_LAPACKE.h +41 -35
- package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h +541 -595
- package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver_LAPACKE.h +47 -44
- package/eigen/Eigen/src/Eigenvalues/Tridiagonalization.h +430 -462
- package/eigen/Eigen/src/Geometry/AlignedBox.h +226 -227
- package/eigen/Eigen/src/Geometry/AngleAxis.h +131 -133
- package/eigen/Eigen/src/Geometry/EulerAngles.h +163 -74
- package/eigen/Eigen/src/Geometry/Homogeneous.h +285 -333
- package/eigen/Eigen/src/Geometry/Hyperplane.h +151 -160
- package/eigen/Eigen/src/Geometry/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Geometry/OrthoMethods.h +168 -146
- package/eigen/Eigen/src/Geometry/ParametrizedLine.h +127 -127
- package/eigen/Eigen/src/Geometry/Quaternion.h +566 -506
- package/eigen/Eigen/src/Geometry/Rotation2D.h +107 -105
- package/eigen/Eigen/src/Geometry/RotationBase.h +148 -145
- package/eigen/Eigen/src/Geometry/Scaling.h +113 -106
- package/eigen/Eigen/src/Geometry/Transform.h +858 -936
- package/eigen/Eigen/src/Geometry/Translation.h +94 -92
- package/eigen/Eigen/src/Geometry/Umeyama.h +79 -84
- package/eigen/Eigen/src/Geometry/arch/Geometry_SIMD.h +90 -104
- package/eigen/Eigen/src/Householder/BlockHouseholder.h +51 -46
- package/eigen/Eigen/src/Householder/Householder.h +102 -124
- package/eigen/Eigen/src/Householder/HouseholderSequence.h +412 -453
- package/eigen/Eigen/src/Householder/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/IterativeLinearSolvers/BasicPreconditioners.h +149 -162
- package/eigen/Eigen/src/IterativeLinearSolvers/BiCGSTAB.h +124 -119
- package/eigen/Eigen/src/IterativeLinearSolvers/ConjugateGradient.h +92 -104
- package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteCholesky.h +251 -243
- package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteLUT.h +224 -228
- package/eigen/Eigen/src/IterativeLinearSolvers/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/IterativeLinearSolvers/IterativeSolverBase.h +178 -227
- package/eigen/Eigen/src/IterativeLinearSolvers/LeastSquareConjugateGradient.h +79 -84
- package/eigen/Eigen/src/IterativeLinearSolvers/SolveWithGuess.h +54 -60
- package/eigen/Eigen/src/Jacobi/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Jacobi/Jacobi.h +252 -308
- package/eigen/Eigen/src/KLUSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/KLUSupport/KLUSupport.h +208 -227
- package/eigen/Eigen/src/LU/Determinant.h +50 -69
- package/eigen/Eigen/src/LU/FullPivLU.h +545 -596
- package/eigen/Eigen/src/LU/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/LU/InverseImpl.h +206 -285
- package/eigen/Eigen/src/LU/PartialPivLU.h +390 -428
- package/eigen/Eigen/src/LU/PartialPivLU_LAPACKE.h +54 -40
- package/eigen/Eigen/src/LU/arch/InverseSize4.h +72 -70
- package/eigen/Eigen/src/MetisSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/MetisSupport/MetisSupport.h +81 -93
- package/eigen/Eigen/src/OrderingMethods/Amd.h +243 -265
- package/eigen/Eigen/src/OrderingMethods/Eigen_Colamd.h +831 -1004
- package/eigen/Eigen/src/OrderingMethods/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/OrderingMethods/Ordering.h +112 -119
- package/eigen/Eigen/src/PaStiXSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/PaStiXSupport/PaStiXSupport.h +524 -570
- package/eigen/Eigen/src/PardisoSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/PardisoSupport/PardisoSupport.h +385 -430
- package/eigen/Eigen/src/QR/ColPivHouseholderQR.h +479 -479
- package/eigen/Eigen/src/QR/ColPivHouseholderQR_LAPACKE.h +120 -56
- package/eigen/Eigen/src/QR/CompleteOrthogonalDecomposition.h +166 -153
- package/eigen/Eigen/src/QR/FullPivHouseholderQR.h +495 -475
- package/eigen/Eigen/src/QR/HouseholderQR.h +394 -285
- package/eigen/Eigen/src/QR/HouseholderQR_LAPACKE.h +32 -23
- package/eigen/Eigen/src/QR/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SPQRSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SPQRSupport/SuiteSparseQRSupport.h +244 -264
- package/eigen/Eigen/src/SVD/BDCSVD.h +817 -713
- package/eigen/Eigen/src/SVD/BDCSVD_LAPACKE.h +174 -0
- package/eigen/Eigen/src/SVD/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SVD/JacobiSVD.h +577 -543
- package/eigen/Eigen/src/SVD/JacobiSVD_LAPACKE.h +85 -49
- package/eigen/Eigen/src/SVD/SVDBase.h +242 -182
- package/eigen/Eigen/src/SVD/UpperBidiagonalization.h +200 -235
- package/eigen/Eigen/src/SparseCholesky/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky.h +765 -594
- package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky_impl.h +308 -94
- package/eigen/Eigen/src/SparseCore/AmbiVector.h +202 -251
- package/eigen/Eigen/src/SparseCore/CompressedStorage.h +184 -252
- package/eigen/Eigen/src/SparseCore/ConservativeSparseSparseProduct.h +134 -178
- package/eigen/Eigen/src/SparseCore/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseCore/SparseAssign.h +149 -140
- package/eigen/Eigen/src/SparseCore/SparseBlock.h +403 -440
- package/eigen/Eigen/src/SparseCore/SparseColEtree.h +100 -112
- package/eigen/Eigen/src/SparseCore/SparseCompressedBase.h +525 -303
- package/eigen/Eigen/src/SparseCore/SparseCwiseBinaryOp.h +555 -339
- package/eigen/Eigen/src/SparseCore/SparseCwiseUnaryOp.h +100 -108
- package/eigen/Eigen/src/SparseCore/SparseDenseProduct.h +169 -197
- package/eigen/Eigen/src/SparseCore/SparseDiagonalProduct.h +71 -71
- package/eigen/Eigen/src/SparseCore/SparseDot.h +49 -47
- package/eigen/Eigen/src/SparseCore/SparseFuzzy.h +13 -11
- package/eigen/Eigen/src/SparseCore/SparseMap.h +243 -253
- package/eigen/Eigen/src/SparseCore/SparseMatrix.h +1603 -1245
- package/eigen/Eigen/src/SparseCore/SparseMatrixBase.h +403 -350
- package/eigen/Eigen/src/SparseCore/SparsePermutation.h +186 -115
- package/eigen/Eigen/src/SparseCore/SparseProduct.h +94 -97
- package/eigen/Eigen/src/SparseCore/SparseRedux.h +22 -24
- package/eigen/Eigen/src/SparseCore/SparseRef.h +268 -295
- package/eigen/Eigen/src/SparseCore/SparseSelfAdjointView.h +370 -416
- package/eigen/Eigen/src/SparseCore/SparseSolverBase.h +78 -87
- package/eigen/Eigen/src/SparseCore/SparseSparseProductWithPruning.h +81 -95
- package/eigen/Eigen/src/SparseCore/SparseTranspose.h +62 -71
- package/eigen/Eigen/src/SparseCore/SparseTriangularView.h +132 -144
- package/eigen/Eigen/src/SparseCore/SparseUtil.h +138 -115
- package/eigen/Eigen/src/SparseCore/SparseVector.h +426 -372
- package/eigen/Eigen/src/SparseCore/SparseView.h +164 -193
- package/eigen/Eigen/src/SparseCore/TriangularSolver.h +129 -170
- package/eigen/Eigen/src/SparseLU/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseLU/SparseLU.h +756 -710
- package/eigen/Eigen/src/SparseLU/SparseLUImpl.h +61 -48
- package/eigen/Eigen/src/SparseLU/SparseLU_Memory.h +102 -118
- package/eigen/Eigen/src/SparseLU/SparseLU_Structs.h +38 -35
- package/eigen/Eigen/src/SparseLU/SparseLU_SupernodalMatrix.h +245 -301
- package/eigen/Eigen/src/SparseLU/SparseLU_Utils.h +44 -49
- package/eigen/Eigen/src/SparseLU/SparseLU_column_bmod.h +104 -108
- package/eigen/Eigen/src/SparseLU/SparseLU_column_dfs.h +89 -100
- package/eigen/Eigen/src/SparseLU/SparseLU_copy_to_ucol.h +57 -58
- package/eigen/Eigen/src/SparseLU/SparseLU_heap_relax_snode.h +43 -55
- package/eigen/Eigen/src/SparseLU/SparseLU_kernel_bmod.h +74 -71
- package/eigen/Eigen/src/SparseLU/SparseLU_panel_bmod.h +124 -132
- package/eigen/Eigen/src/SparseLU/SparseLU_panel_dfs.h +136 -159
- package/eigen/Eigen/src/SparseLU/SparseLU_pivotL.h +51 -52
- package/eigen/Eigen/src/SparseLU/SparseLU_pruneL.h +67 -73
- package/eigen/Eigen/src/SparseLU/SparseLU_relax_snode.h +24 -26
- package/eigen/Eigen/src/SparseQR/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseQR/SparseQR.h +450 -502
- package/eigen/Eigen/src/StlSupport/StdDeque.h +28 -93
- package/eigen/Eigen/src/StlSupport/StdList.h +28 -84
- package/eigen/Eigen/src/StlSupport/StdVector.h +28 -108
- package/eigen/Eigen/src/StlSupport/details.h +48 -50
- package/eigen/Eigen/src/SuperLUSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SuperLUSupport/SuperLUSupport.h +634 -730
- package/eigen/Eigen/src/ThreadPool/Barrier.h +70 -0
- package/eigen/Eigen/src/ThreadPool/CoreThreadPoolDevice.h +336 -0
- package/eigen/Eigen/src/ThreadPool/EventCount.h +241 -0
- package/eigen/Eigen/src/ThreadPool/ForkJoin.h +140 -0
- package/eigen/Eigen/src/ThreadPool/InternalHeaderCheck.h +4 -0
- package/eigen/Eigen/src/ThreadPool/NonBlockingThreadPool.h +587 -0
- package/eigen/Eigen/src/ThreadPool/RunQueue.h +230 -0
- package/eigen/Eigen/src/ThreadPool/ThreadCancel.h +21 -0
- package/eigen/Eigen/src/ThreadPool/ThreadEnvironment.h +43 -0
- package/eigen/Eigen/src/ThreadPool/ThreadLocal.h +289 -0
- package/eigen/Eigen/src/ThreadPool/ThreadPoolInterface.h +50 -0
- package/eigen/Eigen/src/ThreadPool/ThreadYield.h +16 -0
- package/eigen/Eigen/src/UmfPackSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/UmfPackSupport/UmfPackSupport.h +428 -464
- package/eigen/Eigen/src/misc/Image.h +41 -43
- package/eigen/Eigen/src/misc/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/misc/Kernel.h +39 -41
- package/eigen/Eigen/src/misc/RealSvd2x2.h +19 -21
- package/eigen/Eigen/src/misc/blas.h +83 -426
- package/eigen/Eigen/src/misc/lapacke.h +9972 -16179
- package/eigen/Eigen/src/misc/lapacke_helpers.h +163 -0
- package/eigen/Eigen/src/misc/lapacke_mangling.h +4 -5
- package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.inc +344 -0
- package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.inc +544 -0
- package/eigen/Eigen/src/plugins/{BlockMethods.h → BlockMethods.inc} +434 -506
- package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.inc +116 -0
- package/eigen/Eigen/src/plugins/{CommonCwiseUnaryOps.h → CommonCwiseUnaryOps.inc} +58 -68
- package/eigen/Eigen/src/plugins/IndexedViewMethods.inc +192 -0
- package/eigen/Eigen/src/plugins/InternalHeaderCheck.inc +3 -0
- package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.inc +331 -0
- package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.inc +118 -0
- package/eigen/Eigen/src/plugins/ReshapedMethods.inc +133 -0
- package/package.json +1 -1
- package/eigen/COPYING.APACHE +0 -203
- package/eigen/COPYING.BSD +0 -26
- package/eigen/COPYING.GPL +0 -674
- package/eigen/COPYING.LGPL +0 -502
- package/eigen/COPYING.MINPACK +0 -51
- package/eigen/COPYING.MPL2 +0 -373
- package/eigen/COPYING.README +0 -18
- package/eigen/Eigen/src/Core/BooleanRedux.h +0 -162
- package/eigen/Eigen/src/Core/arch/CUDA/Complex.h +0 -258
- package/eigen/Eigen/src/Core/arch/Default/TypeCasting.h +0 -120
- package/eigen/Eigen/src/Core/arch/SYCL/SyclMemoryModel.h +0 -694
- package/eigen/Eigen/src/Core/util/NonMPL2.h +0 -3
- package/eigen/Eigen/src/SparseCore/MappedSparseMatrix.h +0 -67
- package/eigen/Eigen/src/SparseLU/SparseLU_gemm_kernel.h +0 -280
- package/eigen/Eigen/src/misc/lapack.h +0 -152
- package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.h +0 -358
- package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.h +0 -696
- package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.h +0 -115
- package/eigen/Eigen/src/plugins/IndexedViewMethods.h +0 -262
- package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.h +0 -152
- package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.h +0 -95
- package/eigen/Eigen/src/plugins/ReshapedMethods.h +0 -149
- package/eigen/README.md +0 -5
|
@@ -11,7 +11,10 @@
|
|
|
11
11
|
#ifndef EIGEN_REDUX_H
|
|
12
12
|
#define EIGEN_REDUX_H
|
|
13
13
|
|
|
14
|
-
|
|
14
|
+
// IWYU pragma: private
|
|
15
|
+
#include "./InternalHeaderCheck.h"
|
|
16
|
+
|
|
17
|
+
namespace Eigen {
|
|
15
18
|
|
|
16
19
|
namespace internal {
|
|
17
20
|
|
|
@@ -20,56 +23,51 @@ namespace internal {
|
|
|
20
23
|
// * factorize code
|
|
21
24
|
|
|
22
25
|
/***************************************************************************
|
|
23
|
-
* Part 1 : the logic deciding a strategy for vectorization and unrolling
|
|
24
|
-
***************************************************************************/
|
|
25
|
-
|
|
26
|
-
template<typename Func, typename Evaluator>
|
|
27
|
-
struct redux_traits
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
typedef typename find_best_packet<typename Evaluator::Scalar,Evaluator::SizeAtCompileTime>::type PacketType;
|
|
26
|
+
* Part 1 : the logic deciding a strategy for vectorization and unrolling
|
|
27
|
+
***************************************************************************/
|
|
28
|
+
|
|
29
|
+
template <typename Func, typename Evaluator>
|
|
30
|
+
struct redux_traits {
|
|
31
|
+
public:
|
|
32
|
+
typedef typename find_best_packet<typename Evaluator::Scalar, Evaluator::SizeAtCompileTime>::type PacketType;
|
|
31
33
|
enum {
|
|
32
34
|
PacketSize = unpacket_traits<PacketType>::size,
|
|
33
|
-
InnerMaxSize = int(Evaluator::IsRowMajor)
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
: Evaluator::MaxColsAtCompileTime,
|
|
39
|
-
SliceVectorizedWork = int(InnerMaxSize)==Dynamic ? Dynamic
|
|
40
|
-
: int(OuterMaxSize)==Dynamic ? (int(InnerMaxSize)>=int(PacketSize) ? Dynamic : 0)
|
|
41
|
-
: (int(InnerMaxSize)/int(PacketSize)) * int(OuterMaxSize)
|
|
35
|
+
InnerMaxSize = int(Evaluator::IsRowMajor) ? Evaluator::MaxColsAtCompileTime : Evaluator::MaxRowsAtCompileTime,
|
|
36
|
+
OuterMaxSize = int(Evaluator::IsRowMajor) ? Evaluator::MaxRowsAtCompileTime : Evaluator::MaxColsAtCompileTime,
|
|
37
|
+
SliceVectorizedWork = int(InnerMaxSize) == Dynamic ? Dynamic
|
|
38
|
+
: int(OuterMaxSize) == Dynamic ? (int(InnerMaxSize) >= int(PacketSize) ? Dynamic : 0)
|
|
39
|
+
: (int(InnerMaxSize) / int(PacketSize)) * int(OuterMaxSize)
|
|
42
40
|
};
|
|
43
41
|
|
|
44
42
|
enum {
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
MayLinearVectorize = bool(MightVectorize) && (
|
|
48
|
-
MaySliceVectorize
|
|
43
|
+
MayLinearize = (int(Evaluator::Flags) & LinearAccessBit),
|
|
44
|
+
MightVectorize = (int(Evaluator::Flags) & ActualPacketAccessBit) && (functor_traits<Func>::PacketAccess),
|
|
45
|
+
MayLinearVectorize = bool(MightVectorize) && bool(MayLinearize),
|
|
46
|
+
MaySliceVectorize = bool(MightVectorize) && (int(SliceVectorizedWork) == Dynamic || int(SliceVectorizedWork) >= 3)
|
|
49
47
|
};
|
|
50
48
|
|
|
51
|
-
public:
|
|
49
|
+
public:
|
|
52
50
|
enum {
|
|
53
|
-
Traversal = int(MayLinearVectorize)
|
|
54
|
-
|
|
55
|
-
|
|
51
|
+
Traversal = int(MayLinearVectorize) ? int(LinearVectorizedTraversal)
|
|
52
|
+
: int(MaySliceVectorize) ? int(SliceVectorizedTraversal)
|
|
53
|
+
: int(MayLinearize) ? int(LinearTraversal)
|
|
54
|
+
: int(DefaultTraversal)
|
|
56
55
|
};
|
|
57
56
|
|
|
58
|
-
public:
|
|
57
|
+
public:
|
|
59
58
|
enum {
|
|
60
|
-
Cost = Evaluator::SizeAtCompileTime == Dynamic
|
|
61
|
-
|
|
59
|
+
Cost = Evaluator::SizeAtCompileTime == Dynamic
|
|
60
|
+
? HugeCost
|
|
61
|
+
: int(Evaluator::SizeAtCompileTime) * int(Evaluator::CoeffReadCost) +
|
|
62
|
+
(Evaluator::SizeAtCompileTime - 1) * functor_traits<Func>::Cost,
|
|
62
63
|
UnrollingLimit = EIGEN_UNROLLING_LIMIT * (int(Traversal) == int(DefaultTraversal) ? 1 : int(PacketSize))
|
|
63
64
|
};
|
|
64
65
|
|
|
65
|
-
public:
|
|
66
|
-
enum {
|
|
67
|
-
|
|
68
|
-
};
|
|
69
|
-
|
|
66
|
+
public:
|
|
67
|
+
enum { Unrolling = Cost <= UnrollingLimit ? CompleteUnrolling : NoUnrolling };
|
|
68
|
+
|
|
70
69
|
#ifdef EIGEN_DEBUG_ASSIGN
|
|
71
|
-
static void debug()
|
|
72
|
-
{
|
|
70
|
+
static void debug() {
|
|
73
71
|
std::cerr << "Xpr: " << typeid(typename Evaluator::XprType).name() << std::endl;
|
|
74
72
|
std::cerr.setf(std::ios::hex, std::ios::basefield);
|
|
75
73
|
EIGEN_DEBUG_VAR(Evaluator::Flags)
|
|
@@ -81,50 +79,42 @@ public:
|
|
|
81
79
|
EIGEN_DEBUG_VAR(MightVectorize)
|
|
82
80
|
EIGEN_DEBUG_VAR(MayLinearVectorize)
|
|
83
81
|
EIGEN_DEBUG_VAR(MaySliceVectorize)
|
|
84
|
-
std::cerr << "Traversal"
|
|
82
|
+
std::cerr << "Traversal"
|
|
83
|
+
<< " = " << Traversal << " (" << demangle_traversal(Traversal) << ")" << std::endl;
|
|
85
84
|
EIGEN_DEBUG_VAR(UnrollingLimit)
|
|
86
|
-
std::cerr << "Unrolling"
|
|
85
|
+
std::cerr << "Unrolling"
|
|
86
|
+
<< " = " << Unrolling << " (" << demangle_unrolling(Unrolling) << ")" << std::endl;
|
|
87
87
|
std::cerr << std::endl;
|
|
88
88
|
}
|
|
89
89
|
#endif
|
|
90
90
|
};
|
|
91
91
|
|
|
92
92
|
/***************************************************************************
|
|
93
|
-
* Part 2 : unrollers
|
|
94
|
-
***************************************************************************/
|
|
93
|
+
* Part 2 : unrollers
|
|
94
|
+
***************************************************************************/
|
|
95
95
|
|
|
96
96
|
/*** no vectorization ***/
|
|
97
97
|
|
|
98
|
-
template<typename Func, typename Evaluator,
|
|
99
|
-
struct redux_novec_unroller
|
|
100
|
-
|
|
101
|
-
enum {
|
|
102
|
-
HalfLength = Length/2
|
|
103
|
-
};
|
|
98
|
+
template <typename Func, typename Evaluator, Index Start, Index Length>
|
|
99
|
+
struct redux_novec_unroller {
|
|
100
|
+
static constexpr Index HalfLength = Length / 2;
|
|
104
101
|
|
|
105
102
|
typedef typename Evaluator::Scalar Scalar;
|
|
106
103
|
|
|
107
|
-
EIGEN_DEVICE_FUNC
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
return func(redux_novec_unroller<Func, Evaluator, Start, HalfLength>::run(eval,func),
|
|
111
|
-
redux_novec_unroller<Func, Evaluator, Start+HalfLength, Length-HalfLength>::run(eval,func));
|
|
104
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func& func) {
|
|
105
|
+
return func(redux_novec_unroller<Func, Evaluator, Start, HalfLength>::run(eval, func),
|
|
106
|
+
redux_novec_unroller<Func, Evaluator, Start + HalfLength, Length - HalfLength>::run(eval, func));
|
|
112
107
|
}
|
|
113
108
|
};
|
|
114
109
|
|
|
115
|
-
template<typename Func, typename Evaluator,
|
|
116
|
-
struct redux_novec_unroller<Func, Evaluator, Start, 1>
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
outer = Start / Evaluator::InnerSizeAtCompileTime,
|
|
120
|
-
inner = Start % Evaluator::InnerSizeAtCompileTime
|
|
121
|
-
};
|
|
110
|
+
template <typename Func, typename Evaluator, Index Start>
|
|
111
|
+
struct redux_novec_unroller<Func, Evaluator, Start, 1> {
|
|
112
|
+
static constexpr Index outer = Start / Evaluator::InnerSizeAtCompileTime;
|
|
113
|
+
static constexpr Index inner = Start % Evaluator::InnerSizeAtCompileTime;
|
|
122
114
|
|
|
123
115
|
typedef typename Evaluator::Scalar Scalar;
|
|
124
116
|
|
|
125
|
-
EIGEN_DEVICE_FUNC
|
|
126
|
-
static EIGEN_STRONG_INLINE Scalar run(const Evaluator &eval, const Func&)
|
|
127
|
-
{
|
|
117
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func&) {
|
|
128
118
|
return eval.coeffByOuterInner(outer, inner);
|
|
129
119
|
}
|
|
130
120
|
};
|
|
@@ -132,150 +122,201 @@ struct redux_novec_unroller<Func, Evaluator, Start, 1>
|
|
|
132
122
|
// This is actually dead code and will never be called. It is required
|
|
133
123
|
// to prevent false warnings regarding failed inlining though
|
|
134
124
|
// for 0 length run() will never be called at all.
|
|
135
|
-
template<typename Func, typename Evaluator,
|
|
136
|
-
struct redux_novec_unroller<Func, Evaluator, Start, 0>
|
|
137
|
-
|
|
125
|
+
template <typename Func, typename Evaluator, Index Start>
|
|
126
|
+
struct redux_novec_unroller<Func, Evaluator, Start, 0> {
|
|
127
|
+
typedef typename Evaluator::Scalar Scalar;
|
|
128
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator&, const Func&) { return Scalar(); }
|
|
129
|
+
};
|
|
130
|
+
|
|
131
|
+
template <typename Func, typename Evaluator, Index Start, Index Length>
|
|
132
|
+
struct redux_novec_linear_unroller {
|
|
133
|
+
static constexpr Index HalfLength = Length / 2;
|
|
134
|
+
|
|
135
|
+
typedef typename Evaluator::Scalar Scalar;
|
|
136
|
+
|
|
137
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func& func) {
|
|
138
|
+
return func(redux_novec_linear_unroller<Func, Evaluator, Start, HalfLength>::run(eval, func),
|
|
139
|
+
redux_novec_linear_unroller<Func, Evaluator, Start + HalfLength, Length - HalfLength>::run(eval, func));
|
|
140
|
+
}
|
|
141
|
+
};
|
|
142
|
+
|
|
143
|
+
template <typename Func, typename Evaluator, Index Start>
|
|
144
|
+
struct redux_novec_linear_unroller<Func, Evaluator, Start, 1> {
|
|
145
|
+
typedef typename Evaluator::Scalar Scalar;
|
|
146
|
+
|
|
147
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func&) {
|
|
148
|
+
return eval.coeff(Start);
|
|
149
|
+
}
|
|
150
|
+
};
|
|
151
|
+
|
|
152
|
+
// This is actually dead code and will never be called. It is required
|
|
153
|
+
// to prevent false warnings regarding failed inlining though
|
|
154
|
+
// for 0 length run() will never be called at all.
|
|
155
|
+
template <typename Func, typename Evaluator, Index Start>
|
|
156
|
+
struct redux_novec_linear_unroller<Func, Evaluator, Start, 0> {
|
|
138
157
|
typedef typename Evaluator::Scalar Scalar;
|
|
139
|
-
EIGEN_DEVICE_FUNC
|
|
140
|
-
static EIGEN_STRONG_INLINE Scalar run(const Evaluator&, const Func&) { return Scalar(); }
|
|
158
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator&, const Func&) { return Scalar(); }
|
|
141
159
|
};
|
|
142
160
|
|
|
143
161
|
/*** vectorization ***/
|
|
144
162
|
|
|
145
|
-
template<typename Func, typename Evaluator,
|
|
146
|
-
struct redux_vec_unroller
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
static EIGEN_STRONG_INLINE PacketType run(const Evaluator &eval, const Func& func)
|
|
151
|
-
{
|
|
152
|
-
enum {
|
|
153
|
-
PacketSize = unpacket_traits<PacketType>::size,
|
|
154
|
-
HalfLength = Length/2
|
|
155
|
-
};
|
|
163
|
+
template <typename Func, typename Evaluator, Index Start, Index Length>
|
|
164
|
+
struct redux_vec_unroller {
|
|
165
|
+
template <typename PacketType>
|
|
166
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE PacketType run(const Evaluator& eval, const Func& func) {
|
|
167
|
+
constexpr Index HalfLength = Length / 2;
|
|
156
168
|
|
|
157
169
|
return func.packetOp(
|
|
158
|
-
|
|
159
|
-
|
|
170
|
+
redux_vec_unroller<Func, Evaluator, Start, HalfLength>::template run<PacketType>(eval, func),
|
|
171
|
+
redux_vec_unroller<Func, Evaluator, Start + HalfLength, Length - HalfLength>::template run<PacketType>(eval,
|
|
172
|
+
func));
|
|
173
|
+
}
|
|
174
|
+
};
|
|
175
|
+
|
|
176
|
+
template <typename Func, typename Evaluator, Index Start>
|
|
177
|
+
struct redux_vec_unroller<Func, Evaluator, Start, 1> {
|
|
178
|
+
template <typename PacketType>
|
|
179
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE PacketType run(const Evaluator& eval, const Func&) {
|
|
180
|
+
constexpr Index PacketSize = unpacket_traits<PacketType>::size;
|
|
181
|
+
constexpr Index index = Start * PacketSize;
|
|
182
|
+
constexpr Index outer = index / int(Evaluator::InnerSizeAtCompileTime);
|
|
183
|
+
constexpr Index inner = index % int(Evaluator::InnerSizeAtCompileTime);
|
|
184
|
+
constexpr int alignment = Evaluator::Alignment;
|
|
185
|
+
|
|
186
|
+
return eval.template packetByOuterInner<alignment, PacketType>(outer, inner);
|
|
160
187
|
}
|
|
161
188
|
};
|
|
162
189
|
|
|
163
|
-
template<typename Func, typename Evaluator,
|
|
164
|
-
struct
|
|
165
|
-
|
|
166
|
-
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
|
|
173
|
-
|
|
174
|
-
|
|
175
|
-
|
|
176
|
-
|
|
177
|
-
|
|
190
|
+
template <typename Func, typename Evaluator, Index Start, Index Length>
|
|
191
|
+
struct redux_vec_linear_unroller {
|
|
192
|
+
template <typename PacketType>
|
|
193
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE PacketType run(const Evaluator& eval, const Func& func) {
|
|
194
|
+
constexpr Index HalfLength = Length / 2;
|
|
195
|
+
|
|
196
|
+
return func.packetOp(
|
|
197
|
+
redux_vec_linear_unroller<Func, Evaluator, Start, HalfLength>::template run<PacketType>(eval, func),
|
|
198
|
+
redux_vec_linear_unroller<Func, Evaluator, Start + HalfLength, Length - HalfLength>::template run<PacketType>(
|
|
199
|
+
eval, func));
|
|
200
|
+
}
|
|
201
|
+
};
|
|
202
|
+
|
|
203
|
+
template <typename Func, typename Evaluator, Index Start>
|
|
204
|
+
struct redux_vec_linear_unroller<Func, Evaluator, Start, 1> {
|
|
205
|
+
template <typename PacketType>
|
|
206
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE PacketType run(const Evaluator& eval, const Func&) {
|
|
207
|
+
constexpr Index PacketSize = unpacket_traits<PacketType>::size;
|
|
208
|
+
constexpr Index index = (Start * PacketSize);
|
|
209
|
+
constexpr int alignment = Evaluator::Alignment;
|
|
210
|
+
return eval.template packet<alignment, PacketType>(index);
|
|
178
211
|
}
|
|
179
212
|
};
|
|
180
213
|
|
|
181
214
|
/***************************************************************************
|
|
182
|
-
* Part 3 : implementation of all cases
|
|
183
|
-
***************************************************************************/
|
|
215
|
+
* Part 3 : implementation of all cases
|
|
216
|
+
***************************************************************************/
|
|
184
217
|
|
|
185
|
-
template<typename Func, typename Evaluator,
|
|
186
|
-
|
|
187
|
-
int Unrolling = redux_traits<Func, Evaluator>::Unrolling
|
|
188
|
-
>
|
|
218
|
+
template <typename Func, typename Evaluator, int Traversal = redux_traits<Func, Evaluator>::Traversal,
|
|
219
|
+
int Unrolling = redux_traits<Func, Evaluator>::Unrolling>
|
|
189
220
|
struct redux_impl;
|
|
190
221
|
|
|
191
|
-
template<typename Func, typename Evaluator>
|
|
192
|
-
struct redux_impl<Func, Evaluator, DefaultTraversal, NoUnrolling>
|
|
193
|
-
{
|
|
222
|
+
template <typename Func, typename Evaluator>
|
|
223
|
+
struct redux_impl<Func, Evaluator, DefaultTraversal, NoUnrolling> {
|
|
194
224
|
typedef typename Evaluator::Scalar Scalar;
|
|
195
225
|
|
|
196
|
-
template<typename XprType>
|
|
197
|
-
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE
|
|
198
|
-
|
|
199
|
-
|
|
200
|
-
|
|
201
|
-
|
|
202
|
-
|
|
203
|
-
|
|
204
|
-
|
|
205
|
-
|
|
206
|
-
|
|
207
|
-
|
|
226
|
+
template <typename XprType>
|
|
227
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func& func, const XprType& xpr) {
|
|
228
|
+
eigen_assert(xpr.rows() > 0 && xpr.cols() > 0 && "you are using an empty matrix");
|
|
229
|
+
Scalar res = eval.coeffByOuterInner(0, 0);
|
|
230
|
+
for (Index i = 1; i < xpr.innerSize(); ++i) res = func(res, eval.coeffByOuterInner(0, i));
|
|
231
|
+
for (Index i = 1; i < xpr.outerSize(); ++i)
|
|
232
|
+
for (Index j = 0; j < xpr.innerSize(); ++j) res = func(res, eval.coeffByOuterInner(i, j));
|
|
233
|
+
return res;
|
|
234
|
+
}
|
|
235
|
+
};
|
|
236
|
+
|
|
237
|
+
template <typename Func, typename Evaluator>
|
|
238
|
+
struct redux_impl<Func, Evaluator, LinearTraversal, NoUnrolling> {
|
|
239
|
+
typedef typename Evaluator::Scalar Scalar;
|
|
240
|
+
|
|
241
|
+
template <typename XprType>
|
|
242
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func& func, const XprType& xpr) {
|
|
243
|
+
eigen_assert(xpr.size() > 0 && "you are using an empty matrix");
|
|
244
|
+
Scalar res = eval.coeff(0);
|
|
245
|
+
for (Index k = 1; k < xpr.size(); ++k) res = func(res, eval.coeff(k));
|
|
208
246
|
return res;
|
|
209
247
|
}
|
|
210
248
|
};
|
|
211
249
|
|
|
212
|
-
template<typename Func, typename Evaluator>
|
|
213
|
-
struct redux_impl<Func,Evaluator, DefaultTraversal, CompleteUnrolling>
|
|
214
|
-
|
|
215
|
-
|
|
216
|
-
typedef
|
|
250
|
+
template <typename Func, typename Evaluator>
|
|
251
|
+
struct redux_impl<Func, Evaluator, DefaultTraversal, CompleteUnrolling>
|
|
252
|
+
: redux_novec_unroller<Func, Evaluator, 0, Evaluator::SizeAtCompileTime> {
|
|
253
|
+
typedef redux_novec_unroller<Func, Evaluator, 0, Evaluator::SizeAtCompileTime> Base;
|
|
254
|
+
typedef typename Evaluator::Scalar Scalar;
|
|
255
|
+
template <typename XprType>
|
|
256
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func& func,
|
|
257
|
+
const XprType& /*xpr*/) {
|
|
258
|
+
return Base::run(eval, func);
|
|
259
|
+
}
|
|
260
|
+
};
|
|
261
|
+
|
|
262
|
+
template <typename Func, typename Evaluator>
|
|
263
|
+
struct redux_impl<Func, Evaluator, LinearTraversal, CompleteUnrolling>
|
|
264
|
+
: redux_novec_linear_unroller<Func, Evaluator, 0, Evaluator::SizeAtCompileTime> {
|
|
265
|
+
typedef redux_novec_linear_unroller<Func, Evaluator, 0, Evaluator::SizeAtCompileTime> Base;
|
|
217
266
|
typedef typename Evaluator::Scalar Scalar;
|
|
218
|
-
template<typename XprType>
|
|
219
|
-
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE
|
|
220
|
-
|
|
221
|
-
|
|
222
|
-
return Base::run(eval,func);
|
|
267
|
+
template <typename XprType>
|
|
268
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func& func,
|
|
269
|
+
const XprType& /*xpr*/) {
|
|
270
|
+
return Base::run(eval, func);
|
|
223
271
|
}
|
|
224
272
|
};
|
|
225
273
|
|
|
226
|
-
template<typename Func, typename Evaluator>
|
|
227
|
-
struct redux_impl<Func, Evaluator, LinearVectorizedTraversal, NoUnrolling>
|
|
228
|
-
{
|
|
274
|
+
template <typename Func, typename Evaluator>
|
|
275
|
+
struct redux_impl<Func, Evaluator, LinearVectorizedTraversal, NoUnrolling> {
|
|
229
276
|
typedef typename Evaluator::Scalar Scalar;
|
|
230
277
|
typedef typename redux_traits<Func, Evaluator>::PacketType PacketScalar;
|
|
231
278
|
|
|
232
|
-
template<typename XprType>
|
|
233
|
-
static Scalar run(const Evaluator
|
|
234
|
-
{
|
|
279
|
+
template <typename XprType>
|
|
280
|
+
static Scalar run(const Evaluator& eval, const Func& func, const XprType& xpr) {
|
|
235
281
|
const Index size = xpr.size();
|
|
236
|
-
|
|
237
|
-
|
|
238
|
-
|
|
239
|
-
|
|
240
|
-
|
|
241
|
-
|
|
242
|
-
|
|
282
|
+
|
|
283
|
+
constexpr Index packetSize = redux_traits<Func, Evaluator>::PacketSize;
|
|
284
|
+
constexpr int packetAlignment = unpacket_traits<PacketScalar>::alignment;
|
|
285
|
+
constexpr int alignment0 =
|
|
286
|
+
(bool(Evaluator::Flags & DirectAccessBit) && bool(packet_traits<Scalar>::AlignedOnScalar))
|
|
287
|
+
? int(packetAlignment)
|
|
288
|
+
: int(Unaligned);
|
|
289
|
+
constexpr int alignment = plain_enum_max(alignment0, Evaluator::Alignment);
|
|
243
290
|
const Index alignedStart = internal::first_default_aligned(xpr);
|
|
244
|
-
const Index alignedSize2 = ((size-alignedStart)/(2*packetSize))*(2*packetSize);
|
|
245
|
-
const Index alignedSize = ((size-alignedStart)/(packetSize))*(packetSize);
|
|
291
|
+
const Index alignedSize2 = ((size - alignedStart) / (2 * packetSize)) * (2 * packetSize);
|
|
292
|
+
const Index alignedSize = ((size - alignedStart) / (packetSize)) * (packetSize);
|
|
246
293
|
const Index alignedEnd2 = alignedStart + alignedSize2;
|
|
247
|
-
const Index alignedEnd
|
|
294
|
+
const Index alignedEnd = alignedStart + alignedSize;
|
|
248
295
|
Scalar res;
|
|
249
|
-
if(alignedSize)
|
|
250
|
-
|
|
251
|
-
|
|
252
|
-
if(alignedSize>packetSize) // we have at least two packets to partly unroll the loop
|
|
296
|
+
if (alignedSize) {
|
|
297
|
+
PacketScalar packet_res0 = eval.template packet<alignment, PacketScalar>(alignedStart);
|
|
298
|
+
if (alignedSize > packetSize) // we have at least two packets to partly unroll the loop
|
|
253
299
|
{
|
|
254
|
-
PacketScalar packet_res1 = eval.template packet<alignment,PacketScalar>(alignedStart+packetSize);
|
|
255
|
-
for(Index index = alignedStart + 2*packetSize; index < alignedEnd2; index += 2*packetSize)
|
|
256
|
-
|
|
257
|
-
|
|
258
|
-
packet_res1 = func.packetOp(packet_res1, eval.template packet<alignment,PacketScalar>(index+packetSize));
|
|
300
|
+
PacketScalar packet_res1 = eval.template packet<alignment, PacketScalar>(alignedStart + packetSize);
|
|
301
|
+
for (Index index = alignedStart + 2 * packetSize; index < alignedEnd2; index += 2 * packetSize) {
|
|
302
|
+
packet_res0 = func.packetOp(packet_res0, eval.template packet<alignment, PacketScalar>(index));
|
|
303
|
+
packet_res1 = func.packetOp(packet_res1, eval.template packet<alignment, PacketScalar>(index + packetSize));
|
|
259
304
|
}
|
|
260
305
|
|
|
261
|
-
packet_res0 = func.packetOp(packet_res0,packet_res1);
|
|
262
|
-
if(alignedEnd>alignedEnd2)
|
|
263
|
-
packet_res0 = func.packetOp(packet_res0, eval.template packet<alignment,PacketScalar>(alignedEnd2));
|
|
306
|
+
packet_res0 = func.packetOp(packet_res0, packet_res1);
|
|
307
|
+
if (alignedEnd > alignedEnd2)
|
|
308
|
+
packet_res0 = func.packetOp(packet_res0, eval.template packet<alignment, PacketScalar>(alignedEnd2));
|
|
264
309
|
}
|
|
265
310
|
res = func.predux(packet_res0);
|
|
266
311
|
|
|
267
|
-
for(Index index = 0; index < alignedStart; ++index)
|
|
268
|
-
res = func(res,eval.coeff(index));
|
|
312
|
+
for (Index index = 0; index < alignedStart; ++index) res = func(res, eval.coeff(index));
|
|
269
313
|
|
|
270
|
-
for(Index index = alignedEnd; index < size; ++index)
|
|
271
|
-
|
|
272
|
-
|
|
273
|
-
else // too small to vectorize anything.
|
|
274
|
-
// since this is dynamic-size hence inefficient anyway for such small sizes, don't try to optimize.
|
|
314
|
+
for (Index index = alignedEnd; index < size; ++index) res = func(res, eval.coeff(index));
|
|
315
|
+
} else // too small to vectorize anything.
|
|
316
|
+
// since this is dynamic-size hence inefficient anyway for such small sizes, don't try to optimize.
|
|
275
317
|
{
|
|
276
318
|
res = eval.coeff(0);
|
|
277
|
-
for(Index index = 1; index < size; ++index)
|
|
278
|
-
res = func(res,eval.coeff(index));
|
|
319
|
+
for (Index index = 1; index < size; ++index) res = func(res, eval.coeff(index));
|
|
279
320
|
}
|
|
280
321
|
|
|
281
322
|
return res;
|
|
@@ -283,37 +324,30 @@ struct redux_impl<Func, Evaluator, LinearVectorizedTraversal, NoUnrolling>
|
|
|
283
324
|
};
|
|
284
325
|
|
|
285
326
|
// NOTE: for SliceVectorizedTraversal we simply bypass unrolling
|
|
286
|
-
template<typename Func, typename Evaluator, int Unrolling>
|
|
287
|
-
struct redux_impl<Func, Evaluator, SliceVectorizedTraversal, Unrolling>
|
|
288
|
-
{
|
|
327
|
+
template <typename Func, typename Evaluator, int Unrolling>
|
|
328
|
+
struct redux_impl<Func, Evaluator, SliceVectorizedTraversal, Unrolling> {
|
|
289
329
|
typedef typename Evaluator::Scalar Scalar;
|
|
290
330
|
typedef typename redux_traits<Func, Evaluator>::PacketType PacketType;
|
|
291
331
|
|
|
292
|
-
template<typename XprType>
|
|
293
|
-
EIGEN_DEVICE_FUNC static Scalar run(const Evaluator
|
|
294
|
-
|
|
295
|
-
|
|
332
|
+
template <typename XprType>
|
|
333
|
+
EIGEN_DEVICE_FUNC static Scalar run(const Evaluator& eval, const Func& func, const XprType& xpr) {
|
|
334
|
+
eigen_assert(xpr.rows() > 0 && xpr.cols() > 0 && "you are using an empty matrix");
|
|
335
|
+
constexpr Index packetSize = redux_traits<Func, Evaluator>::PacketSize;
|
|
296
336
|
const Index innerSize = xpr.innerSize();
|
|
297
337
|
const Index outerSize = xpr.outerSize();
|
|
298
|
-
|
|
299
|
-
packetSize = redux_traits<Func, Evaluator>::PacketSize
|
|
300
|
-
};
|
|
301
|
-
const Index packetedInnerSize = ((innerSize)/packetSize)*packetSize;
|
|
338
|
+
const Index packetedInnerSize = ((innerSize) / packetSize) * packetSize;
|
|
302
339
|
Scalar res;
|
|
303
|
-
if(packetedInnerSize)
|
|
304
|
-
|
|
305
|
-
|
|
306
|
-
|
|
307
|
-
|
|
308
|
-
packet_res = func.packetOp(packet_res, eval.template packetByOuterInner<Unaligned,PacketType>(j,i));
|
|
340
|
+
if (packetedInnerSize) {
|
|
341
|
+
PacketType packet_res = eval.template packet<Unaligned, PacketType>(0, 0);
|
|
342
|
+
for (Index j = 0; j < outerSize; ++j)
|
|
343
|
+
for (Index i = (j == 0 ? packetSize : 0); i < packetedInnerSize; i += Index(packetSize))
|
|
344
|
+
packet_res = func.packetOp(packet_res, eval.template packetByOuterInner<Unaligned, PacketType>(j, i));
|
|
309
345
|
|
|
310
346
|
res = func.predux(packet_res);
|
|
311
|
-
for(Index j=0; j<outerSize; ++j)
|
|
312
|
-
for(Index i=packetedInnerSize; i<innerSize; ++i)
|
|
313
|
-
|
|
314
|
-
|
|
315
|
-
else // too small to vectorize anything.
|
|
316
|
-
// since this is dynamic-size hence inefficient anyway for such small sizes, don't try to optimize.
|
|
347
|
+
for (Index j = 0; j < outerSize; ++j)
|
|
348
|
+
for (Index i = packetedInnerSize; i < innerSize; ++i) res = func(res, eval.coeffByOuterInner(j, i));
|
|
349
|
+
} else // too small to vectorize anything.
|
|
350
|
+
// since this is dynamic-size hence inefficient anyway for such small sizes, don't try to optimize.
|
|
317
351
|
{
|
|
318
352
|
res = redux_impl<Func, Evaluator, DefaultTraversal, NoUnrolling>::run(eval, func, xpr);
|
|
319
353
|
}
|
|
@@ -322,194 +356,180 @@ struct redux_impl<Func, Evaluator, SliceVectorizedTraversal, Unrolling>
|
|
|
322
356
|
}
|
|
323
357
|
};
|
|
324
358
|
|
|
325
|
-
template<typename Func, typename Evaluator>
|
|
326
|
-
struct redux_impl<Func, Evaluator, LinearVectorizedTraversal, CompleteUnrolling>
|
|
327
|
-
{
|
|
359
|
+
template <typename Func, typename Evaluator>
|
|
360
|
+
struct redux_impl<Func, Evaluator, LinearVectorizedTraversal, CompleteUnrolling> {
|
|
328
361
|
typedef typename Evaluator::Scalar Scalar;
|
|
329
362
|
|
|
330
363
|
typedef typename redux_traits<Func, Evaluator>::PacketType PacketType;
|
|
331
|
-
|
|
332
|
-
|
|
333
|
-
|
|
334
|
-
VectorizedSize = (int(Size) / int(PacketSize)) * int(PacketSize)
|
|
335
|
-
};
|
|
364
|
+
static constexpr Index PacketSize = redux_traits<Func, Evaluator>::PacketSize;
|
|
365
|
+
static constexpr Index Size = Evaluator::SizeAtCompileTime;
|
|
366
|
+
static constexpr Index VectorizedSize = (int(Size) / int(PacketSize)) * int(PacketSize);
|
|
336
367
|
|
|
337
|
-
template<typename XprType>
|
|
338
|
-
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE
|
|
339
|
-
Scalar run(const Evaluator &eval, const Func& func, const XprType &xpr)
|
|
340
|
-
{
|
|
368
|
+
template <typename XprType>
|
|
369
|
+
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Scalar run(const Evaluator& eval, const Func& func, const XprType& xpr) {
|
|
341
370
|
EIGEN_ONLY_USED_FOR_DEBUG(xpr)
|
|
342
|
-
eigen_assert(xpr.rows()>0 && xpr.cols()>0 && "you are using an empty matrix");
|
|
371
|
+
eigen_assert(xpr.rows() > 0 && xpr.cols() > 0 && "you are using an empty matrix");
|
|
343
372
|
if (VectorizedSize > 0) {
|
|
344
|
-
Scalar res = func.predux(
|
|
373
|
+
Scalar res = func.predux(
|
|
374
|
+
redux_vec_linear_unroller<Func, Evaluator, 0, Size / PacketSize>::template run<PacketType>(eval, func));
|
|
345
375
|
if (VectorizedSize != Size)
|
|
346
|
-
res = func(
|
|
376
|
+
res = func(
|
|
377
|
+
res, redux_novec_linear_unroller<Func, Evaluator, VectorizedSize, Size - VectorizedSize>::run(eval, func));
|
|
347
378
|
return res;
|
|
348
|
-
}
|
|
349
|
-
|
|
350
|
-
return redux_novec_unroller<Func, Evaluator, 0, Size>::run(eval,func);
|
|
379
|
+
} else {
|
|
380
|
+
return redux_novec_linear_unroller<Func, Evaluator, 0, Size>::run(eval, func);
|
|
351
381
|
}
|
|
352
382
|
}
|
|
353
383
|
};
|
|
354
384
|
|
|
355
385
|
// evaluator adaptor
|
|
356
|
-
template<typename
|
|
357
|
-
class redux_evaluator : public internal::evaluator<
|
|
358
|
-
|
|
359
|
-
|
|
360
|
-
public:
|
|
361
|
-
typedef
|
|
362
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
|
|
363
|
-
|
|
364
|
-
|
|
386
|
+
template <typename XprType_>
|
|
387
|
+
class redux_evaluator : public internal::evaluator<XprType_> {
|
|
388
|
+
typedef internal::evaluator<XprType_> Base;
|
|
389
|
+
|
|
390
|
+
public:
|
|
391
|
+
typedef XprType_ XprType;
|
|
392
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE explicit redux_evaluator(const XprType& xpr) : Base(xpr) {}
|
|
393
|
+
|
|
365
394
|
typedef typename XprType::Scalar Scalar;
|
|
366
395
|
typedef typename XprType::CoeffReturnType CoeffReturnType;
|
|
367
396
|
typedef typename XprType::PacketScalar PacketScalar;
|
|
368
|
-
|
|
397
|
+
|
|
369
398
|
enum {
|
|
370
399
|
MaxRowsAtCompileTime = XprType::MaxRowsAtCompileTime,
|
|
371
400
|
MaxColsAtCompileTime = XprType::MaxColsAtCompileTime,
|
|
372
|
-
// TODO we should not remove DirectAccessBit and rather find an elegant way to query the alignment offset at runtime
|
|
401
|
+
// TODO we should not remove DirectAccessBit and rather find an elegant way to query the alignment offset at runtime
|
|
402
|
+
// from the evaluator
|
|
373
403
|
Flags = Base::Flags & ~DirectAccessBit,
|
|
374
404
|
IsRowMajor = XprType::IsRowMajor,
|
|
375
405
|
SizeAtCompileTime = XprType::SizeAtCompileTime,
|
|
376
406
|
InnerSizeAtCompileTime = XprType::InnerSizeAtCompileTime
|
|
377
407
|
};
|
|
378
|
-
|
|
379
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
|
|
380
|
-
|
|
381
|
-
|
|
382
|
-
|
|
383
|
-
template<int LoadMode, typename PacketType>
|
|
384
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
|
|
385
|
-
|
|
386
|
-
|
|
387
|
-
|
|
408
|
+
|
|
409
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeffByOuterInner(Index outer, Index inner) const {
|
|
410
|
+
return Base::coeff(IsRowMajor ? outer : inner, IsRowMajor ? inner : outer);
|
|
411
|
+
}
|
|
412
|
+
|
|
413
|
+
template <int LoadMode, typename PacketType>
|
|
414
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE PacketType packetByOuterInner(Index outer, Index inner) const {
|
|
415
|
+
return Base::template packet<LoadMode, PacketType>(IsRowMajor ? outer : inner, IsRowMajor ? inner : outer);
|
|
416
|
+
}
|
|
417
|
+
|
|
418
|
+
template <int LoadMode, typename PacketType>
|
|
419
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE PacketType packetSegmentByOuterInner(Index outer, Index inner, Index begin,
|
|
420
|
+
Index count) const {
|
|
421
|
+
return Base::template packetSegment<LoadMode, PacketType>(IsRowMajor ? outer : inner, IsRowMajor ? inner : outer,
|
|
422
|
+
begin, count);
|
|
423
|
+
}
|
|
388
424
|
};
|
|
389
425
|
|
|
390
|
-
}
|
|
426
|
+
} // end namespace internal
|
|
391
427
|
|
|
392
428
|
/***************************************************************************
|
|
393
|
-
* Part 4 : public API
|
|
394
|
-
***************************************************************************/
|
|
395
|
-
|
|
429
|
+
* Part 4 : public API
|
|
430
|
+
***************************************************************************/
|
|
396
431
|
|
|
397
432
|
/** \returns the result of a full redux operation on the whole matrix or vector using \a func
|
|
398
|
-
|
|
399
|
-
|
|
400
|
-
|
|
401
|
-
|
|
402
|
-
|
|
403
|
-
|
|
404
|
-
|
|
405
|
-
|
|
406
|
-
template<typename Derived>
|
|
407
|
-
template<typename Func>
|
|
408
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar
|
|
409
|
-
|
|
410
|
-
|
|
411
|
-
eigen_assert(this->rows()>0 && this->cols()>0 && "you are using an empty matrix");
|
|
433
|
+
*
|
|
434
|
+
* The template parameter \a BinaryOp is the type of the functor \a func which must be
|
|
435
|
+
* an associative operator. Both current C++98 and C++11 functor styles are handled.
|
|
436
|
+
*
|
|
437
|
+
* \warning the matrix must be not empty, otherwise an assertion is triggered.
|
|
438
|
+
*
|
|
439
|
+
* \sa DenseBase::sum(), DenseBase::minCoeff(), DenseBase::maxCoeff(), MatrixBase::colwise(), MatrixBase::rowwise()
|
|
440
|
+
*/
|
|
441
|
+
template <typename Derived>
|
|
442
|
+
template <typename Func>
|
|
443
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar DenseBase<Derived>::redux(
|
|
444
|
+
const Func& func) const {
|
|
445
|
+
eigen_assert(this->rows() > 0 && this->cols() > 0 && "you are using an empty matrix");
|
|
412
446
|
|
|
413
447
|
typedef typename internal::redux_evaluator<Derived> ThisEvaluator;
|
|
414
448
|
ThisEvaluator thisEval(derived());
|
|
415
449
|
|
|
416
450
|
// The initial expression is passed to the reducer as an additional argument instead of
|
|
417
|
-
// passing it as a member of redux_evaluator to help
|
|
451
|
+
// passing it as a member of redux_evaluator to help
|
|
418
452
|
return internal::redux_impl<Func, ThisEvaluator>::run(thisEval, func, derived());
|
|
419
453
|
}
|
|
420
454
|
|
|
421
455
|
/** \returns the minimum of all coefficients of \c *this.
|
|
422
|
-
|
|
423
|
-
|
|
424
|
-
|
|
425
|
-
|
|
426
|
-
|
|
427
|
-
|
|
428
|
-
template<typename Derived>
|
|
429
|
-
template<int NaNPropagation>
|
|
430
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar
|
|
431
|
-
|
|
432
|
-
{
|
|
433
|
-
return derived().redux(Eigen::internal::scalar_min_op<Scalar,Scalar, NaNPropagation>());
|
|
456
|
+
* In case \c *this contains NaN, NaNPropagation determines the behavior:
|
|
457
|
+
* NaNPropagation == PropagateFast : undefined
|
|
458
|
+
* NaNPropagation == PropagateNaN : result is NaN
|
|
459
|
+
* NaNPropagation == PropagateNumbers : result is minimum of elements that are not NaN
|
|
460
|
+
* \warning the matrix must be not empty, otherwise an assertion is triggered.
|
|
461
|
+
*/
|
|
462
|
+
template <typename Derived>
|
|
463
|
+
template <int NaNPropagation>
|
|
464
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar DenseBase<Derived>::minCoeff() const {
|
|
465
|
+
return derived().redux(Eigen::internal::scalar_min_op<Scalar, Scalar, NaNPropagation>());
|
|
434
466
|
}
|
|
435
467
|
|
|
436
|
-
/** \returns the maximum of all coefficients of \c *this.
|
|
437
|
-
|
|
438
|
-
|
|
439
|
-
|
|
440
|
-
|
|
441
|
-
|
|
442
|
-
|
|
443
|
-
template<typename Derived>
|
|
444
|
-
template<int NaNPropagation>
|
|
445
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar
|
|
446
|
-
|
|
447
|
-
{
|
|
448
|
-
return derived().redux(Eigen::internal::scalar_max_op<Scalar,Scalar, NaNPropagation>());
|
|
468
|
+
/** \returns the maximum of all coefficients of \c *this.
|
|
469
|
+
* In case \c *this contains NaN, NaNPropagation determines the behavior:
|
|
470
|
+
* NaNPropagation == PropagateFast : undefined
|
|
471
|
+
* NaNPropagation == PropagateNaN : result is NaN
|
|
472
|
+
* NaNPropagation == PropagateNumbers : result is maximum of elements that are not NaN
|
|
473
|
+
* \warning the matrix must be not empty, otherwise an assertion is triggered.
|
|
474
|
+
*/
|
|
475
|
+
template <typename Derived>
|
|
476
|
+
template <int NaNPropagation>
|
|
477
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar DenseBase<Derived>::maxCoeff() const {
|
|
478
|
+
return derived().redux(Eigen::internal::scalar_max_op<Scalar, Scalar, NaNPropagation>());
|
|
449
479
|
}
|
|
450
480
|
|
|
451
481
|
/** \returns the sum of all coefficients of \c *this
|
|
452
|
-
|
|
453
|
-
|
|
454
|
-
|
|
455
|
-
|
|
456
|
-
|
|
457
|
-
template<typename Derived>
|
|
458
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar
|
|
459
|
-
|
|
460
|
-
|
|
461
|
-
if(SizeAtCompileTime==0 || (SizeAtCompileTime==Dynamic && size()==0))
|
|
462
|
-
return Scalar(0);
|
|
463
|
-
return derived().redux(Eigen::internal::scalar_sum_op<Scalar,Scalar>());
|
|
482
|
+
*
|
|
483
|
+
* If \c *this is empty, then the value 0 is returned.
|
|
484
|
+
*
|
|
485
|
+
* \sa trace(), prod(), mean()
|
|
486
|
+
*/
|
|
487
|
+
template <typename Derived>
|
|
488
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar DenseBase<Derived>::sum() const {
|
|
489
|
+
if (SizeAtCompileTime == 0 || (SizeAtCompileTime == Dynamic && size() == 0)) return Scalar(0);
|
|
490
|
+
return derived().redux(Eigen::internal::scalar_sum_op<Scalar, Scalar>());
|
|
464
491
|
}
|
|
465
492
|
|
|
466
493
|
/** \returns the mean of all coefficients of *this
|
|
467
|
-
*
|
|
468
|
-
* \sa trace(), prod(), sum()
|
|
469
|
-
*/
|
|
470
|
-
template<typename Derived>
|
|
471
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar
|
|
472
|
-
DenseBase<Derived>::mean() const
|
|
473
|
-
{
|
|
494
|
+
*
|
|
495
|
+
* \sa trace(), prod(), sum()
|
|
496
|
+
*/
|
|
497
|
+
template <typename Derived>
|
|
498
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar DenseBase<Derived>::mean() const {
|
|
474
499
|
#ifdef __INTEL_COMPILER
|
|
475
|
-
|
|
476
|
-
|
|
500
|
+
#pragma warning push
|
|
501
|
+
#pragma warning(disable : 2259)
|
|
477
502
|
#endif
|
|
478
|
-
return Scalar(derived().redux(Eigen::internal::scalar_sum_op<Scalar,Scalar>())) / Scalar(this->size());
|
|
503
|
+
return Scalar(derived().redux(Eigen::internal::scalar_sum_op<Scalar, Scalar>())) / Scalar(this->size());
|
|
479
504
|
#ifdef __INTEL_COMPILER
|
|
480
|
-
|
|
505
|
+
#pragma warning pop
|
|
481
506
|
#endif
|
|
482
507
|
}
|
|
483
508
|
|
|
484
509
|
/** \returns the product of all coefficients of *this
|
|
485
|
-
|
|
486
|
-
|
|
487
|
-
|
|
488
|
-
|
|
489
|
-
|
|
490
|
-
|
|
491
|
-
template<typename Derived>
|
|
492
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar
|
|
493
|
-
|
|
494
|
-
{
|
|
495
|
-
if(SizeAtCompileTime==0 || (SizeAtCompileTime==Dynamic && size()==0))
|
|
496
|
-
return Scalar(1);
|
|
510
|
+
*
|
|
511
|
+
* Example: \include MatrixBase_prod.cpp
|
|
512
|
+
* Output: \verbinclude MatrixBase_prod.out
|
|
513
|
+
*
|
|
514
|
+
* \sa sum(), mean(), trace()
|
|
515
|
+
*/
|
|
516
|
+
template <typename Derived>
|
|
517
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar DenseBase<Derived>::prod() const {
|
|
518
|
+
if (SizeAtCompileTime == 0 || (SizeAtCompileTime == Dynamic && size() == 0)) return Scalar(1);
|
|
497
519
|
return derived().redux(Eigen::internal::scalar_product_op<Scalar>());
|
|
498
520
|
}
|
|
499
521
|
|
|
500
522
|
/** \returns the trace of \c *this, i.e. the sum of the coefficients on the main diagonal.
|
|
501
|
-
|
|
502
|
-
|
|
503
|
-
|
|
504
|
-
|
|
505
|
-
|
|
506
|
-
template<typename Derived>
|
|
507
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar
|
|
508
|
-
MatrixBase<Derived>::trace() const
|
|
509
|
-
{
|
|
523
|
+
*
|
|
524
|
+
* \c *this can be any matrix, not necessarily square.
|
|
525
|
+
*
|
|
526
|
+
* \sa diagonal(), sum()
|
|
527
|
+
*/
|
|
528
|
+
template <typename Derived>
|
|
529
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename internal::traits<Derived>::Scalar MatrixBase<Derived>::trace() const {
|
|
510
530
|
return derived().diagonal().sum();
|
|
511
531
|
}
|
|
512
532
|
|
|
513
|
-
}
|
|
533
|
+
} // end namespace Eigen
|
|
514
534
|
|
|
515
|
-
#endif
|
|
535
|
+
#endif // EIGEN_REDUX_H
|