@smake/eigen 1.1.0 → 1.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/eigen/Eigen/AccelerateSupport +52 -0
- package/eigen/Eigen/Cholesky +18 -20
- package/eigen/Eigen/CholmodSupport +28 -28
- package/eigen/Eigen/Core +187 -120
- package/eigen/Eigen/Eigenvalues +16 -13
- package/eigen/Eigen/Geometry +18 -18
- package/eigen/Eigen/Householder +9 -7
- package/eigen/Eigen/IterativeLinearSolvers +8 -4
- package/eigen/Eigen/Jacobi +14 -13
- package/eigen/Eigen/KLUSupport +23 -21
- package/eigen/Eigen/LU +15 -16
- package/eigen/Eigen/MetisSupport +12 -12
- package/eigen/Eigen/OrderingMethods +54 -51
- package/eigen/Eigen/PaStiXSupport +23 -21
- package/eigen/Eigen/PardisoSupport +17 -14
- package/eigen/Eigen/QR +18 -20
- package/eigen/Eigen/QtAlignedMalloc +5 -12
- package/eigen/Eigen/SPQRSupport +21 -14
- package/eigen/Eigen/SVD +23 -17
- package/eigen/Eigen/Sparse +1 -2
- package/eigen/Eigen/SparseCholesky +18 -15
- package/eigen/Eigen/SparseCore +18 -17
- package/eigen/Eigen/SparseLU +9 -9
- package/eigen/Eigen/SparseQR +16 -14
- package/eigen/Eigen/StdDeque +5 -2
- package/eigen/Eigen/StdList +5 -2
- package/eigen/Eigen/StdVector +5 -2
- package/eigen/Eigen/SuperLUSupport +30 -24
- package/eigen/Eigen/ThreadPool +80 -0
- package/eigen/Eigen/UmfPackSupport +19 -17
- package/eigen/Eigen/Version +14 -0
- package/eigen/Eigen/src/AccelerateSupport/AccelerateSupport.h +423 -0
- package/eigen/Eigen/src/AccelerateSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Cholesky/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Cholesky/LDLT.h +366 -405
- package/eigen/Eigen/src/Cholesky/LLT.h +323 -367
- package/eigen/Eigen/src/Cholesky/LLT_LAPACKE.h +81 -56
- package/eigen/Eigen/src/CholmodSupport/CholmodSupport.h +585 -529
- package/eigen/Eigen/src/CholmodSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Core/ArithmeticSequence.h +143 -317
- package/eigen/Eigen/src/Core/Array.h +329 -370
- package/eigen/Eigen/src/Core/ArrayBase.h +190 -203
- package/eigen/Eigen/src/Core/ArrayWrapper.h +126 -170
- package/eigen/Eigen/src/Core/Assign.h +30 -40
- package/eigen/Eigen/src/Core/AssignEvaluator.h +651 -604
- package/eigen/Eigen/src/Core/Assign_MKL.h +125 -120
- package/eigen/Eigen/src/Core/BandMatrix.h +267 -282
- package/eigen/Eigen/src/Core/Block.h +371 -390
- package/eigen/Eigen/src/Core/CommaInitializer.h +85 -100
- package/eigen/Eigen/src/Core/ConditionEstimator.h +51 -53
- package/eigen/Eigen/src/Core/CoreEvaluators.h +1214 -937
- package/eigen/Eigen/src/Core/CoreIterators.h +72 -63
- package/eigen/Eigen/src/Core/CwiseBinaryOp.h +112 -129
- package/eigen/Eigen/src/Core/CwiseNullaryOp.h +676 -702
- package/eigen/Eigen/src/Core/CwiseTernaryOp.h +77 -103
- package/eigen/Eigen/src/Core/CwiseUnaryOp.h +55 -67
- package/eigen/Eigen/src/Core/CwiseUnaryView.h +127 -92
- package/eigen/Eigen/src/Core/DenseBase.h +630 -658
- package/eigen/Eigen/src/Core/DenseCoeffsBase.h +511 -628
- package/eigen/Eigen/src/Core/DenseStorage.h +511 -590
- package/eigen/Eigen/src/Core/DeviceWrapper.h +153 -0
- package/eigen/Eigen/src/Core/Diagonal.h +168 -207
- package/eigen/Eigen/src/Core/DiagonalMatrix.h +346 -317
- package/eigen/Eigen/src/Core/DiagonalProduct.h +12 -10
- package/eigen/Eigen/src/Core/Dot.h +167 -217
- package/eigen/Eigen/src/Core/EigenBase.h +74 -85
- package/eigen/Eigen/src/Core/Fill.h +138 -0
- package/eigen/Eigen/src/Core/FindCoeff.h +464 -0
- package/eigen/Eigen/src/Core/ForceAlignedAccess.h +90 -113
- package/eigen/Eigen/src/Core/Fuzzy.h +82 -105
- package/eigen/Eigen/src/Core/GeneralProduct.h +315 -261
- package/eigen/Eigen/src/Core/GenericPacketMath.h +1182 -520
- package/eigen/Eigen/src/Core/GlobalFunctions.h +193 -157
- package/eigen/Eigen/src/Core/IO.h +131 -156
- package/eigen/Eigen/src/Core/IndexedView.h +209 -125
- package/eigen/Eigen/src/Core/InnerProduct.h +260 -0
- package/eigen/Eigen/src/Core/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Core/Inverse.h +50 -59
- package/eigen/Eigen/src/Core/Map.h +123 -141
- package/eigen/Eigen/src/Core/MapBase.h +255 -282
- package/eigen/Eigen/src/Core/MathFunctions.h +1247 -1201
- package/eigen/Eigen/src/Core/MathFunctionsImpl.h +162 -99
- package/eigen/Eigen/src/Core/Matrix.h +463 -494
- package/eigen/Eigen/src/Core/MatrixBase.h +468 -470
- package/eigen/Eigen/src/Core/NestByValue.h +58 -52
- package/eigen/Eigen/src/Core/NoAlias.h +79 -86
- package/eigen/Eigen/src/Core/NumTraits.h +206 -206
- package/eigen/Eigen/src/Core/PartialReduxEvaluator.h +163 -142
- package/eigen/Eigen/src/Core/PermutationMatrix.h +461 -511
- package/eigen/Eigen/src/Core/PlainObjectBase.h +858 -972
- package/eigen/Eigen/src/Core/Product.h +246 -130
- package/eigen/Eigen/src/Core/ProductEvaluators.h +779 -671
- package/eigen/Eigen/src/Core/Random.h +153 -164
- package/eigen/Eigen/src/Core/RandomImpl.h +262 -0
- package/eigen/Eigen/src/Core/RealView.h +250 -0
- package/eigen/Eigen/src/Core/Redux.h +334 -314
- package/eigen/Eigen/src/Core/Ref.h +259 -257
- package/eigen/Eigen/src/Core/Replicate.h +92 -104
- package/eigen/Eigen/src/Core/Reshaped.h +215 -271
- package/eigen/Eigen/src/Core/ReturnByValue.h +47 -55
- package/eigen/Eigen/src/Core/Reverse.h +133 -148
- package/eigen/Eigen/src/Core/Select.h +68 -140
- package/eigen/Eigen/src/Core/SelfAdjointView.h +254 -290
- package/eigen/Eigen/src/Core/SelfCwiseBinaryOp.h +23 -20
- package/eigen/Eigen/src/Core/SkewSymmetricMatrix3.h +382 -0
- package/eigen/Eigen/src/Core/Solve.h +88 -102
- package/eigen/Eigen/src/Core/SolveTriangular.h +126 -124
- package/eigen/Eigen/src/Core/SolverBase.h +132 -133
- package/eigen/Eigen/src/Core/StableNorm.h +113 -147
- package/eigen/Eigen/src/Core/StlIterators.h +404 -248
- package/eigen/Eigen/src/Core/Stride.h +90 -92
- package/eigen/Eigen/src/Core/Swap.h +70 -39
- package/eigen/Eigen/src/Core/Transpose.h +258 -295
- package/eigen/Eigen/src/Core/Transpositions.h +270 -333
- package/eigen/Eigen/src/Core/TriangularMatrix.h +642 -743
- package/eigen/Eigen/src/Core/VectorBlock.h +59 -72
- package/eigen/Eigen/src/Core/VectorwiseOp.h +653 -704
- package/eigen/Eigen/src/Core/Visitor.h +464 -308
- package/eigen/Eigen/src/Core/arch/AVX/Complex.h +380 -187
- package/eigen/Eigen/src/Core/arch/AVX/MathFunctions.h +65 -163
- package/eigen/Eigen/src/Core/arch/AVX/PacketMath.h +2145 -638
- package/eigen/Eigen/src/Core/arch/AVX/Reductions.h +353 -0
- package/eigen/Eigen/src/Core/arch/AVX/TypeCasting.h +253 -60
- package/eigen/Eigen/src/Core/arch/AVX512/Complex.h +278 -228
- package/eigen/Eigen/src/Core/arch/AVX512/GemmKernel.h +1245 -0
- package/eigen/Eigen/src/Core/arch/AVX512/MathFunctions.h +48 -269
- package/eigen/Eigen/src/Core/arch/AVX512/MathFunctionsFP16.h +75 -0
- package/eigen/Eigen/src/Core/arch/AVX512/PacketMath.h +1597 -754
- package/eigen/Eigen/src/Core/arch/AVX512/PacketMathFP16.h +1413 -0
- package/eigen/Eigen/src/Core/arch/AVX512/Reductions.h +297 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TrsmKernel.h +1167 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TrsmUnrolls.inc +1219 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TypeCasting.h +229 -41
- package/eigen/Eigen/src/Core/arch/AVX512/TypeCastingFP16.h +130 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/Complex.h +420 -184
- package/eigen/Eigen/src/Core/arch/AltiVec/MathFunctions.h +40 -49
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProduct.h +2962 -2213
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductCommon.h +196 -212
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMA.h +713 -441
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMAbfloat16.h +742 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixVectorProduct.inc +2818 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/PacketMath.h +2380 -1362
- package/eigen/Eigen/src/Core/arch/AltiVec/TypeCasting.h +153 -0
- package/eigen/Eigen/src/Core/arch/Default/BFloat16.h +390 -224
- package/eigen/Eigen/src/Core/arch/Default/ConjHelper.h +78 -67
- package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctions.h +1784 -799
- package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctionsFwd.h +167 -50
- package/eigen/Eigen/src/Core/arch/Default/Half.h +528 -379
- package/eigen/Eigen/src/Core/arch/Default/Settings.h +10 -12
- package/eigen/Eigen/src/Core/arch/GPU/Complex.h +244 -0
- package/eigen/Eigen/src/Core/arch/GPU/MathFunctions.h +41 -40
- package/eigen/Eigen/src/Core/arch/GPU/PacketMath.h +550 -523
- package/eigen/Eigen/src/Core/arch/GPU/Tuple.h +268 -0
- package/eigen/Eigen/src/Core/arch/GPU/TypeCasting.h +27 -30
- package/eigen/Eigen/src/Core/arch/HIP/hcc/math_constants.h +8 -8
- package/eigen/Eigen/src/Core/arch/HVX/PacketMath.h +1088 -0
- package/eigen/Eigen/src/Core/arch/LSX/Complex.h +520 -0
- package/eigen/Eigen/src/Core/arch/LSX/GeneralBlockPanelKernel.h +23 -0
- package/eigen/Eigen/src/Core/arch/LSX/MathFunctions.h +43 -0
- package/eigen/Eigen/src/Core/arch/LSX/PacketMath.h +2866 -0
- package/eigen/Eigen/src/Core/arch/LSX/TypeCasting.h +526 -0
- package/eigen/Eigen/src/Core/arch/MSA/Complex.h +54 -82
- package/eigen/Eigen/src/Core/arch/MSA/MathFunctions.h +84 -92
- package/eigen/Eigen/src/Core/arch/MSA/PacketMath.h +51 -47
- package/eigen/Eigen/src/Core/arch/NEON/Complex.h +454 -306
- package/eigen/Eigen/src/Core/arch/NEON/GeneralBlockPanelKernel.h +175 -115
- package/eigen/Eigen/src/Core/arch/NEON/MathFunctions.h +23 -30
- package/eigen/Eigen/src/Core/arch/NEON/PacketMath.h +4366 -2857
- package/eigen/Eigen/src/Core/arch/NEON/TypeCasting.h +616 -393
- package/eigen/Eigen/src/Core/arch/NEON/UnaryFunctors.h +57 -0
- package/eigen/Eigen/src/Core/arch/SSE/Complex.h +350 -198
- package/eigen/Eigen/src/Core/arch/SSE/MathFunctions.h +38 -149
- package/eigen/Eigen/src/Core/arch/SSE/PacketMath.h +1791 -912
- package/eigen/Eigen/src/Core/arch/SSE/Reductions.h +324 -0
- package/eigen/Eigen/src/Core/arch/SSE/TypeCasting.h +128 -40
- package/eigen/Eigen/src/Core/arch/SVE/MathFunctions.h +10 -6
- package/eigen/Eigen/src/Core/arch/SVE/PacketMath.h +156 -234
- package/eigen/Eigen/src/Core/arch/SVE/TypeCasting.h +6 -3
- package/eigen/Eigen/src/Core/arch/SYCL/InteropHeaders.h +27 -32
- package/eigen/Eigen/src/Core/arch/SYCL/MathFunctions.h +119 -117
- package/eigen/Eigen/src/Core/arch/SYCL/PacketMath.h +325 -419
- package/eigen/Eigen/src/Core/arch/SYCL/TypeCasting.h +15 -17
- package/eigen/Eigen/src/Core/arch/ZVector/Complex.h +325 -181
- package/eigen/Eigen/src/Core/arch/ZVector/MathFunctions.h +94 -83
- package/eigen/Eigen/src/Core/arch/ZVector/PacketMath.h +811 -458
- package/eigen/Eigen/src/Core/functors/AssignmentFunctors.h +121 -124
- package/eigen/Eigen/src/Core/functors/BinaryFunctors.h +576 -370
- package/eigen/Eigen/src/Core/functors/NullaryFunctors.h +194 -109
- package/eigen/Eigen/src/Core/functors/StlFunctors.h +95 -112
- package/eigen/Eigen/src/Core/functors/TernaryFunctors.h +34 -7
- package/eigen/Eigen/src/Core/functors/UnaryFunctors.h +1038 -749
- package/eigen/Eigen/src/Core/products/GeneralBlockPanelKernel.h +1883 -1375
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix.h +312 -370
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular.h +189 -176
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular_BLAS.h +84 -81
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix_BLAS.h +154 -73
- package/eigen/Eigen/src/Core/products/GeneralMatrixVector.h +292 -337
- package/eigen/Eigen/src/Core/products/GeneralMatrixVector_BLAS.h +80 -77
- package/eigen/Eigen/src/Core/products/Parallelizer.h +207 -105
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix.h +327 -388
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix_BLAS.h +206 -224
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector.h +138 -147
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector_BLAS.h +58 -61
- package/eigen/Eigen/src/Core/products/SelfadjointProduct.h +71 -71
- package/eigen/Eigen/src/Core/products/SelfadjointRank2Update.h +48 -47
- package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix.h +294 -369
- package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix_BLAS.h +246 -238
- package/eigen/Eigen/src/Core/products/TriangularMatrixVector.h +244 -247
- package/eigen/Eigen/src/Core/products/TriangularMatrixVector_BLAS.h +212 -192
- package/eigen/Eigen/src/Core/products/TriangularSolverMatrix.h +328 -277
- package/eigen/Eigen/src/Core/products/TriangularSolverMatrix_BLAS.h +108 -109
- package/eigen/Eigen/src/Core/products/TriangularSolverVector.h +68 -94
- package/eigen/Eigen/src/Core/util/Assert.h +158 -0
- package/eigen/Eigen/src/Core/util/BlasUtil.h +342 -303
- package/eigen/Eigen/src/Core/util/ConfigureVectorization.h +348 -317
- package/eigen/Eigen/src/Core/util/Constants.h +297 -262
- package/eigen/Eigen/src/Core/util/DisableStupidWarnings.h +130 -90
- package/eigen/Eigen/src/Core/util/EmulateArray.h +270 -0
- package/eigen/Eigen/src/Core/util/ForwardDeclarations.h +449 -247
- package/eigen/Eigen/src/Core/util/GpuHipCudaDefines.inc +101 -0
- package/eigen/Eigen/src/Core/util/GpuHipCudaUndefines.inc +45 -0
- package/eigen/Eigen/src/Core/util/IndexedViewHelper.h +417 -116
- package/eigen/Eigen/src/Core/util/IntegralConstant.h +211 -204
- package/eigen/Eigen/src/Core/util/MKL_support.h +39 -37
- package/eigen/Eigen/src/Core/util/Macros.h +655 -773
- package/eigen/Eigen/src/Core/util/MaxSizeVector.h +139 -0
- package/eigen/Eigen/src/Core/util/Memory.h +970 -748
- package/eigen/Eigen/src/Core/util/Meta.h +581 -633
- package/eigen/Eigen/src/Core/util/MoreMeta.h +638 -0
- package/eigen/Eigen/src/Core/util/ReenableStupidWarnings.h +32 -19
- package/eigen/Eigen/src/Core/util/ReshapedHelper.h +17 -17
- package/eigen/Eigen/src/Core/util/Serializer.h +209 -0
- package/eigen/Eigen/src/Core/util/StaticAssert.h +50 -166
- package/eigen/Eigen/src/Core/util/SymbolicIndex.h +377 -225
- package/eigen/Eigen/src/Core/util/XprHelper.h +784 -547
- package/eigen/Eigen/src/Eigenvalues/ComplexEigenSolver.h +246 -277
- package/eigen/Eigen/src/Eigenvalues/ComplexSchur.h +299 -319
- package/eigen/Eigen/src/Eigenvalues/ComplexSchur_LAPACKE.h +52 -48
- package/eigen/Eigen/src/Eigenvalues/EigenSolver.h +413 -456
- package/eigen/Eigen/src/Eigenvalues/GeneralizedEigenSolver.h +309 -325
- package/eigen/Eigen/src/Eigenvalues/GeneralizedSelfAdjointEigenSolver.h +157 -171
- package/eigen/Eigen/src/Eigenvalues/HessenbergDecomposition.h +292 -310
- package/eigen/Eigen/src/Eigenvalues/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Eigenvalues/MatrixBaseEigenvalues.h +89 -105
- package/eigen/Eigen/src/Eigenvalues/RealQZ.h +537 -607
- package/eigen/Eigen/src/Eigenvalues/RealSchur.h +342 -381
- package/eigen/Eigen/src/Eigenvalues/RealSchur_LAPACKE.h +41 -35
- package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h +541 -595
- package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver_LAPACKE.h +47 -44
- package/eigen/Eigen/src/Eigenvalues/Tridiagonalization.h +430 -462
- package/eigen/Eigen/src/Geometry/AlignedBox.h +226 -227
- package/eigen/Eigen/src/Geometry/AngleAxis.h +131 -133
- package/eigen/Eigen/src/Geometry/EulerAngles.h +163 -74
- package/eigen/Eigen/src/Geometry/Homogeneous.h +285 -333
- package/eigen/Eigen/src/Geometry/Hyperplane.h +151 -160
- package/eigen/Eigen/src/Geometry/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Geometry/OrthoMethods.h +168 -146
- package/eigen/Eigen/src/Geometry/ParametrizedLine.h +127 -127
- package/eigen/Eigen/src/Geometry/Quaternion.h +566 -506
- package/eigen/Eigen/src/Geometry/Rotation2D.h +107 -105
- package/eigen/Eigen/src/Geometry/RotationBase.h +148 -145
- package/eigen/Eigen/src/Geometry/Scaling.h +113 -106
- package/eigen/Eigen/src/Geometry/Transform.h +858 -936
- package/eigen/Eigen/src/Geometry/Translation.h +94 -92
- package/eigen/Eigen/src/Geometry/Umeyama.h +79 -84
- package/eigen/Eigen/src/Geometry/arch/Geometry_SIMD.h +90 -104
- package/eigen/Eigen/src/Householder/BlockHouseholder.h +51 -46
- package/eigen/Eigen/src/Householder/Householder.h +102 -124
- package/eigen/Eigen/src/Householder/HouseholderSequence.h +412 -453
- package/eigen/Eigen/src/Householder/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/IterativeLinearSolvers/BasicPreconditioners.h +149 -162
- package/eigen/Eigen/src/IterativeLinearSolvers/BiCGSTAB.h +124 -119
- package/eigen/Eigen/src/IterativeLinearSolvers/ConjugateGradient.h +92 -104
- package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteCholesky.h +251 -243
- package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteLUT.h +224 -228
- package/eigen/Eigen/src/IterativeLinearSolvers/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/IterativeLinearSolvers/IterativeSolverBase.h +178 -227
- package/eigen/Eigen/src/IterativeLinearSolvers/LeastSquareConjugateGradient.h +79 -84
- package/eigen/Eigen/src/IterativeLinearSolvers/SolveWithGuess.h +54 -60
- package/eigen/Eigen/src/Jacobi/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Jacobi/Jacobi.h +252 -308
- package/eigen/Eigen/src/KLUSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/KLUSupport/KLUSupport.h +208 -227
- package/eigen/Eigen/src/LU/Determinant.h +50 -69
- package/eigen/Eigen/src/LU/FullPivLU.h +545 -596
- package/eigen/Eigen/src/LU/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/LU/InverseImpl.h +206 -285
- package/eigen/Eigen/src/LU/PartialPivLU.h +390 -428
- package/eigen/Eigen/src/LU/PartialPivLU_LAPACKE.h +54 -40
- package/eigen/Eigen/src/LU/arch/InverseSize4.h +72 -70
- package/eigen/Eigen/src/MetisSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/MetisSupport/MetisSupport.h +81 -93
- package/eigen/Eigen/src/OrderingMethods/Amd.h +243 -265
- package/eigen/Eigen/src/OrderingMethods/Eigen_Colamd.h +831 -1004
- package/eigen/Eigen/src/OrderingMethods/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/OrderingMethods/Ordering.h +112 -119
- package/eigen/Eigen/src/PaStiXSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/PaStiXSupport/PaStiXSupport.h +524 -570
- package/eigen/Eigen/src/PardisoSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/PardisoSupport/PardisoSupport.h +385 -430
- package/eigen/Eigen/src/QR/ColPivHouseholderQR.h +479 -479
- package/eigen/Eigen/src/QR/ColPivHouseholderQR_LAPACKE.h +120 -56
- package/eigen/Eigen/src/QR/CompleteOrthogonalDecomposition.h +166 -153
- package/eigen/Eigen/src/QR/FullPivHouseholderQR.h +495 -475
- package/eigen/Eigen/src/QR/HouseholderQR.h +394 -285
- package/eigen/Eigen/src/QR/HouseholderQR_LAPACKE.h +32 -23
- package/eigen/Eigen/src/QR/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SPQRSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SPQRSupport/SuiteSparseQRSupport.h +244 -264
- package/eigen/Eigen/src/SVD/BDCSVD.h +817 -713
- package/eigen/Eigen/src/SVD/BDCSVD_LAPACKE.h +174 -0
- package/eigen/Eigen/src/SVD/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SVD/JacobiSVD.h +577 -543
- package/eigen/Eigen/src/SVD/JacobiSVD_LAPACKE.h +85 -49
- package/eigen/Eigen/src/SVD/SVDBase.h +242 -182
- package/eigen/Eigen/src/SVD/UpperBidiagonalization.h +200 -235
- package/eigen/Eigen/src/SparseCholesky/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky.h +765 -594
- package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky_impl.h +308 -94
- package/eigen/Eigen/src/SparseCore/AmbiVector.h +202 -251
- package/eigen/Eigen/src/SparseCore/CompressedStorage.h +184 -252
- package/eigen/Eigen/src/SparseCore/ConservativeSparseSparseProduct.h +134 -178
- package/eigen/Eigen/src/SparseCore/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseCore/SparseAssign.h +149 -140
- package/eigen/Eigen/src/SparseCore/SparseBlock.h +403 -440
- package/eigen/Eigen/src/SparseCore/SparseColEtree.h +100 -112
- package/eigen/Eigen/src/SparseCore/SparseCompressedBase.h +525 -303
- package/eigen/Eigen/src/SparseCore/SparseCwiseBinaryOp.h +555 -339
- package/eigen/Eigen/src/SparseCore/SparseCwiseUnaryOp.h +100 -108
- package/eigen/Eigen/src/SparseCore/SparseDenseProduct.h +169 -197
- package/eigen/Eigen/src/SparseCore/SparseDiagonalProduct.h +71 -71
- package/eigen/Eigen/src/SparseCore/SparseDot.h +49 -47
- package/eigen/Eigen/src/SparseCore/SparseFuzzy.h +13 -11
- package/eigen/Eigen/src/SparseCore/SparseMap.h +243 -253
- package/eigen/Eigen/src/SparseCore/SparseMatrix.h +1603 -1245
- package/eigen/Eigen/src/SparseCore/SparseMatrixBase.h +403 -350
- package/eigen/Eigen/src/SparseCore/SparsePermutation.h +186 -115
- package/eigen/Eigen/src/SparseCore/SparseProduct.h +94 -97
- package/eigen/Eigen/src/SparseCore/SparseRedux.h +22 -24
- package/eigen/Eigen/src/SparseCore/SparseRef.h +268 -295
- package/eigen/Eigen/src/SparseCore/SparseSelfAdjointView.h +370 -416
- package/eigen/Eigen/src/SparseCore/SparseSolverBase.h +78 -87
- package/eigen/Eigen/src/SparseCore/SparseSparseProductWithPruning.h +81 -95
- package/eigen/Eigen/src/SparseCore/SparseTranspose.h +62 -71
- package/eigen/Eigen/src/SparseCore/SparseTriangularView.h +132 -144
- package/eigen/Eigen/src/SparseCore/SparseUtil.h +138 -115
- package/eigen/Eigen/src/SparseCore/SparseVector.h +426 -372
- package/eigen/Eigen/src/SparseCore/SparseView.h +164 -193
- package/eigen/Eigen/src/SparseCore/TriangularSolver.h +129 -170
- package/eigen/Eigen/src/SparseLU/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseLU/SparseLU.h +756 -710
- package/eigen/Eigen/src/SparseLU/SparseLUImpl.h +61 -48
- package/eigen/Eigen/src/SparseLU/SparseLU_Memory.h +102 -118
- package/eigen/Eigen/src/SparseLU/SparseLU_Structs.h +38 -35
- package/eigen/Eigen/src/SparseLU/SparseLU_SupernodalMatrix.h +245 -301
- package/eigen/Eigen/src/SparseLU/SparseLU_Utils.h +44 -49
- package/eigen/Eigen/src/SparseLU/SparseLU_column_bmod.h +104 -108
- package/eigen/Eigen/src/SparseLU/SparseLU_column_dfs.h +89 -100
- package/eigen/Eigen/src/SparseLU/SparseLU_copy_to_ucol.h +57 -58
- package/eigen/Eigen/src/SparseLU/SparseLU_heap_relax_snode.h +43 -55
- package/eigen/Eigen/src/SparseLU/SparseLU_kernel_bmod.h +74 -71
- package/eigen/Eigen/src/SparseLU/SparseLU_panel_bmod.h +124 -132
- package/eigen/Eigen/src/SparseLU/SparseLU_panel_dfs.h +136 -159
- package/eigen/Eigen/src/SparseLU/SparseLU_pivotL.h +51 -52
- package/eigen/Eigen/src/SparseLU/SparseLU_pruneL.h +67 -73
- package/eigen/Eigen/src/SparseLU/SparseLU_relax_snode.h +24 -26
- package/eigen/Eigen/src/SparseQR/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseQR/SparseQR.h +450 -502
- package/eigen/Eigen/src/StlSupport/StdDeque.h +28 -93
- package/eigen/Eigen/src/StlSupport/StdList.h +28 -84
- package/eigen/Eigen/src/StlSupport/StdVector.h +28 -108
- package/eigen/Eigen/src/StlSupport/details.h +48 -50
- package/eigen/Eigen/src/SuperLUSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SuperLUSupport/SuperLUSupport.h +634 -730
- package/eigen/Eigen/src/ThreadPool/Barrier.h +70 -0
- package/eigen/Eigen/src/ThreadPool/CoreThreadPoolDevice.h +336 -0
- package/eigen/Eigen/src/ThreadPool/EventCount.h +241 -0
- package/eigen/Eigen/src/ThreadPool/ForkJoin.h +140 -0
- package/eigen/Eigen/src/ThreadPool/InternalHeaderCheck.h +4 -0
- package/eigen/Eigen/src/ThreadPool/NonBlockingThreadPool.h +587 -0
- package/eigen/Eigen/src/ThreadPool/RunQueue.h +230 -0
- package/eigen/Eigen/src/ThreadPool/ThreadCancel.h +21 -0
- package/eigen/Eigen/src/ThreadPool/ThreadEnvironment.h +43 -0
- package/eigen/Eigen/src/ThreadPool/ThreadLocal.h +289 -0
- package/eigen/Eigen/src/ThreadPool/ThreadPoolInterface.h +50 -0
- package/eigen/Eigen/src/ThreadPool/ThreadYield.h +16 -0
- package/eigen/Eigen/src/UmfPackSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/UmfPackSupport/UmfPackSupport.h +428 -464
- package/eigen/Eigen/src/misc/Image.h +41 -43
- package/eigen/Eigen/src/misc/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/misc/Kernel.h +39 -41
- package/eigen/Eigen/src/misc/RealSvd2x2.h +19 -21
- package/eigen/Eigen/src/misc/blas.h +83 -426
- package/eigen/Eigen/src/misc/lapacke.h +9972 -16179
- package/eigen/Eigen/src/misc/lapacke_helpers.h +163 -0
- package/eigen/Eigen/src/misc/lapacke_mangling.h +4 -5
- package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.inc +344 -0
- package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.inc +544 -0
- package/eigen/Eigen/src/plugins/{BlockMethods.h → BlockMethods.inc} +434 -506
- package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.inc +116 -0
- package/eigen/Eigen/src/plugins/{CommonCwiseUnaryOps.h → CommonCwiseUnaryOps.inc} +58 -68
- package/eigen/Eigen/src/plugins/IndexedViewMethods.inc +192 -0
- package/eigen/Eigen/src/plugins/InternalHeaderCheck.inc +3 -0
- package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.inc +331 -0
- package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.inc +118 -0
- package/eigen/Eigen/src/plugins/ReshapedMethods.inc +133 -0
- package/package.json +1 -1
- package/eigen/COPYING.APACHE +0 -203
- package/eigen/COPYING.BSD +0 -26
- package/eigen/COPYING.GPL +0 -674
- package/eigen/COPYING.LGPL +0 -502
- package/eigen/COPYING.MINPACK +0 -51
- package/eigen/COPYING.MPL2 +0 -373
- package/eigen/COPYING.README +0 -18
- package/eigen/Eigen/src/Core/BooleanRedux.h +0 -162
- package/eigen/Eigen/src/Core/arch/CUDA/Complex.h +0 -258
- package/eigen/Eigen/src/Core/arch/Default/TypeCasting.h +0 -120
- package/eigen/Eigen/src/Core/arch/SYCL/SyclMemoryModel.h +0 -694
- package/eigen/Eigen/src/Core/util/NonMPL2.h +0 -3
- package/eigen/Eigen/src/SparseCore/MappedSparseMatrix.h +0 -67
- package/eigen/Eigen/src/SparseLU/SparseLU_gemm_kernel.h +0 -280
- package/eigen/Eigen/src/misc/lapack.h +0 -152
- package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.h +0 -358
- package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.h +0 -696
- package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.h +0 -115
- package/eigen/Eigen/src/plugins/IndexedViewMethods.h +0 -262
- package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.h +0 -152
- package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.h +0 -95
- package/eigen/Eigen/src/plugins/ReshapedMethods.h +0 -149
- package/eigen/README.md +0 -5
|
@@ -11,12 +11,12 @@
|
|
|
11
11
|
#ifndef EIGEN_GENERAL_PRODUCT_H
|
|
12
12
|
#define EIGEN_GENERAL_PRODUCT_H
|
|
13
13
|
|
|
14
|
+
// IWYU pragma: private
|
|
15
|
+
#include "./InternalHeaderCheck.h"
|
|
16
|
+
|
|
14
17
|
namespace Eigen {
|
|
15
18
|
|
|
16
|
-
enum {
|
|
17
|
-
Large = 2,
|
|
18
|
-
Small = 3
|
|
19
|
-
};
|
|
19
|
+
enum { Large = 2, Small = 3 };
|
|
20
20
|
|
|
21
21
|
// Define the threshold value to fallback from the generic matrix-matrix product
|
|
22
22
|
// implementation (heavy) to the lightweight coeff-based product one.
|
|
@@ -30,64 +30,58 @@ enum {
|
|
|
30
30
|
|
|
31
31
|
namespace internal {
|
|
32
32
|
|
|
33
|
-
template<int Rows, int Cols, int Depth>
|
|
33
|
+
template <int Rows, int Cols, int Depth>
|
|
34
|
+
struct product_type_selector;
|
|
34
35
|
|
|
35
|
-
template<int Size, int MaxSize>
|
|
36
|
-
{
|
|
36
|
+
template <int Size, int MaxSize>
|
|
37
|
+
struct product_size_category {
|
|
37
38
|
enum {
|
|
38
|
-
|
|
39
|
-
is_large = MaxSize == Dynamic ||
|
|
40
|
-
Size >= EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD
|
|
41
|
-
|
|
42
|
-
#else
|
|
39
|
+
#ifndef EIGEN_GPU_COMPILE_PHASE
|
|
40
|
+
is_large = MaxSize == Dynamic || Size >= EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD ||
|
|
41
|
+
(Size == Dynamic && MaxSize >= EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD),
|
|
42
|
+
#else
|
|
43
43
|
is_large = 0,
|
|
44
|
-
|
|
45
|
-
value = is_large
|
|
46
|
-
|
|
47
|
-
|
|
44
|
+
#endif
|
|
45
|
+
value = is_large ? Large
|
|
46
|
+
: Size == 1 ? 1
|
|
47
|
+
: Small
|
|
48
48
|
};
|
|
49
49
|
};
|
|
50
50
|
|
|
51
|
-
template<typename Lhs, typename Rhs>
|
|
52
|
-
{
|
|
53
|
-
typedef
|
|
54
|
-
typedef
|
|
51
|
+
template <typename Lhs, typename Rhs>
|
|
52
|
+
struct product_type {
|
|
53
|
+
typedef remove_all_t<Lhs> Lhs_;
|
|
54
|
+
typedef remove_all_t<Rhs> Rhs_;
|
|
55
55
|
enum {
|
|
56
|
-
MaxRows = traits<
|
|
57
|
-
Rows
|
|
58
|
-
MaxCols = traits<
|
|
59
|
-
Cols
|
|
60
|
-
MaxDepth =
|
|
61
|
-
|
|
62
|
-
Depth = EIGEN_SIZE_MIN_PREFER_FIXED(traits<_Lhs>::ColsAtCompileTime,
|
|
63
|
-
traits<_Rhs>::RowsAtCompileTime)
|
|
56
|
+
MaxRows = traits<Lhs_>::MaxRowsAtCompileTime,
|
|
57
|
+
Rows = traits<Lhs_>::RowsAtCompileTime,
|
|
58
|
+
MaxCols = traits<Rhs_>::MaxColsAtCompileTime,
|
|
59
|
+
Cols = traits<Rhs_>::ColsAtCompileTime,
|
|
60
|
+
MaxDepth = min_size_prefer_fixed(traits<Lhs_>::MaxColsAtCompileTime, traits<Rhs_>::MaxRowsAtCompileTime),
|
|
61
|
+
Depth = min_size_prefer_fixed(traits<Lhs_>::ColsAtCompileTime, traits<Rhs_>::RowsAtCompileTime)
|
|
64
62
|
};
|
|
65
63
|
|
|
66
64
|
// the splitting into different lines of code here, introducing the _select enums and the typedef below,
|
|
67
65
|
// is to work around an internal compiler error with gcc 4.1 and 4.2.
|
|
68
|
-
private:
|
|
66
|
+
private:
|
|
69
67
|
enum {
|
|
70
|
-
rows_select = product_size_category<Rows,MaxRows>::value,
|
|
71
|
-
cols_select = product_size_category<Cols,MaxCols>::value,
|
|
72
|
-
depth_select = product_size_category<Depth,MaxDepth>::value
|
|
68
|
+
rows_select = product_size_category<Rows, MaxRows>::value,
|
|
69
|
+
cols_select = product_size_category<Cols, MaxCols>::value,
|
|
70
|
+
depth_select = product_size_category<Depth, MaxDepth>::value
|
|
73
71
|
};
|
|
74
72
|
typedef product_type_selector<rows_select, cols_select, depth_select> selector;
|
|
75
73
|
|
|
76
|
-
public:
|
|
77
|
-
enum {
|
|
78
|
-
value = selector::ret,
|
|
79
|
-
ret = selector::ret
|
|
80
|
-
};
|
|
74
|
+
public:
|
|
75
|
+
enum { value = selector::ret, ret = selector::ret };
|
|
81
76
|
#ifdef EIGEN_DEBUG_PRODUCT
|
|
82
|
-
static void debug()
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
EIGEN_DEBUG_VAR(value);
|
|
77
|
+
static void debug() {
|
|
78
|
+
EIGEN_DEBUG_VAR(Rows);
|
|
79
|
+
EIGEN_DEBUG_VAR(Cols);
|
|
80
|
+
EIGEN_DEBUG_VAR(Depth);
|
|
81
|
+
EIGEN_DEBUG_VAR(rows_select);
|
|
82
|
+
EIGEN_DEBUG_VAR(cols_select);
|
|
83
|
+
EIGEN_DEBUG_VAR(depth_select);
|
|
84
|
+
EIGEN_DEBUG_VAR(value);
|
|
91
85
|
}
|
|
92
86
|
#endif
|
|
93
87
|
};
|
|
@@ -96,36 +90,108 @@ public:
|
|
|
96
90
|
* based on the three dimensions of the product.
|
|
97
91
|
* This is a compile time mapping from {1,Small,Large}^3 -> {product types} */
|
|
98
92
|
// FIXME I'm not sure the current mapping is the ideal one.
|
|
99
|
-
template<int M, int N>
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
template
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
template
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
template
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
template<>
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
template<>
|
|
120
|
-
|
|
121
|
-
|
|
122
|
-
|
|
123
|
-
|
|
124
|
-
|
|
93
|
+
template <int M, int N>
|
|
94
|
+
struct product_type_selector<M, N, 1> {
|
|
95
|
+
enum { ret = OuterProduct };
|
|
96
|
+
};
|
|
97
|
+
template <int M>
|
|
98
|
+
struct product_type_selector<M, 1, 1> {
|
|
99
|
+
enum { ret = LazyCoeffBasedProductMode };
|
|
100
|
+
};
|
|
101
|
+
template <int N>
|
|
102
|
+
struct product_type_selector<1, N, 1> {
|
|
103
|
+
enum { ret = LazyCoeffBasedProductMode };
|
|
104
|
+
};
|
|
105
|
+
template <int Depth>
|
|
106
|
+
struct product_type_selector<1, 1, Depth> {
|
|
107
|
+
enum { ret = InnerProduct };
|
|
108
|
+
};
|
|
109
|
+
template <>
|
|
110
|
+
struct product_type_selector<1, 1, 1> {
|
|
111
|
+
enum { ret = InnerProduct };
|
|
112
|
+
};
|
|
113
|
+
template <>
|
|
114
|
+
struct product_type_selector<Small, 1, Small> {
|
|
115
|
+
enum { ret = CoeffBasedProductMode };
|
|
116
|
+
};
|
|
117
|
+
template <>
|
|
118
|
+
struct product_type_selector<1, Small, Small> {
|
|
119
|
+
enum { ret = CoeffBasedProductMode };
|
|
120
|
+
};
|
|
121
|
+
template <>
|
|
122
|
+
struct product_type_selector<Small, Small, Small> {
|
|
123
|
+
enum { ret = CoeffBasedProductMode };
|
|
124
|
+
};
|
|
125
|
+
template <>
|
|
126
|
+
struct product_type_selector<Small, Small, 1> {
|
|
127
|
+
enum { ret = LazyCoeffBasedProductMode };
|
|
128
|
+
};
|
|
129
|
+
template <>
|
|
130
|
+
struct product_type_selector<Small, Large, 1> {
|
|
131
|
+
enum { ret = LazyCoeffBasedProductMode };
|
|
132
|
+
};
|
|
133
|
+
template <>
|
|
134
|
+
struct product_type_selector<Large, Small, 1> {
|
|
135
|
+
enum { ret = LazyCoeffBasedProductMode };
|
|
136
|
+
};
|
|
137
|
+
template <>
|
|
138
|
+
struct product_type_selector<1, Large, Small> {
|
|
139
|
+
enum { ret = CoeffBasedProductMode };
|
|
140
|
+
};
|
|
141
|
+
template <>
|
|
142
|
+
struct product_type_selector<1, Large, Large> {
|
|
143
|
+
enum { ret = GemvProduct };
|
|
144
|
+
};
|
|
145
|
+
template <>
|
|
146
|
+
struct product_type_selector<1, Small, Large> {
|
|
147
|
+
enum { ret = CoeffBasedProductMode };
|
|
148
|
+
};
|
|
149
|
+
template <>
|
|
150
|
+
struct product_type_selector<Large, 1, Small> {
|
|
151
|
+
enum { ret = CoeffBasedProductMode };
|
|
152
|
+
};
|
|
153
|
+
template <>
|
|
154
|
+
struct product_type_selector<Large, 1, Large> {
|
|
155
|
+
enum { ret = GemvProduct };
|
|
156
|
+
};
|
|
157
|
+
template <>
|
|
158
|
+
struct product_type_selector<Small, 1, Large> {
|
|
159
|
+
enum { ret = CoeffBasedProductMode };
|
|
160
|
+
};
|
|
161
|
+
template <>
|
|
162
|
+
struct product_type_selector<Small, Small, Large> {
|
|
163
|
+
enum { ret = GemmProduct };
|
|
164
|
+
};
|
|
165
|
+
template <>
|
|
166
|
+
struct product_type_selector<Large, Small, Large> {
|
|
167
|
+
enum { ret = GemmProduct };
|
|
168
|
+
};
|
|
169
|
+
template <>
|
|
170
|
+
struct product_type_selector<Small, Large, Large> {
|
|
171
|
+
enum { ret = GemmProduct };
|
|
172
|
+
};
|
|
173
|
+
template <>
|
|
174
|
+
struct product_type_selector<Large, Large, Large> {
|
|
175
|
+
enum { ret = GemmProduct };
|
|
176
|
+
};
|
|
177
|
+
template <>
|
|
178
|
+
struct product_type_selector<Large, Small, Small> {
|
|
179
|
+
enum { ret = CoeffBasedProductMode };
|
|
180
|
+
};
|
|
181
|
+
template <>
|
|
182
|
+
struct product_type_selector<Small, Large, Small> {
|
|
183
|
+
enum { ret = CoeffBasedProductMode };
|
|
184
|
+
};
|
|
185
|
+
template <>
|
|
186
|
+
struct product_type_selector<Large, Large, Small> {
|
|
187
|
+
enum { ret = GemmProduct };
|
|
188
|
+
};
|
|
189
|
+
|
|
190
|
+
} // end namespace internal
|
|
125
191
|
|
|
126
192
|
/***********************************************************************
|
|
127
|
-
* Implementation of Inner Vector Vector Product
|
|
128
|
-
***********************************************************************/
|
|
193
|
+
* Implementation of Inner Vector Vector Product
|
|
194
|
+
***********************************************************************/
|
|
129
195
|
|
|
130
196
|
// FIXME : maybe the "inner product" could return a Scalar
|
|
131
197
|
// instead of a 1x1 matrix ??
|
|
@@ -135,12 +201,12 @@ template<> struct product_type_selector<Large,Large,Small> { enum
|
|
|
135
201
|
// case, we could have a specialization for Block<MatrixType,1,1> with: operator=(Scalar x);
|
|
136
202
|
|
|
137
203
|
/***********************************************************************
|
|
138
|
-
* Implementation of Outer Vector Vector Product
|
|
139
|
-
***********************************************************************/
|
|
204
|
+
* Implementation of Outer Vector Vector Product
|
|
205
|
+
***********************************************************************/
|
|
140
206
|
|
|
141
207
|
/***********************************************************************
|
|
142
|
-
* Implementation of General Matrix Vector Product
|
|
143
|
-
***********************************************************************/
|
|
208
|
+
* Implementation of General Matrix Vector Product
|
|
209
|
+
***********************************************************************/
|
|
144
210
|
|
|
145
211
|
/* According to the shape/flags of the matrix we have to distinghish 3 different cases:
|
|
146
212
|
* 1 - the matrix is col-major, BLAS compatible and M is large => call fast BLAS-like colmajor routine
|
|
@@ -151,79 +217,72 @@ template<> struct product_type_selector<Large,Large,Small> { enum
|
|
|
151
217
|
*/
|
|
152
218
|
namespace internal {
|
|
153
219
|
|
|
154
|
-
template<int Side, int StorageOrder, bool BlasCompatible>
|
|
220
|
+
template <int Side, int StorageOrder, bool BlasCompatible>
|
|
155
221
|
struct gemv_dense_selector;
|
|
156
222
|
|
|
157
|
-
}
|
|
223
|
+
} // end namespace internal
|
|
158
224
|
|
|
159
225
|
namespace internal {
|
|
160
226
|
|
|
161
|
-
template<typename Scalar,int Size,int MaxSize,bool Cond>
|
|
227
|
+
template <typename Scalar, int Size, int MaxSize, bool Cond>
|
|
228
|
+
struct gemv_static_vector_if;
|
|
162
229
|
|
|
163
|
-
template<typename Scalar,int Size,int MaxSize>
|
|
164
|
-
struct gemv_static_vector_if<Scalar,Size,MaxSize,false>
|
|
165
|
-
{
|
|
166
|
-
|
|
230
|
+
template <typename Scalar, int Size, int MaxSize>
|
|
231
|
+
struct gemv_static_vector_if<Scalar, Size, MaxSize, false> {
|
|
232
|
+
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC constexpr Scalar* data() {
|
|
233
|
+
eigen_internal_assert(false && "should never be called");
|
|
234
|
+
return 0;
|
|
235
|
+
}
|
|
167
236
|
};
|
|
168
237
|
|
|
169
|
-
template<typename Scalar,int Size>
|
|
170
|
-
struct gemv_static_vector_if<Scalar,Size,Dynamic,true>
|
|
171
|
-
{
|
|
172
|
-
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC Scalar* data() { return 0; }
|
|
238
|
+
template <typename Scalar, int Size>
|
|
239
|
+
struct gemv_static_vector_if<Scalar, Size, Dynamic, true> {
|
|
240
|
+
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC constexpr Scalar* data() { return 0; }
|
|
173
241
|
};
|
|
174
242
|
|
|
175
|
-
template<typename Scalar,int Size,int MaxSize>
|
|
176
|
-
struct gemv_static_vector_if<Scalar,Size,MaxSize,true>
|
|
177
|
-
|
|
178
|
-
|
|
179
|
-
|
|
180
|
-
|
|
181
|
-
};
|
|
182
|
-
#if EIGEN_MAX_STATIC_ALIGN_BYTES!=0
|
|
183
|
-
internal::plain_array<Scalar,EIGEN_SIZE_MIN_PREFER_FIXED(Size,MaxSize),0,EIGEN_PLAIN_ENUM_MIN(AlignedMax,PacketSize)> m_data;
|
|
184
|
-
EIGEN_STRONG_INLINE Scalar* data() { return m_data.array; }
|
|
185
|
-
#else
|
|
243
|
+
template <typename Scalar, int Size, int MaxSize>
|
|
244
|
+
struct gemv_static_vector_if<Scalar, Size, MaxSize, true> {
|
|
245
|
+
#if EIGEN_MAX_STATIC_ALIGN_BYTES != 0
|
|
246
|
+
internal::plain_array<Scalar, internal::min_size_prefer_fixed(Size, MaxSize), 0, AlignedMax> m_data;
|
|
247
|
+
EIGEN_STRONG_INLINE constexpr Scalar* data() { return m_data.array; }
|
|
248
|
+
#else
|
|
186
249
|
// Some architectures cannot align on the stack,
|
|
187
250
|
// => let's manually enforce alignment by allocating more data and return the address of the first aligned element.
|
|
188
|
-
internal::plain_array<Scalar,
|
|
189
|
-
EIGEN_STRONG_INLINE Scalar* data() {
|
|
190
|
-
return
|
|
191
|
-
|
|
192
|
-
: m_data.array;
|
|
251
|
+
internal::plain_array<Scalar, internal::min_size_prefer_fixed(Size, MaxSize) + EIGEN_MAX_ALIGN_BYTES, 0> m_data;
|
|
252
|
+
EIGEN_STRONG_INLINE constexpr Scalar* data() {
|
|
253
|
+
return reinterpret_cast<Scalar*>((std::uintptr_t(m_data.array) & ~(std::size_t(EIGEN_MAX_ALIGN_BYTES - 1))) +
|
|
254
|
+
EIGEN_MAX_ALIGN_BYTES);
|
|
193
255
|
}
|
|
194
|
-
|
|
256
|
+
#endif
|
|
195
257
|
};
|
|
196
258
|
|
|
197
259
|
// The vector is on the left => transposition
|
|
198
|
-
template<int StorageOrder, bool BlasCompatible>
|
|
199
|
-
struct gemv_dense_selector<OnTheLeft,StorageOrder,BlasCompatible>
|
|
200
|
-
|
|
201
|
-
|
|
202
|
-
static void run(const Lhs &lhs, const Rhs &rhs, Dest& dest, const typename Dest::Scalar& alpha)
|
|
203
|
-
{
|
|
260
|
+
template <int StorageOrder, bool BlasCompatible>
|
|
261
|
+
struct gemv_dense_selector<OnTheLeft, StorageOrder, BlasCompatible> {
|
|
262
|
+
template <typename Lhs, typename Rhs, typename Dest>
|
|
263
|
+
static void run(const Lhs& lhs, const Rhs& rhs, Dest& dest, const typename Dest::Scalar& alpha) {
|
|
204
264
|
Transpose<Dest> destT(dest);
|
|
205
265
|
enum { OtherStorageOrder = StorageOrder == RowMajor ? ColMajor : RowMajor };
|
|
206
|
-
gemv_dense_selector<OnTheRight,OtherStorageOrder,BlasCompatible
|
|
207
|
-
|
|
266
|
+
gemv_dense_selector<OnTheRight, OtherStorageOrder, BlasCompatible>::run(rhs.transpose(), lhs.transpose(), destT,
|
|
267
|
+
alpha);
|
|
208
268
|
}
|
|
209
269
|
};
|
|
210
270
|
|
|
211
|
-
template<>
|
|
212
|
-
{
|
|
213
|
-
template<typename Lhs, typename Rhs, typename Dest>
|
|
214
|
-
static inline void run(const Lhs
|
|
215
|
-
|
|
216
|
-
typedef typename
|
|
217
|
-
typedef typename
|
|
218
|
-
|
|
219
|
-
typedef typename Dest::RealScalar RealScalar;
|
|
220
|
-
|
|
271
|
+
template <>
|
|
272
|
+
struct gemv_dense_selector<OnTheRight, ColMajor, true> {
|
|
273
|
+
template <typename Lhs, typename Rhs, typename Dest>
|
|
274
|
+
static inline void run(const Lhs& lhs, const Rhs& rhs, Dest& dest, const typename Dest::Scalar& alpha) {
|
|
275
|
+
typedef typename Lhs::Scalar LhsScalar;
|
|
276
|
+
typedef typename Rhs::Scalar RhsScalar;
|
|
277
|
+
typedef typename Dest::Scalar ResScalar;
|
|
278
|
+
|
|
221
279
|
typedef internal::blas_traits<Lhs> LhsBlasTraits;
|
|
222
280
|
typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
|
|
223
281
|
typedef internal::blas_traits<Rhs> RhsBlasTraits;
|
|
224
282
|
typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
|
|
225
|
-
|
|
226
|
-
typedef Map<Matrix<ResScalar,Dynamic,1>,
|
|
283
|
+
|
|
284
|
+
typedef Map<Matrix<ResScalar, Dynamic, 1>, plain_enum_min(AlignedMax, internal::packet_traits<ResScalar>::size)>
|
|
285
|
+
MappedDest;
|
|
227
286
|
|
|
228
287
|
ActualLhsType actualLhs = LhsBlasTraits::extract(lhs);
|
|
229
288
|
ActualRhsType actualRhs = RhsBlasTraits::extract(rhs);
|
|
@@ -231,68 +290,64 @@ template<> struct gemv_dense_selector<OnTheRight,ColMajor,true>
|
|
|
231
290
|
ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
|
|
232
291
|
|
|
233
292
|
// make sure Dest is a compile-time vector type (bug 1166)
|
|
234
|
-
typedef
|
|
293
|
+
typedef std::conditional_t<Dest::IsVectorAtCompileTime, Dest, typename Dest::ColXpr> ActualDest;
|
|
235
294
|
|
|
236
295
|
enum {
|
|
237
296
|
// FIXME find a way to allow an inner stride on the result if packet_traits<Scalar>::size==1
|
|
238
297
|
// on, the other hand it is good for the cache to pack the vector anyways...
|
|
239
|
-
EvalToDestAtCompileTime = (ActualDest::InnerStrideAtCompileTime==1),
|
|
298
|
+
EvalToDestAtCompileTime = (ActualDest::InnerStrideAtCompileTime == 1),
|
|
240
299
|
ComplexByReal = (NumTraits<LhsScalar>::IsComplex) && (!NumTraits<RhsScalar>::IsComplex),
|
|
241
|
-
MightCannotUseDest = ((!EvalToDestAtCompileTime) || ComplexByReal) && (ActualDest::MaxSizeAtCompileTime!=0)
|
|
300
|
+
MightCannotUseDest = ((!EvalToDestAtCompileTime) || ComplexByReal) && (ActualDest::MaxSizeAtCompileTime != 0)
|
|
242
301
|
};
|
|
243
302
|
|
|
244
|
-
typedef const_blas_data_mapper<LhsScalar,Index,ColMajor> LhsMapper;
|
|
245
|
-
typedef const_blas_data_mapper<RhsScalar,Index,RowMajor> RhsMapper;
|
|
246
|
-
RhsScalar compatibleAlpha = get_factor<ResScalar,RhsScalar>::run(actualAlpha);
|
|
303
|
+
typedef const_blas_data_mapper<LhsScalar, Index, ColMajor> LhsMapper;
|
|
304
|
+
typedef const_blas_data_mapper<RhsScalar, Index, RowMajor> RhsMapper;
|
|
305
|
+
RhsScalar compatibleAlpha = get_factor<ResScalar, RhsScalar>::run(actualAlpha);
|
|
247
306
|
|
|
248
|
-
if(!MightCannotUseDest)
|
|
249
|
-
{
|
|
307
|
+
if (!MightCannotUseDest) {
|
|
250
308
|
// shortcut if we are sure to be able to use dest directly,
|
|
251
309
|
// this ease the compiler to generate cleaner and more optimzized code for most common cases
|
|
252
|
-
general_matrix_vector_product
|
|
253
|
-
|
|
254
|
-
|
|
255
|
-
|
|
256
|
-
|
|
257
|
-
|
|
258
|
-
|
|
259
|
-
}
|
|
260
|
-
|
|
261
|
-
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
const bool alphaIsCompatible = (!ComplexByReal) || (numext::imag(actualAlpha)
|
|
310
|
+
general_matrix_vector_product<Index, LhsScalar, LhsMapper, ColMajor, LhsBlasTraits::NeedToConjugate, RhsScalar,
|
|
311
|
+
RhsMapper, RhsBlasTraits::NeedToConjugate>::run(actualLhs.rows(), actualLhs.cols(),
|
|
312
|
+
LhsMapper(actualLhs.data(),
|
|
313
|
+
actualLhs.outerStride()),
|
|
314
|
+
RhsMapper(actualRhs.data(),
|
|
315
|
+
actualRhs.innerStride()),
|
|
316
|
+
dest.data(), 1, compatibleAlpha);
|
|
317
|
+
} else {
|
|
318
|
+
gemv_static_vector_if<ResScalar, ActualDest::SizeAtCompileTime, ActualDest::MaxSizeAtCompileTime,
|
|
319
|
+
MightCannotUseDest>
|
|
320
|
+
static_dest;
|
|
321
|
+
|
|
322
|
+
const bool alphaIsCompatible = (!ComplexByReal) || (numext::is_exactly_zero(numext::imag(actualAlpha)));
|
|
265
323
|
const bool evalToDest = EvalToDestAtCompileTime && alphaIsCompatible;
|
|
266
324
|
|
|
267
|
-
ei_declare_aligned_stack_constructed_variable(ResScalar,actualDestPtr,dest.size(),
|
|
325
|
+
ei_declare_aligned_stack_constructed_variable(ResScalar, actualDestPtr, dest.size(),
|
|
268
326
|
evalToDest ? dest.data() : static_dest.data());
|
|
269
327
|
|
|
270
|
-
if(!evalToDest)
|
|
271
|
-
|
|
272
|
-
|
|
328
|
+
if (!evalToDest) {
|
|
329
|
+
#ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
|
|
330
|
+
constexpr int Size = Dest::SizeAtCompileTime;
|
|
273
331
|
Index size = dest.size();
|
|
274
332
|
EIGEN_DENSE_STORAGE_CTOR_PLUGIN
|
|
275
|
-
|
|
276
|
-
if(!alphaIsCompatible)
|
|
277
|
-
{
|
|
333
|
+
#endif
|
|
334
|
+
if (!alphaIsCompatible) {
|
|
278
335
|
MappedDest(actualDestPtr, dest.size()).setZero();
|
|
279
336
|
compatibleAlpha = RhsScalar(1);
|
|
280
|
-
}
|
|
281
|
-
else
|
|
337
|
+
} else
|
|
282
338
|
MappedDest(actualDestPtr, dest.size()) = dest;
|
|
283
339
|
}
|
|
284
340
|
|
|
285
|
-
general_matrix_vector_product
|
|
286
|
-
|
|
287
|
-
|
|
288
|
-
|
|
289
|
-
|
|
290
|
-
|
|
291
|
-
|
|
292
|
-
|
|
293
|
-
if (!evalToDest)
|
|
294
|
-
|
|
295
|
-
if(!alphaIsCompatible)
|
|
341
|
+
general_matrix_vector_product<Index, LhsScalar, LhsMapper, ColMajor, LhsBlasTraits::NeedToConjugate, RhsScalar,
|
|
342
|
+
RhsMapper, RhsBlasTraits::NeedToConjugate>::run(actualLhs.rows(), actualLhs.cols(),
|
|
343
|
+
LhsMapper(actualLhs.data(),
|
|
344
|
+
actualLhs.outerStride()),
|
|
345
|
+
RhsMapper(actualRhs.data(),
|
|
346
|
+
actualRhs.innerStride()),
|
|
347
|
+
actualDestPtr, 1, compatibleAlpha);
|
|
348
|
+
|
|
349
|
+
if (!evalToDest) {
|
|
350
|
+
if (!alphaIsCompatible)
|
|
296
351
|
dest.matrix() += actualAlpha * MappedDest(actualDestPtr, dest.size());
|
|
297
352
|
else
|
|
298
353
|
dest = MappedDest(actualDestPtr, dest.size());
|
|
@@ -301,165 +356,164 @@ template<> struct gemv_dense_selector<OnTheRight,ColMajor,true>
|
|
|
301
356
|
}
|
|
302
357
|
};
|
|
303
358
|
|
|
304
|
-
template<>
|
|
305
|
-
{
|
|
306
|
-
template<typename Lhs, typename Rhs, typename Dest>
|
|
307
|
-
static void run(const Lhs
|
|
308
|
-
|
|
309
|
-
typedef typename
|
|
310
|
-
typedef typename
|
|
311
|
-
|
|
312
|
-
|
|
359
|
+
template <>
|
|
360
|
+
struct gemv_dense_selector<OnTheRight, RowMajor, true> {
|
|
361
|
+
template <typename Lhs, typename Rhs, typename Dest>
|
|
362
|
+
static void run(const Lhs& lhs, const Rhs& rhs, Dest& dest, const typename Dest::Scalar& alpha) {
|
|
363
|
+
typedef typename Lhs::Scalar LhsScalar;
|
|
364
|
+
typedef typename Rhs::Scalar RhsScalar;
|
|
365
|
+
typedef typename Dest::Scalar ResScalar;
|
|
366
|
+
|
|
313
367
|
typedef internal::blas_traits<Lhs> LhsBlasTraits;
|
|
314
368
|
typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
|
|
315
369
|
typedef internal::blas_traits<Rhs> RhsBlasTraits;
|
|
316
370
|
typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
|
|
317
|
-
typedef
|
|
371
|
+
typedef internal::remove_all_t<ActualRhsType> ActualRhsTypeCleaned;
|
|
318
372
|
|
|
319
|
-
|
|
320
|
-
|
|
373
|
+
std::add_const_t<ActualLhsType> actualLhs = LhsBlasTraits::extract(lhs);
|
|
374
|
+
std::add_const_t<ActualRhsType> actualRhs = RhsBlasTraits::extract(rhs);
|
|
321
375
|
|
|
322
376
|
ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
|
|
323
377
|
|
|
324
378
|
enum {
|
|
325
379
|
// FIXME find a way to allow an inner stride on the result if packet_traits<Scalar>::size==1
|
|
326
380
|
// on, the other hand it is good for the cache to pack the vector anyways...
|
|
327
|
-
DirectlyUseRhs =
|
|
381
|
+
DirectlyUseRhs =
|
|
382
|
+
ActualRhsTypeCleaned::InnerStrideAtCompileTime == 1 || ActualRhsTypeCleaned::MaxSizeAtCompileTime == 0
|
|
328
383
|
};
|
|
329
384
|
|
|
330
|
-
gemv_static_vector_if<RhsScalar,ActualRhsTypeCleaned::SizeAtCompileTime,
|
|
385
|
+
gemv_static_vector_if<RhsScalar, ActualRhsTypeCleaned::SizeAtCompileTime,
|
|
386
|
+
ActualRhsTypeCleaned::MaxSizeAtCompileTime, !DirectlyUseRhs>
|
|
387
|
+
static_rhs;
|
|
331
388
|
|
|
332
|
-
ei_declare_aligned_stack_constructed_variable(
|
|
389
|
+
ei_declare_aligned_stack_constructed_variable(
|
|
390
|
+
RhsScalar, actualRhsPtr, actualRhs.size(),
|
|
333
391
|
DirectlyUseRhs ? const_cast<RhsScalar*>(actualRhs.data()) : static_rhs.data());
|
|
334
392
|
|
|
335
|
-
if(!DirectlyUseRhs)
|
|
336
|
-
|
|
337
|
-
|
|
393
|
+
if (!DirectlyUseRhs) {
|
|
394
|
+
#ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
|
|
395
|
+
constexpr int Size = ActualRhsTypeCleaned::SizeAtCompileTime;
|
|
338
396
|
Index size = actualRhs.size();
|
|
339
397
|
EIGEN_DENSE_STORAGE_CTOR_PLUGIN
|
|
340
|
-
|
|
398
|
+
#endif
|
|
341
399
|
Map<typename ActualRhsTypeCleaned::PlainObject>(actualRhsPtr, actualRhs.size()) = actualRhs;
|
|
342
400
|
}
|
|
343
401
|
|
|
344
|
-
typedef const_blas_data_mapper<LhsScalar,Index,RowMajor> LhsMapper;
|
|
345
|
-
typedef const_blas_data_mapper<RhsScalar,Index,ColMajor> RhsMapper;
|
|
346
|
-
general_matrix_vector_product
|
|
347
|
-
|
|
348
|
-
actualLhs.rows(), actualLhs.cols(),
|
|
349
|
-
|
|
350
|
-
|
|
351
|
-
|
|
352
|
-
|
|
402
|
+
typedef const_blas_data_mapper<LhsScalar, Index, RowMajor> LhsMapper;
|
|
403
|
+
typedef const_blas_data_mapper<RhsScalar, Index, ColMajor> RhsMapper;
|
|
404
|
+
general_matrix_vector_product<Index, LhsScalar, LhsMapper, RowMajor, LhsBlasTraits::NeedToConjugate, RhsScalar,
|
|
405
|
+
RhsMapper, RhsBlasTraits::NeedToConjugate>::
|
|
406
|
+
run(actualLhs.rows(), actualLhs.cols(), LhsMapper(actualLhs.data(), actualLhs.outerStride()),
|
|
407
|
+
RhsMapper(actualRhsPtr, 1), dest.data(),
|
|
408
|
+
dest.col(0).innerStride(), // NOTE if dest is not a vector at compile-time, then dest.innerStride() might
|
|
409
|
+
// be wrong. (bug 1166)
|
|
410
|
+
actualAlpha);
|
|
353
411
|
}
|
|
354
412
|
};
|
|
355
413
|
|
|
356
|
-
template<>
|
|
357
|
-
{
|
|
358
|
-
template<typename Lhs, typename Rhs, typename Dest>
|
|
359
|
-
static void run(const Lhs
|
|
360
|
-
|
|
361
|
-
|
|
362
|
-
// TODO if rhs is large enough it might be beneficial to make sure that dest is sequentially stored in memory,
|
|
363
|
-
|
|
414
|
+
template <>
|
|
415
|
+
struct gemv_dense_selector<OnTheRight, ColMajor, false> {
|
|
416
|
+
template <typename Lhs, typename Rhs, typename Dest>
|
|
417
|
+
static void run(const Lhs& lhs, const Rhs& rhs, Dest& dest, const typename Dest::Scalar& alpha) {
|
|
418
|
+
EIGEN_STATIC_ASSERT((!nested_eval<Lhs, 1>::Evaluate),
|
|
419
|
+
EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
|
|
420
|
+
// TODO if rhs is large enough it might be beneficial to make sure that dest is sequentially stored in memory,
|
|
421
|
+
// otherwise use a temp
|
|
422
|
+
typename nested_eval<Rhs, 1>::type actual_rhs(rhs);
|
|
364
423
|
const Index size = rhs.rows();
|
|
365
|
-
for(Index k=0; k<size; ++k)
|
|
366
|
-
dest += (alpha*actual_rhs.coeff(k)) * lhs.col(k);
|
|
424
|
+
for (Index k = 0; k < size; ++k) dest += (alpha * actual_rhs.coeff(k)) * lhs.col(k);
|
|
367
425
|
}
|
|
368
426
|
};
|
|
369
427
|
|
|
370
|
-
template<>
|
|
371
|
-
{
|
|
372
|
-
template<typename Lhs, typename Rhs, typename Dest>
|
|
373
|
-
static void run(const Lhs
|
|
374
|
-
|
|
375
|
-
|
|
376
|
-
typename nested_eval<Rhs,Lhs::RowsAtCompileTime>::type actual_rhs(rhs);
|
|
428
|
+
template <>
|
|
429
|
+
struct gemv_dense_selector<OnTheRight, RowMajor, false> {
|
|
430
|
+
template <typename Lhs, typename Rhs, typename Dest>
|
|
431
|
+
static void run(const Lhs& lhs, const Rhs& rhs, Dest& dest, const typename Dest::Scalar& alpha) {
|
|
432
|
+
EIGEN_STATIC_ASSERT((!nested_eval<Lhs, 1>::Evaluate),
|
|
433
|
+
EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
|
|
434
|
+
typename nested_eval<Rhs, Lhs::RowsAtCompileTime>::type actual_rhs(rhs);
|
|
377
435
|
const Index rows = dest.rows();
|
|
378
|
-
for(Index i=0; i<rows; ++i)
|
|
436
|
+
for (Index i = 0; i < rows; ++i)
|
|
379
437
|
dest.coeffRef(i) += alpha * (lhs.row(i).cwiseProduct(actual_rhs.transpose())).sum();
|
|
380
438
|
}
|
|
381
439
|
};
|
|
382
440
|
|
|
383
|
-
}
|
|
441
|
+
} // end namespace internal
|
|
384
442
|
|
|
385
443
|
/***************************************************************************
|
|
386
|
-
* Implementation of matrix base methods
|
|
387
|
-
***************************************************************************/
|
|
444
|
+
* Implementation of matrix base methods
|
|
445
|
+
***************************************************************************/
|
|
388
446
|
|
|
389
447
|
/** \returns the matrix product of \c *this and \a other.
|
|
390
|
-
|
|
391
|
-
|
|
392
|
-
|
|
393
|
-
|
|
394
|
-
|
|
395
|
-
template<typename Derived>
|
|
396
|
-
template<typename OtherDerived>
|
|
397
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
|
|
398
|
-
const
|
|
399
|
-
MatrixBase<Derived>::operator*(const MatrixBase<OtherDerived> &other) const
|
|
400
|
-
{
|
|
448
|
+
*
|
|
449
|
+
* \note If instead of the matrix product you want the coefficient-wise product, see Cwise::operator*().
|
|
450
|
+
*
|
|
451
|
+
* \sa lazyProduct(), operator*=(const MatrixBase&), Cwise::operator*()
|
|
452
|
+
*/
|
|
453
|
+
template <typename Derived>
|
|
454
|
+
template <typename OtherDerived>
|
|
455
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Product<Derived, OtherDerived> MatrixBase<Derived>::operator*(
|
|
456
|
+
const MatrixBase<OtherDerived>& other) const {
|
|
401
457
|
// A note regarding the function declaration: In MSVC, this function will sometimes
|
|
402
458
|
// not be inlined since DenseStorage is an unwindable object for dynamic
|
|
403
459
|
// matrices and product types are holding a member to store the result.
|
|
404
460
|
// Thus it does not help tagging this function with EIGEN_STRONG_INLINE.
|
|
405
461
|
enum {
|
|
406
|
-
ProductIsValid =
|
|
407
|
-
|
|
408
|
-
|| int(Derived::ColsAtCompileTime)==int(OtherDerived::RowsAtCompileTime),
|
|
462
|
+
ProductIsValid = Derived::ColsAtCompileTime == Dynamic || OtherDerived::RowsAtCompileTime == Dynamic ||
|
|
463
|
+
int(Derived::ColsAtCompileTime) == int(OtherDerived::RowsAtCompileTime),
|
|
409
464
|
AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
|
|
410
|
-
SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived,OtherDerived)
|
|
465
|
+
SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived, OtherDerived)
|
|
411
466
|
};
|
|
412
467
|
// note to the lost user:
|
|
413
468
|
// * for a dot product use: v1.dot(v2)
|
|
414
469
|
// * for a coeff-wise product use: v1.cwiseProduct(v2)
|
|
415
|
-
EIGEN_STATIC_ASSERT(
|
|
416
|
-
|
|
470
|
+
EIGEN_STATIC_ASSERT(
|
|
471
|
+
ProductIsValid || !(AreVectors && SameSizes),
|
|
472
|
+
INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
|
|
417
473
|
EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
|
|
418
|
-
|
|
474
|
+
INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
|
|
419
475
|
EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)
|
|
420
476
|
#ifdef EIGEN_DEBUG_PRODUCT
|
|
421
|
-
internal::product_type<Derived,OtherDerived>::debug();
|
|
477
|
+
internal::product_type<Derived, OtherDerived>::debug();
|
|
422
478
|
#endif
|
|
423
479
|
|
|
424
480
|
return Product<Derived, OtherDerived>(derived(), other.derived());
|
|
425
481
|
}
|
|
426
482
|
|
|
427
483
|
/** \returns an expression of the matrix product of \c *this and \a other without implicit evaluation.
|
|
428
|
-
|
|
429
|
-
|
|
430
|
-
|
|
431
|
-
|
|
432
|
-
|
|
433
|
-
|
|
434
|
-
|
|
435
|
-
|
|
436
|
-
|
|
437
|
-
|
|
438
|
-
template<typename Derived>
|
|
439
|
-
template<typename OtherDerived>
|
|
440
|
-
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
|
|
441
|
-
const
|
|
442
|
-
MatrixBase<Derived>::lazyProduct(const MatrixBase<OtherDerived> &other) const
|
|
443
|
-
{
|
|
484
|
+
*
|
|
485
|
+
* The returned product will behave like any other expressions: the coefficients of the product will be
|
|
486
|
+
* computed once at a time as requested. This might be useful in some extremely rare cases when only
|
|
487
|
+
* a small and no coherent fraction of the result's coefficients have to be computed.
|
|
488
|
+
*
|
|
489
|
+
* \warning This version of the matrix product can be much much slower. So use it only if you know
|
|
490
|
+
* what you are doing and that you measured a true speed improvement.
|
|
491
|
+
*
|
|
492
|
+
* \sa operator*(const MatrixBase&)
|
|
493
|
+
*/
|
|
494
|
+
template <typename Derived>
|
|
495
|
+
template <typename OtherDerived>
|
|
496
|
+
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Product<Derived, OtherDerived, LazyProduct>
|
|
497
|
+
MatrixBase<Derived>::lazyProduct(const MatrixBase<OtherDerived>& other) const {
|
|
444
498
|
enum {
|
|
445
|
-
ProductIsValid =
|
|
446
|
-
|
|
447
|
-
|| int(Derived::ColsAtCompileTime)==int(OtherDerived::RowsAtCompileTime),
|
|
499
|
+
ProductIsValid = Derived::ColsAtCompileTime == Dynamic || OtherDerived::RowsAtCompileTime == Dynamic ||
|
|
500
|
+
int(Derived::ColsAtCompileTime) == int(OtherDerived::RowsAtCompileTime),
|
|
448
501
|
AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
|
|
449
|
-
SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived,OtherDerived)
|
|
502
|
+
SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived, OtherDerived)
|
|
450
503
|
};
|
|
451
504
|
// note to the lost user:
|
|
452
505
|
// * for a dot product use: v1.dot(v2)
|
|
453
506
|
// * for a coeff-wise product use: v1.cwiseProduct(v2)
|
|
454
|
-
EIGEN_STATIC_ASSERT(
|
|
455
|
-
|
|
507
|
+
EIGEN_STATIC_ASSERT(
|
|
508
|
+
ProductIsValid || !(AreVectors && SameSizes),
|
|
509
|
+
INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
|
|
456
510
|
EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
|
|
457
|
-
|
|
511
|
+
INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
|
|
458
512
|
EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)
|
|
459
513
|
|
|
460
|
-
return Product<Derived,OtherDerived,LazyProduct>(derived(), other.derived());
|
|
514
|
+
return Product<Derived, OtherDerived, LazyProduct>(derived(), other.derived());
|
|
461
515
|
}
|
|
462
516
|
|
|
463
|
-
}
|
|
517
|
+
} // end namespace Eigen
|
|
464
518
|
|
|
465
|
-
#endif
|
|
519
|
+
#endif // EIGEN_PRODUCT_H
|