@smake/eigen 1.0.2 → 1.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/eigen/Eigen/AccelerateSupport +52 -0
- package/eigen/Eigen/Cholesky +18 -21
- package/eigen/Eigen/CholmodSupport +28 -28
- package/eigen/Eigen/Core +235 -326
- package/eigen/Eigen/Eigenvalues +16 -14
- package/eigen/Eigen/Geometry +21 -24
- package/eigen/Eigen/Householder +9 -8
- package/eigen/Eigen/IterativeLinearSolvers +8 -4
- package/eigen/Eigen/Jacobi +14 -14
- package/eigen/Eigen/KLUSupport +43 -0
- package/eigen/Eigen/LU +16 -20
- package/eigen/Eigen/MetisSupport +12 -12
- package/eigen/Eigen/OrderingMethods +54 -54
- package/eigen/Eigen/PaStiXSupport +23 -20
- package/eigen/Eigen/PardisoSupport +17 -14
- package/eigen/Eigen/QR +18 -21
- package/eigen/Eigen/QtAlignedMalloc +5 -13
- package/eigen/Eigen/SPQRSupport +21 -14
- package/eigen/Eigen/SVD +23 -18
- package/eigen/Eigen/Sparse +1 -4
- package/eigen/Eigen/SparseCholesky +18 -23
- package/eigen/Eigen/SparseCore +18 -17
- package/eigen/Eigen/SparseLU +12 -8
- package/eigen/Eigen/SparseQR +16 -14
- package/eigen/Eigen/StdDeque +5 -2
- package/eigen/Eigen/StdList +5 -2
- package/eigen/Eigen/StdVector +5 -2
- package/eigen/Eigen/SuperLUSupport +30 -24
- package/eigen/Eigen/ThreadPool +80 -0
- package/eigen/Eigen/UmfPackSupport +19 -17
- package/eigen/Eigen/Version +14 -0
- package/eigen/Eigen/src/AccelerateSupport/AccelerateSupport.h +423 -0
- package/eigen/Eigen/src/AccelerateSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Cholesky/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Cholesky/LDLT.h +377 -401
- package/eigen/Eigen/src/Cholesky/LLT.h +332 -360
- package/eigen/Eigen/src/Cholesky/LLT_LAPACKE.h +81 -56
- package/eigen/Eigen/src/CholmodSupport/CholmodSupport.h +620 -521
- package/eigen/Eigen/src/CholmodSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Core/ArithmeticSequence.h +239 -0
- package/eigen/Eigen/src/Core/Array.h +341 -294
- package/eigen/Eigen/src/Core/ArrayBase.h +190 -203
- package/eigen/Eigen/src/Core/ArrayWrapper.h +127 -171
- package/eigen/Eigen/src/Core/Assign.h +30 -40
- package/eigen/Eigen/src/Core/AssignEvaluator.h +711 -589
- package/eigen/Eigen/src/Core/Assign_MKL.h +130 -125
- package/eigen/Eigen/src/Core/BandMatrix.h +268 -283
- package/eigen/Eigen/src/Core/Block.h +375 -398
- package/eigen/Eigen/src/Core/CommaInitializer.h +86 -97
- package/eigen/Eigen/src/Core/ConditionEstimator.h +51 -53
- package/eigen/Eigen/src/Core/CoreEvaluators.h +1356 -1026
- package/eigen/Eigen/src/Core/CoreIterators.h +73 -59
- package/eigen/Eigen/src/Core/CwiseBinaryOp.h +114 -132
- package/eigen/Eigen/src/Core/CwiseNullaryOp.h +726 -617
- package/eigen/Eigen/src/Core/CwiseTernaryOp.h +77 -103
- package/eigen/Eigen/src/Core/CwiseUnaryOp.h +56 -68
- package/eigen/Eigen/src/Core/CwiseUnaryView.h +132 -95
- package/eigen/Eigen/src/Core/DenseBase.h +632 -571
- package/eigen/Eigen/src/Core/DenseCoeffsBase.h +511 -624
- package/eigen/Eigen/src/Core/DenseStorage.h +512 -509
- package/eigen/Eigen/src/Core/DeviceWrapper.h +153 -0
- package/eigen/Eigen/src/Core/Diagonal.h +169 -210
- package/eigen/Eigen/src/Core/DiagonalMatrix.h +351 -274
- package/eigen/Eigen/src/Core/DiagonalProduct.h +12 -10
- package/eigen/Eigen/src/Core/Dot.h +172 -222
- package/eigen/Eigen/src/Core/EigenBase.h +75 -85
- package/eigen/Eigen/src/Core/Fill.h +138 -0
- package/eigen/Eigen/src/Core/FindCoeff.h +464 -0
- package/eigen/Eigen/src/Core/ForceAlignedAccess.h +90 -109
- package/eigen/Eigen/src/Core/Fuzzy.h +82 -105
- package/eigen/Eigen/src/Core/GeneralProduct.h +327 -263
- package/eigen/Eigen/src/Core/GenericPacketMath.h +1472 -360
- package/eigen/Eigen/src/Core/GlobalFunctions.h +194 -151
- package/eigen/Eigen/src/Core/IO.h +147 -139
- package/eigen/Eigen/src/Core/IndexedView.h +321 -0
- package/eigen/Eigen/src/Core/InnerProduct.h +260 -0
- package/eigen/Eigen/src/Core/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Core/Inverse.h +56 -66
- package/eigen/Eigen/src/Core/Map.h +124 -142
- package/eigen/Eigen/src/Core/MapBase.h +256 -281
- package/eigen/Eigen/src/Core/MathFunctions.h +1620 -938
- package/eigen/Eigen/src/Core/MathFunctionsImpl.h +233 -71
- package/eigen/Eigen/src/Core/Matrix.h +491 -416
- package/eigen/Eigen/src/Core/MatrixBase.h +468 -453
- package/eigen/Eigen/src/Core/NestByValue.h +66 -85
- package/eigen/Eigen/src/Core/NoAlias.h +79 -85
- package/eigen/Eigen/src/Core/NumTraits.h +235 -148
- package/eigen/Eigen/src/Core/PartialReduxEvaluator.h +253 -0
- package/eigen/Eigen/src/Core/PermutationMatrix.h +461 -511
- package/eigen/Eigen/src/Core/PlainObjectBase.h +871 -894
- package/eigen/Eigen/src/Core/Product.h +260 -139
- package/eigen/Eigen/src/Core/ProductEvaluators.h +863 -714
- package/eigen/Eigen/src/Core/Random.h +161 -136
- package/eigen/Eigen/src/Core/RandomImpl.h +262 -0
- package/eigen/Eigen/src/Core/RealView.h +250 -0
- package/eigen/Eigen/src/Core/Redux.h +366 -336
- package/eigen/Eigen/src/Core/Ref.h +308 -209
- package/eigen/Eigen/src/Core/Replicate.h +94 -106
- package/eigen/Eigen/src/Core/Reshaped.h +398 -0
- package/eigen/Eigen/src/Core/ReturnByValue.h +49 -55
- package/eigen/Eigen/src/Core/Reverse.h +136 -145
- package/eigen/Eigen/src/Core/Select.h +70 -140
- package/eigen/Eigen/src/Core/SelfAdjointView.h +262 -285
- package/eigen/Eigen/src/Core/SelfCwiseBinaryOp.h +23 -20
- package/eigen/Eigen/src/Core/SkewSymmetricMatrix3.h +382 -0
- package/eigen/Eigen/src/Core/Solve.h +97 -111
- package/eigen/Eigen/src/Core/SolveTriangular.h +131 -129
- package/eigen/Eigen/src/Core/SolverBase.h +138 -101
- package/eigen/Eigen/src/Core/StableNorm.h +156 -160
- package/eigen/Eigen/src/Core/StlIterators.h +619 -0
- package/eigen/Eigen/src/Core/Stride.h +91 -88
- package/eigen/Eigen/src/Core/Swap.h +70 -38
- package/eigen/Eigen/src/Core/Transpose.h +295 -273
- package/eigen/Eigen/src/Core/Transpositions.h +272 -317
- package/eigen/Eigen/src/Core/TriangularMatrix.h +670 -755
- package/eigen/Eigen/src/Core/VectorBlock.h +59 -72
- package/eigen/Eigen/src/Core/VectorwiseOp.h +668 -630
- package/eigen/Eigen/src/Core/Visitor.h +480 -216
- package/eigen/Eigen/src/Core/arch/AVX/Complex.h +407 -293
- package/eigen/Eigen/src/Core/arch/AVX/MathFunctions.h +79 -388
- package/eigen/Eigen/src/Core/arch/AVX/PacketMath.h +2935 -491
- package/eigen/Eigen/src/Core/arch/AVX/Reductions.h +353 -0
- package/eigen/Eigen/src/Core/arch/AVX/TypeCasting.h +279 -22
- package/eigen/Eigen/src/Core/arch/AVX512/Complex.h +472 -0
- package/eigen/Eigen/src/Core/arch/AVX512/GemmKernel.h +1245 -0
- package/eigen/Eigen/src/Core/arch/AVX512/MathFunctions.h +85 -333
- package/eigen/Eigen/src/Core/arch/AVX512/MathFunctionsFP16.h +75 -0
- package/eigen/Eigen/src/Core/arch/AVX512/PacketMath.h +2490 -649
- package/eigen/Eigen/src/Core/arch/AVX512/PacketMathFP16.h +1413 -0
- package/eigen/Eigen/src/Core/arch/AVX512/Reductions.h +297 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TrsmKernel.h +1167 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TrsmUnrolls.inc +1219 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TypeCasting.h +277 -0
- package/eigen/Eigen/src/Core/arch/AVX512/TypeCastingFP16.h +130 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/Complex.h +521 -298
- package/eigen/Eigen/src/Core/arch/AltiVec/MathFunctions.h +39 -280
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProduct.h +3686 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductCommon.h +205 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMA.h +901 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixProductMMAbfloat16.h +742 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/MatrixVectorProduct.inc +2818 -0
- package/eigen/Eigen/src/Core/arch/AltiVec/PacketMath.h +3391 -723
- package/eigen/Eigen/src/Core/arch/AltiVec/TypeCasting.h +153 -0
- package/eigen/Eigen/src/Core/arch/Default/BFloat16.h +866 -0
- package/eigen/Eigen/src/Core/arch/Default/ConjHelper.h +113 -14
- package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctions.h +2634 -0
- package/eigen/Eigen/src/Core/arch/Default/GenericPacketMathFunctionsFwd.h +227 -0
- package/eigen/Eigen/src/Core/arch/Default/Half.h +1091 -0
- package/eigen/Eigen/src/Core/arch/Default/Settings.h +11 -13
- package/eigen/Eigen/src/Core/arch/GPU/Complex.h +244 -0
- package/eigen/Eigen/src/Core/arch/GPU/MathFunctions.h +104 -0
- package/eigen/Eigen/src/Core/arch/GPU/PacketMath.h +1712 -0
- package/eigen/Eigen/src/Core/arch/GPU/Tuple.h +268 -0
- package/eigen/Eigen/src/Core/arch/GPU/TypeCasting.h +77 -0
- package/eigen/Eigen/src/Core/arch/HIP/hcc/math_constants.h +23 -0
- package/eigen/Eigen/src/Core/arch/HVX/PacketMath.h +1088 -0
- package/eigen/Eigen/src/Core/arch/LSX/Complex.h +520 -0
- package/eigen/Eigen/src/Core/arch/LSX/GeneralBlockPanelKernel.h +23 -0
- package/eigen/Eigen/src/Core/arch/LSX/MathFunctions.h +43 -0
- package/eigen/Eigen/src/Core/arch/LSX/PacketMath.h +2866 -0
- package/eigen/Eigen/src/Core/arch/LSX/TypeCasting.h +526 -0
- package/eigen/Eigen/src/Core/arch/MSA/Complex.h +620 -0
- package/eigen/Eigen/src/Core/arch/MSA/MathFunctions.h +379 -0
- package/eigen/Eigen/src/Core/arch/MSA/PacketMath.h +1237 -0
- package/eigen/Eigen/src/Core/arch/NEON/Complex.h +531 -289
- package/eigen/Eigen/src/Core/arch/NEON/GeneralBlockPanelKernel.h +243 -0
- package/eigen/Eigen/src/Core/arch/NEON/MathFunctions.h +50 -73
- package/eigen/Eigen/src/Core/arch/NEON/PacketMath.h +5915 -579
- package/eigen/Eigen/src/Core/arch/NEON/TypeCasting.h +1642 -0
- package/eigen/Eigen/src/Core/arch/NEON/UnaryFunctors.h +57 -0
- package/eigen/Eigen/src/Core/arch/SSE/Complex.h +366 -334
- package/eigen/Eigen/src/Core/arch/SSE/MathFunctions.h +40 -514
- package/eigen/Eigen/src/Core/arch/SSE/PacketMath.h +2164 -675
- package/eigen/Eigen/src/Core/arch/SSE/Reductions.h +324 -0
- package/eigen/Eigen/src/Core/arch/SSE/TypeCasting.h +188 -35
- package/eigen/Eigen/src/Core/arch/SVE/MathFunctions.h +48 -0
- package/eigen/Eigen/src/Core/arch/SVE/PacketMath.h +674 -0
- package/eigen/Eigen/src/Core/arch/SVE/TypeCasting.h +52 -0
- package/eigen/Eigen/src/Core/arch/SYCL/InteropHeaders.h +227 -0
- package/eigen/Eigen/src/Core/arch/SYCL/MathFunctions.h +303 -0
- package/eigen/Eigen/src/Core/arch/SYCL/PacketMath.h +576 -0
- package/eigen/Eigen/src/Core/arch/SYCL/TypeCasting.h +83 -0
- package/eigen/Eigen/src/Core/arch/ZVector/Complex.h +434 -261
- package/eigen/Eigen/src/Core/arch/ZVector/MathFunctions.h +160 -53
- package/eigen/Eigen/src/Core/arch/ZVector/PacketMath.h +1073 -605
- package/eigen/Eigen/src/Core/functors/AssignmentFunctors.h +123 -117
- package/eigen/Eigen/src/Core/functors/BinaryFunctors.h +594 -322
- package/eigen/Eigen/src/Core/functors/NullaryFunctors.h +204 -118
- package/eigen/Eigen/src/Core/functors/StlFunctors.h +110 -97
- package/eigen/Eigen/src/Core/functors/TernaryFunctors.h +34 -7
- package/eigen/Eigen/src/Core/functors/UnaryFunctors.h +1158 -530
- package/eigen/Eigen/src/Core/products/GeneralBlockPanelKernel.h +2329 -1333
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix.h +328 -364
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular.h +191 -178
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular_BLAS.h +85 -82
- package/eigen/Eigen/src/Core/products/GeneralMatrixMatrix_BLAS.h +154 -73
- package/eigen/Eigen/src/Core/products/GeneralMatrixVector.h +396 -542
- package/eigen/Eigen/src/Core/products/GeneralMatrixVector_BLAS.h +80 -77
- package/eigen/Eigen/src/Core/products/Parallelizer.h +208 -92
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix.h +331 -375
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix_BLAS.h +206 -224
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector.h +139 -146
- package/eigen/Eigen/src/Core/products/SelfadjointMatrixVector_BLAS.h +58 -61
- package/eigen/Eigen/src/Core/products/SelfadjointProduct.h +71 -71
- package/eigen/Eigen/src/Core/products/SelfadjointRank2Update.h +48 -46
- package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix.h +294 -369
- package/eigen/Eigen/src/Core/products/TriangularMatrixMatrix_BLAS.h +246 -238
- package/eigen/Eigen/src/Core/products/TriangularMatrixVector.h +244 -247
- package/eigen/Eigen/src/Core/products/TriangularMatrixVector_BLAS.h +212 -192
- package/eigen/Eigen/src/Core/products/TriangularSolverMatrix.h +328 -275
- package/eigen/Eigen/src/Core/products/TriangularSolverMatrix_BLAS.h +108 -109
- package/eigen/Eigen/src/Core/products/TriangularSolverVector.h +70 -93
- package/eigen/Eigen/src/Core/util/Assert.h +158 -0
- package/eigen/Eigen/src/Core/util/BlasUtil.h +413 -290
- package/eigen/Eigen/src/Core/util/ConfigureVectorization.h +543 -0
- package/eigen/Eigen/src/Core/util/Constants.h +314 -263
- package/eigen/Eigen/src/Core/util/DisableStupidWarnings.h +130 -78
- package/eigen/Eigen/src/Core/util/EmulateArray.h +270 -0
- package/eigen/Eigen/src/Core/util/ForwardDeclarations.h +450 -224
- package/eigen/Eigen/src/Core/util/GpuHipCudaDefines.inc +101 -0
- package/eigen/Eigen/src/Core/util/GpuHipCudaUndefines.inc +45 -0
- package/eigen/Eigen/src/Core/util/IndexedViewHelper.h +487 -0
- package/eigen/Eigen/src/Core/util/IntegralConstant.h +279 -0
- package/eigen/Eigen/src/Core/util/MKL_support.h +39 -30
- package/eigen/Eigen/src/Core/util/Macros.h +939 -646
- package/eigen/Eigen/src/Core/util/MaxSizeVector.h +139 -0
- package/eigen/Eigen/src/Core/util/Memory.h +1042 -650
- package/eigen/Eigen/src/Core/util/Meta.h +618 -426
- package/eigen/Eigen/src/Core/util/MoreMeta.h +638 -0
- package/eigen/Eigen/src/Core/util/ReenableStupidWarnings.h +32 -19
- package/eigen/Eigen/src/Core/util/ReshapedHelper.h +51 -0
- package/eigen/Eigen/src/Core/util/Serializer.h +209 -0
- package/eigen/Eigen/src/Core/util/StaticAssert.h +51 -164
- package/eigen/Eigen/src/Core/util/SymbolicIndex.h +445 -0
- package/eigen/Eigen/src/Core/util/XprHelper.h +793 -538
- package/eigen/Eigen/src/Eigenvalues/ComplexEigenSolver.h +246 -277
- package/eigen/Eigen/src/Eigenvalues/ComplexSchur.h +299 -319
- package/eigen/Eigen/src/Eigenvalues/ComplexSchur_LAPACKE.h +52 -48
- package/eigen/Eigen/src/Eigenvalues/EigenSolver.h +413 -456
- package/eigen/Eigen/src/Eigenvalues/GeneralizedEigenSolver.h +309 -325
- package/eigen/Eigen/src/Eigenvalues/GeneralizedSelfAdjointEigenSolver.h +157 -171
- package/eigen/Eigen/src/Eigenvalues/HessenbergDecomposition.h +292 -310
- package/eigen/Eigen/src/Eigenvalues/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Eigenvalues/MatrixBaseEigenvalues.h +91 -107
- package/eigen/Eigen/src/Eigenvalues/RealQZ.h +539 -606
- package/eigen/Eigen/src/Eigenvalues/RealSchur.h +348 -382
- package/eigen/Eigen/src/Eigenvalues/RealSchur_LAPACKE.h +41 -35
- package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h +579 -600
- package/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver_LAPACKE.h +47 -44
- package/eigen/Eigen/src/Eigenvalues/Tridiagonalization.h +434 -461
- package/eigen/Eigen/src/Geometry/AlignedBox.h +307 -214
- package/eigen/Eigen/src/Geometry/AngleAxis.h +135 -137
- package/eigen/Eigen/src/Geometry/EulerAngles.h +163 -74
- package/eigen/Eigen/src/Geometry/Homogeneous.h +289 -333
- package/eigen/Eigen/src/Geometry/Hyperplane.h +152 -161
- package/eigen/Eigen/src/Geometry/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Geometry/OrthoMethods.h +168 -145
- package/eigen/Eigen/src/Geometry/ParametrizedLine.h +141 -104
- package/eigen/Eigen/src/Geometry/Quaternion.h +595 -497
- package/eigen/Eigen/src/Geometry/Rotation2D.h +110 -108
- package/eigen/Eigen/src/Geometry/RotationBase.h +148 -145
- package/eigen/Eigen/src/Geometry/Scaling.h +115 -90
- package/eigen/Eigen/src/Geometry/Transform.h +896 -953
- package/eigen/Eigen/src/Geometry/Translation.h +100 -98
- package/eigen/Eigen/src/Geometry/Umeyama.h +79 -84
- package/eigen/Eigen/src/Geometry/arch/Geometry_SIMD.h +154 -0
- package/eigen/Eigen/src/Householder/BlockHouseholder.h +54 -42
- package/eigen/Eigen/src/Householder/Householder.h +104 -122
- package/eigen/Eigen/src/Householder/HouseholderSequence.h +416 -382
- package/eigen/Eigen/src/Householder/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/IterativeLinearSolvers/BasicPreconditioners.h +153 -166
- package/eigen/Eigen/src/IterativeLinearSolvers/BiCGSTAB.h +127 -138
- package/eigen/Eigen/src/IterativeLinearSolvers/ConjugateGradient.h +95 -124
- package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteCholesky.h +269 -267
- package/eigen/Eigen/src/IterativeLinearSolvers/IncompleteLUT.h +246 -259
- package/eigen/Eigen/src/IterativeLinearSolvers/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/IterativeLinearSolvers/IterativeSolverBase.h +218 -217
- package/eigen/Eigen/src/IterativeLinearSolvers/LeastSquareConjugateGradient.h +80 -103
- package/eigen/Eigen/src/IterativeLinearSolvers/SolveWithGuess.h +59 -63
- package/eigen/Eigen/src/Jacobi/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/Jacobi/Jacobi.h +256 -291
- package/eigen/Eigen/src/KLUSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/KLUSupport/KLUSupport.h +339 -0
- package/eigen/Eigen/src/LU/Determinant.h +60 -63
- package/eigen/Eigen/src/LU/FullPivLU.h +561 -626
- package/eigen/Eigen/src/LU/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/LU/InverseImpl.h +213 -275
- package/eigen/Eigen/src/LU/PartialPivLU.h +407 -435
- package/eigen/Eigen/src/LU/PartialPivLU_LAPACKE.h +54 -40
- package/eigen/Eigen/src/LU/arch/InverseSize4.h +353 -0
- package/eigen/Eigen/src/MetisSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/MetisSupport/MetisSupport.h +81 -93
- package/eigen/Eigen/src/OrderingMethods/Amd.h +250 -282
- package/eigen/Eigen/src/OrderingMethods/Eigen_Colamd.h +950 -1103
- package/eigen/Eigen/src/OrderingMethods/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/OrderingMethods/Ordering.h +111 -122
- package/eigen/Eigen/src/PaStiXSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/PaStiXSupport/PaStiXSupport.h +524 -570
- package/eigen/Eigen/src/PardisoSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/PardisoSupport/PardisoSupport.h +385 -429
- package/eigen/Eigen/src/QR/ColPivHouseholderQR.h +494 -473
- package/eigen/Eigen/src/QR/ColPivHouseholderQR_LAPACKE.h +120 -56
- package/eigen/Eigen/src/QR/CompleteOrthogonalDecomposition.h +223 -137
- package/eigen/Eigen/src/QR/FullPivHouseholderQR.h +517 -460
- package/eigen/Eigen/src/QR/HouseholderQR.h +412 -278
- package/eigen/Eigen/src/QR/HouseholderQR_LAPACKE.h +32 -23
- package/eigen/Eigen/src/QR/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SPQRSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SPQRSupport/SuiteSparseQRSupport.h +263 -261
- package/eigen/Eigen/src/SVD/BDCSVD.h +872 -679
- package/eigen/Eigen/src/SVD/BDCSVD_LAPACKE.h +174 -0
- package/eigen/Eigen/src/SVD/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SVD/JacobiSVD.h +585 -543
- package/eigen/Eigen/src/SVD/JacobiSVD_LAPACKE.h +85 -49
- package/eigen/Eigen/src/SVD/SVDBase.h +281 -160
- package/eigen/Eigen/src/SVD/UpperBidiagonalization.h +202 -237
- package/eigen/Eigen/src/SparseCholesky/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky.h +769 -590
- package/eigen/Eigen/src/SparseCholesky/SimplicialCholesky_impl.h +318 -129
- package/eigen/Eigen/src/SparseCore/AmbiVector.h +202 -251
- package/eigen/Eigen/src/SparseCore/CompressedStorage.h +184 -236
- package/eigen/Eigen/src/SparseCore/ConservativeSparseSparseProduct.h +140 -184
- package/eigen/Eigen/src/SparseCore/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseCore/SparseAssign.h +174 -111
- package/eigen/Eigen/src/SparseCore/SparseBlock.h +408 -477
- package/eigen/Eigen/src/SparseCore/SparseColEtree.h +100 -112
- package/eigen/Eigen/src/SparseCore/SparseCompressedBase.h +531 -280
- package/eigen/Eigen/src/SparseCore/SparseCwiseBinaryOp.h +559 -347
- package/eigen/Eigen/src/SparseCore/SparseCwiseUnaryOp.h +100 -108
- package/eigen/Eigen/src/SparseCore/SparseDenseProduct.h +185 -191
- package/eigen/Eigen/src/SparseCore/SparseDiagonalProduct.h +71 -71
- package/eigen/Eigen/src/SparseCore/SparseDot.h +49 -47
- package/eigen/Eigen/src/SparseCore/SparseFuzzy.h +13 -11
- package/eigen/Eigen/src/SparseCore/SparseMap.h +243 -253
- package/eigen/Eigen/src/SparseCore/SparseMatrix.h +1614 -1142
- package/eigen/Eigen/src/SparseCore/SparseMatrixBase.h +403 -357
- package/eigen/Eigen/src/SparseCore/SparsePermutation.h +186 -115
- package/eigen/Eigen/src/SparseCore/SparseProduct.h +100 -91
- package/eigen/Eigen/src/SparseCore/SparseRedux.h +22 -24
- package/eigen/Eigen/src/SparseCore/SparseRef.h +268 -295
- package/eigen/Eigen/src/SparseCore/SparseSelfAdjointView.h +371 -414
- package/eigen/Eigen/src/SparseCore/SparseSolverBase.h +78 -87
- package/eigen/Eigen/src/SparseCore/SparseSparseProductWithPruning.h +81 -95
- package/eigen/Eigen/src/SparseCore/SparseTranspose.h +62 -71
- package/eigen/Eigen/src/SparseCore/SparseTriangularView.h +132 -144
- package/eigen/Eigen/src/SparseCore/SparseUtil.h +146 -115
- package/eigen/Eigen/src/SparseCore/SparseVector.h +426 -372
- package/eigen/Eigen/src/SparseCore/SparseView.h +164 -193
- package/eigen/Eigen/src/SparseCore/TriangularSolver.h +129 -170
- package/eigen/Eigen/src/SparseLU/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseLU/SparseLU.h +814 -618
- package/eigen/Eigen/src/SparseLU/SparseLUImpl.h +61 -48
- package/eigen/Eigen/src/SparseLU/SparseLU_Memory.h +102 -118
- package/eigen/Eigen/src/SparseLU/SparseLU_Structs.h +38 -35
- package/eigen/Eigen/src/SparseLU/SparseLU_SupernodalMatrix.h +273 -255
- package/eigen/Eigen/src/SparseLU/SparseLU_Utils.h +44 -49
- package/eigen/Eigen/src/SparseLU/SparseLU_column_bmod.h +104 -108
- package/eigen/Eigen/src/SparseLU/SparseLU_column_dfs.h +90 -101
- package/eigen/Eigen/src/SparseLU/SparseLU_copy_to_ucol.h +57 -58
- package/eigen/Eigen/src/SparseLU/SparseLU_heap_relax_snode.h +43 -55
- package/eigen/Eigen/src/SparseLU/SparseLU_kernel_bmod.h +74 -71
- package/eigen/Eigen/src/SparseLU/SparseLU_panel_bmod.h +125 -133
- package/eigen/Eigen/src/SparseLU/SparseLU_panel_dfs.h +136 -159
- package/eigen/Eigen/src/SparseLU/SparseLU_pivotL.h +51 -52
- package/eigen/Eigen/src/SparseLU/SparseLU_pruneL.h +67 -73
- package/eigen/Eigen/src/SparseLU/SparseLU_relax_snode.h +24 -26
- package/eigen/Eigen/src/SparseQR/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SparseQR/SparseQR.h +451 -490
- package/eigen/Eigen/src/StlSupport/StdDeque.h +28 -105
- package/eigen/Eigen/src/StlSupport/StdList.h +28 -84
- package/eigen/Eigen/src/StlSupport/StdVector.h +28 -108
- package/eigen/Eigen/src/StlSupport/details.h +48 -50
- package/eigen/Eigen/src/SuperLUSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/SuperLUSupport/SuperLUSupport.h +634 -732
- package/eigen/Eigen/src/ThreadPool/Barrier.h +70 -0
- package/eigen/Eigen/src/ThreadPool/CoreThreadPoolDevice.h +336 -0
- package/eigen/Eigen/src/ThreadPool/EventCount.h +241 -0
- package/eigen/Eigen/src/ThreadPool/ForkJoin.h +140 -0
- package/eigen/Eigen/src/ThreadPool/InternalHeaderCheck.h +4 -0
- package/eigen/Eigen/src/ThreadPool/NonBlockingThreadPool.h +587 -0
- package/eigen/Eigen/src/ThreadPool/RunQueue.h +230 -0
- package/eigen/Eigen/src/ThreadPool/ThreadCancel.h +21 -0
- package/eigen/Eigen/src/ThreadPool/ThreadEnvironment.h +43 -0
- package/eigen/Eigen/src/ThreadPool/ThreadLocal.h +289 -0
- package/eigen/Eigen/src/ThreadPool/ThreadPoolInterface.h +50 -0
- package/eigen/Eigen/src/ThreadPool/ThreadYield.h +16 -0
- package/eigen/Eigen/src/UmfPackSupport/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/UmfPackSupport/UmfPackSupport.h +480 -380
- package/eigen/Eigen/src/misc/Image.h +41 -43
- package/eigen/Eigen/src/misc/InternalHeaderCheck.h +3 -0
- package/eigen/Eigen/src/misc/Kernel.h +39 -41
- package/eigen/Eigen/src/misc/RealSvd2x2.h +19 -21
- package/eigen/Eigen/src/misc/blas.h +83 -426
- package/eigen/Eigen/src/misc/lapacke.h +9976 -16182
- package/eigen/Eigen/src/misc/lapacke_helpers.h +163 -0
- package/eigen/Eigen/src/misc/lapacke_mangling.h +4 -5
- package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.inc +344 -0
- package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.inc +544 -0
- package/eigen/Eigen/src/plugins/BlockMethods.inc +1370 -0
- package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.inc +116 -0
- package/eigen/Eigen/src/plugins/CommonCwiseUnaryOps.inc +167 -0
- package/eigen/Eigen/src/plugins/IndexedViewMethods.inc +192 -0
- package/eigen/Eigen/src/plugins/InternalHeaderCheck.inc +3 -0
- package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.inc +331 -0
- package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.inc +118 -0
- package/eigen/Eigen/src/plugins/ReshapedMethods.inc +133 -0
- package/lib/LibEigen.d.ts +4 -0
- package/lib/LibEigen.js +14 -0
- package/lib/index.d.ts +1 -1
- package/lib/index.js +7 -3
- package/package.json +2 -10
- package/eigen/Eigen/CMakeLists.txt +0 -19
- package/eigen/Eigen/src/Core/BooleanRedux.h +0 -164
- package/eigen/Eigen/src/Core/arch/CUDA/Complex.h +0 -103
- package/eigen/Eigen/src/Core/arch/CUDA/Half.h +0 -675
- package/eigen/Eigen/src/Core/arch/CUDA/MathFunctions.h +0 -91
- package/eigen/Eigen/src/Core/arch/CUDA/PacketMath.h +0 -333
- package/eigen/Eigen/src/Core/arch/CUDA/PacketMathHalf.h +0 -1124
- package/eigen/Eigen/src/Core/arch/CUDA/TypeCasting.h +0 -212
- package/eigen/Eigen/src/Core/util/NonMPL2.h +0 -3
- package/eigen/Eigen/src/Geometry/arch/Geometry_SSE.h +0 -161
- package/eigen/Eigen/src/LU/arch/Inverse_SSE.h +0 -338
- package/eigen/Eigen/src/SparseCore/MappedSparseMatrix.h +0 -67
- package/eigen/Eigen/src/SparseLU/SparseLU_gemm_kernel.h +0 -280
- package/eigen/Eigen/src/misc/lapack.h +0 -152
- package/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.h +0 -332
- package/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.h +0 -552
- package/eigen/Eigen/src/plugins/BlockMethods.h +0 -1058
- package/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.h +0 -115
- package/eigen/Eigen/src/plugins/CommonCwiseUnaryOps.h +0 -163
- package/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.h +0 -152
- package/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.h +0 -85
- package/lib/eigen.d.ts +0 -2
- package/lib/eigen.js +0 -15
|
@@ -11,78 +11,195 @@
|
|
|
11
11
|
#ifndef EIGEN_COMPLEX_NEON_H
|
|
12
12
|
#define EIGEN_COMPLEX_NEON_H
|
|
13
13
|
|
|
14
|
+
// IWYU pragma: private
|
|
15
|
+
#include "../../InternalHeaderCheck.h"
|
|
16
|
+
|
|
14
17
|
namespace Eigen {
|
|
15
18
|
|
|
16
19
|
namespace internal {
|
|
17
20
|
|
|
18
21
|
inline uint32x4_t p4ui_CONJ_XOR() {
|
|
19
22
|
// See bug 1325, clang fails to call vld1q_u64.
|
|
20
|
-
#if EIGEN_COMP_CLANG
|
|
21
|
-
uint32x4_t ret = {
|
|
23
|
+
#if EIGEN_COMP_CLANG || EIGEN_COMP_CASTXML
|
|
24
|
+
uint32x4_t ret = {0x00000000, 0x80000000, 0x00000000, 0x80000000};
|
|
22
25
|
return ret;
|
|
23
26
|
#else
|
|
24
|
-
static const uint32_t conj_XOR_DATA[] = {
|
|
25
|
-
return vld1q_u32(
|
|
27
|
+
static const uint32_t conj_XOR_DATA[] = {0x00000000, 0x80000000, 0x00000000, 0x80000000};
|
|
28
|
+
return vld1q_u32(conj_XOR_DATA);
|
|
26
29
|
#endif
|
|
27
30
|
}
|
|
28
31
|
|
|
29
32
|
inline uint32x2_t p2ui_CONJ_XOR() {
|
|
30
|
-
static const uint32_t conj_XOR_DATA[] = {
|
|
31
|
-
return vld1_u32(
|
|
33
|
+
static const uint32_t conj_XOR_DATA[] = {0x00000000, 0x80000000};
|
|
34
|
+
return vld1_u32(conj_XOR_DATA);
|
|
32
35
|
}
|
|
33
36
|
|
|
34
37
|
//---------- float ----------
|
|
35
|
-
|
|
36
|
-
{
|
|
38
|
+
|
|
39
|
+
struct Packet1cf {
|
|
40
|
+
EIGEN_STRONG_INLINE Packet1cf() {}
|
|
41
|
+
EIGEN_STRONG_INLINE explicit Packet1cf(const Packet2f& a) : v(a) {}
|
|
42
|
+
Packet2f v;
|
|
43
|
+
};
|
|
44
|
+
struct Packet2cf {
|
|
37
45
|
EIGEN_STRONG_INLINE Packet2cf() {}
|
|
38
46
|
EIGEN_STRONG_INLINE explicit Packet2cf(const Packet4f& a) : v(a) {}
|
|
39
|
-
Packet4f
|
|
47
|
+
Packet4f v;
|
|
40
48
|
};
|
|
41
49
|
|
|
42
|
-
template<>
|
|
43
|
-
{
|
|
50
|
+
template <>
|
|
51
|
+
struct packet_traits<std::complex<float>> : default_packet_traits {
|
|
44
52
|
typedef Packet2cf type;
|
|
45
|
-
typedef
|
|
53
|
+
typedef Packet1cf half;
|
|
46
54
|
enum {
|
|
47
55
|
Vectorizable = 1,
|
|
48
56
|
AlignedOnScalar = 1,
|
|
49
57
|
size = 2,
|
|
50
|
-
HasHalfPacket = 0,
|
|
51
58
|
|
|
52
|
-
HasAdd
|
|
53
|
-
HasSub
|
|
54
|
-
HasMul
|
|
55
|
-
HasDiv
|
|
59
|
+
HasAdd = 1,
|
|
60
|
+
HasSub = 1,
|
|
61
|
+
HasMul = 1,
|
|
62
|
+
HasDiv = 1,
|
|
56
63
|
HasNegate = 1,
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
64
|
+
HasSqrt = 1,
|
|
65
|
+
HasLog = 1,
|
|
66
|
+
HasExp = 1,
|
|
67
|
+
HasAbs = 0,
|
|
68
|
+
HasAbs2 = 0,
|
|
69
|
+
HasMin = 0,
|
|
70
|
+
HasMax = 0,
|
|
61
71
|
HasSetLinear = 0
|
|
62
72
|
};
|
|
63
73
|
};
|
|
64
74
|
|
|
65
|
-
template<>
|
|
75
|
+
template <>
|
|
76
|
+
struct unpacket_traits<Packet1cf> : neon_unpacket_default<Packet1cf, std::complex<float>> {
|
|
77
|
+
using as_real = Packet2f;
|
|
78
|
+
};
|
|
79
|
+
template <>
|
|
80
|
+
struct unpacket_traits<Packet2cf> : neon_unpacket_default<Packet2cf, std::complex<float>> {
|
|
81
|
+
using half = Packet1cf;
|
|
82
|
+
using as_real = Packet4f;
|
|
83
|
+
};
|
|
84
|
+
|
|
85
|
+
template <>
|
|
86
|
+
EIGEN_STRONG_INLINE Packet1cf pcast<float, Packet1cf>(const float& a) {
|
|
87
|
+
return Packet1cf(vset_lane_f32(a, vdup_n_f32(0.f), 0));
|
|
88
|
+
}
|
|
89
|
+
template <>
|
|
90
|
+
EIGEN_STRONG_INLINE Packet2cf pcast<Packet2f, Packet2cf>(const Packet2f& a) {
|
|
91
|
+
return Packet2cf(vreinterpretq_f32_u64(vmovl_u32(vreinterpret_u32_f32(a))));
|
|
92
|
+
}
|
|
93
|
+
|
|
94
|
+
template <>
|
|
95
|
+
EIGEN_STRONG_INLINE Packet1cf pzero(const Packet1cf& /*a*/) {
|
|
96
|
+
return Packet1cf(vdup_n_f32(0.0f));
|
|
97
|
+
}
|
|
66
98
|
|
|
67
|
-
template<>
|
|
68
|
-
{
|
|
69
|
-
|
|
70
|
-
|
|
99
|
+
template <>
|
|
100
|
+
EIGEN_STRONG_INLINE Packet2cf pzero(const Packet2cf& /*a*/) {
|
|
101
|
+
return Packet2cf(vdupq_n_f32(0.0f));
|
|
102
|
+
}
|
|
71
103
|
|
|
104
|
+
template <>
|
|
105
|
+
EIGEN_STRONG_INLINE Packet1cf pset1<Packet1cf>(const std::complex<float>& from) {
|
|
106
|
+
return Packet1cf(vld1_f32(reinterpret_cast<const float*>(&from)));
|
|
107
|
+
}
|
|
108
|
+
template <>
|
|
109
|
+
EIGEN_STRONG_INLINE Packet2cf pset1<Packet2cf>(const std::complex<float>& from) {
|
|
110
|
+
const float32x2_t r64 = vld1_f32(reinterpret_cast<const float*>(&from));
|
|
72
111
|
return Packet2cf(vcombine_f32(r64, r64));
|
|
73
112
|
}
|
|
74
113
|
|
|
75
|
-
template<>
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
114
|
+
template <>
|
|
115
|
+
EIGEN_STRONG_INLINE Packet1cf padd<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
116
|
+
return Packet1cf(padd<Packet2f>(a.v, b.v));
|
|
117
|
+
}
|
|
118
|
+
template <>
|
|
119
|
+
EIGEN_STRONG_INLINE Packet2cf padd<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
120
|
+
return Packet2cf(padd<Packet4f>(a.v, b.v));
|
|
121
|
+
}
|
|
122
|
+
|
|
123
|
+
template <>
|
|
124
|
+
EIGEN_STRONG_INLINE Packet1cf psub<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
125
|
+
return Packet1cf(psub<Packet2f>(a.v, b.v));
|
|
126
|
+
}
|
|
127
|
+
template <>
|
|
128
|
+
EIGEN_STRONG_INLINE Packet2cf psub<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
129
|
+
return Packet2cf(psub<Packet4f>(a.v, b.v));
|
|
130
|
+
}
|
|
131
|
+
|
|
132
|
+
template <>
|
|
133
|
+
EIGEN_STRONG_INLINE Packet1cf pnegate(const Packet1cf& a) {
|
|
134
|
+
return Packet1cf(pnegate<Packet2f>(a.v));
|
|
135
|
+
}
|
|
136
|
+
template <>
|
|
137
|
+
EIGEN_STRONG_INLINE Packet2cf pnegate(const Packet2cf& a) {
|
|
138
|
+
return Packet2cf(pnegate<Packet4f>(a.v));
|
|
139
|
+
}
|
|
140
|
+
|
|
141
|
+
template <>
|
|
142
|
+
EIGEN_STRONG_INLINE Packet1cf pconj(const Packet1cf& a) {
|
|
143
|
+
const Packet2ui b = Packet2ui(vreinterpret_u32_f32(a.v));
|
|
144
|
+
return Packet1cf(vreinterpret_f32_u32(veor_u32(b, p2ui_CONJ_XOR())));
|
|
145
|
+
}
|
|
146
|
+
template <>
|
|
147
|
+
EIGEN_STRONG_INLINE Packet2cf pconj(const Packet2cf& a) {
|
|
148
|
+
const Packet4ui b = Packet4ui(vreinterpretq_u32_f32(a.v));
|
|
81
149
|
return Packet2cf(vreinterpretq_f32_u32(veorq_u32(b, p4ui_CONJ_XOR())));
|
|
82
150
|
}
|
|
83
151
|
|
|
84
|
-
|
|
85
|
-
|
|
152
|
+
#ifdef __ARM_FEATURE_COMPLEX
|
|
153
|
+
template <>
|
|
154
|
+
EIGEN_STRONG_INLINE Packet1cf pmadd<Packet1cf>(const Packet1cf& a, const Packet1cf& b, const Packet1cf& c) {
|
|
155
|
+
Packet1cf result;
|
|
156
|
+
result.v = vcmla_f32(c.v, a.v, b.v);
|
|
157
|
+
result.v = vcmla_rot90_f32(result.v, a.v, b.v);
|
|
158
|
+
return result;
|
|
159
|
+
}
|
|
160
|
+
|
|
161
|
+
template <>
|
|
162
|
+
EIGEN_STRONG_INLINE Packet1cf pmul<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
163
|
+
return pmadd(a, b, pzero(a));
|
|
164
|
+
}
|
|
165
|
+
#else
|
|
166
|
+
template <>
|
|
167
|
+
EIGEN_STRONG_INLINE Packet1cf pmul<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
168
|
+
Packet2f v1, v2;
|
|
169
|
+
|
|
170
|
+
// Get the real values of a | a1_re | a1_re |
|
|
171
|
+
v1 = vdup_lane_f32(a.v, 0);
|
|
172
|
+
// Get the imag values of a | a1_im | a1_im |
|
|
173
|
+
v2 = vdup_lane_f32(a.v, 1);
|
|
174
|
+
// Multiply the real a with b
|
|
175
|
+
v1 = vmul_f32(v1, b.v);
|
|
176
|
+
// Multiply the imag a with b
|
|
177
|
+
v2 = vmul_f32(v2, b.v);
|
|
178
|
+
// Conjugate v2
|
|
179
|
+
v2 = vreinterpret_f32_u32(veor_u32(vreinterpret_u32_f32(v2), p2ui_CONJ_XOR()));
|
|
180
|
+
// Swap real/imag elements in v2.
|
|
181
|
+
v2 = vrev64_f32(v2);
|
|
182
|
+
// Add and return the result
|
|
183
|
+
return Packet1cf(vadd_f32(v1, v2));
|
|
184
|
+
}
|
|
185
|
+
#endif
|
|
186
|
+
|
|
187
|
+
#ifdef __ARM_FEATURE_COMPLEX
|
|
188
|
+
template <>
|
|
189
|
+
EIGEN_STRONG_INLINE Packet2cf pmadd<Packet2cf>(const Packet2cf& a, const Packet2cf& b, const Packet2cf& c) {
|
|
190
|
+
Packet2cf result;
|
|
191
|
+
result.v = vcmlaq_f32(c.v, a.v, b.v);
|
|
192
|
+
result.v = vcmlaq_rot90_f32(result.v, a.v, b.v);
|
|
193
|
+
return result;
|
|
194
|
+
}
|
|
195
|
+
|
|
196
|
+
template <>
|
|
197
|
+
EIGEN_STRONG_INLINE Packet2cf pmul<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
198
|
+
return pmadd(a, b, pzero(a));
|
|
199
|
+
}
|
|
200
|
+
#else
|
|
201
|
+
template <>
|
|
202
|
+
EIGEN_STRONG_INLINE Packet2cf pmul<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
86
203
|
Packet4f v1, v2;
|
|
87
204
|
|
|
88
205
|
// Get the real values of a | a1_re | a1_re | a2_re | a2_re |
|
|
@@ -93,114 +210,214 @@ template<> EIGEN_STRONG_INLINE Packet2cf pmul<Packet2cf>(const Packet2cf& a, con
|
|
|
93
210
|
v1 = vmulq_f32(v1, b.v);
|
|
94
211
|
// Multiply the imag a with b
|
|
95
212
|
v2 = vmulq_f32(v2, b.v);
|
|
96
|
-
// Conjugate v2
|
|
213
|
+
// Conjugate v2
|
|
97
214
|
v2 = vreinterpretq_f32_u32(veorq_u32(vreinterpretq_u32_f32(v2), p4ui_CONJ_XOR()));
|
|
98
215
|
// Swap real/imag elements in v2.
|
|
99
216
|
v2 = vrev64q_f32(v2);
|
|
100
217
|
// Add and return the result
|
|
101
218
|
return Packet2cf(vaddq_f32(v1, v2));
|
|
102
219
|
}
|
|
220
|
+
#endif
|
|
221
|
+
|
|
222
|
+
template <>
|
|
223
|
+
EIGEN_STRONG_INLINE Packet1cf pcmp_eq(const Packet1cf& a, const Packet1cf& b) {
|
|
224
|
+
// Compare real and imaginary parts of a and b to get the mask vector:
|
|
225
|
+
// [re(a[0])==re(b[0]), im(a[0])==im(b[0])]
|
|
226
|
+
Packet2f eq = pcmp_eq<Packet2f>(a.v, b.v);
|
|
227
|
+
// Swap real/imag elements in the mask in to get:
|
|
228
|
+
// [im(a[0])==im(b[0]), re(a[0])==re(b[0])]
|
|
229
|
+
Packet2f eq_swapped = vrev64_f32(eq);
|
|
230
|
+
// Return re(a)==re(b) && im(a)==im(b) by computing bitwise AND of eq and eq_swapped
|
|
231
|
+
return Packet1cf(pand<Packet2f>(eq, eq_swapped));
|
|
232
|
+
}
|
|
233
|
+
template <>
|
|
234
|
+
EIGEN_STRONG_INLINE Packet2cf pcmp_eq(const Packet2cf& a, const Packet2cf& b) {
|
|
235
|
+
// Compare real and imaginary parts of a and b to get the mask vector:
|
|
236
|
+
// [re(a[0])==re(b[0]), im(a[0])==im(b[0]), re(a[1])==re(b[1]), im(a[1])==im(b[1])]
|
|
237
|
+
Packet4f eq = pcmp_eq<Packet4f>(a.v, b.v);
|
|
238
|
+
// Swap real/imag elements in the mask in to get:
|
|
239
|
+
// [im(a[0])==im(b[0]), re(a[0])==re(b[0]), im(a[1])==im(b[1]), re(a[1])==re(b[1])]
|
|
240
|
+
Packet4f eq_swapped = vrev64q_f32(eq);
|
|
241
|
+
// Return re(a)==re(b) && im(a)==im(b) by computing bitwise AND of eq and eq_swapped
|
|
242
|
+
return Packet2cf(pand<Packet4f>(eq, eq_swapped));
|
|
243
|
+
}
|
|
244
|
+
|
|
245
|
+
template <>
|
|
246
|
+
EIGEN_STRONG_INLINE Packet1cf pand<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
247
|
+
return Packet1cf(vreinterpret_f32_u32(vand_u32(vreinterpret_u32_f32(a.v), vreinterpret_u32_f32(b.v))));
|
|
248
|
+
}
|
|
249
|
+
template <>
|
|
250
|
+
EIGEN_STRONG_INLINE Packet2cf pand<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
251
|
+
return Packet2cf(vreinterpretq_f32_u32(vandq_u32(vreinterpretq_u32_f32(a.v), vreinterpretq_u32_f32(b.v))));
|
|
252
|
+
}
|
|
103
253
|
|
|
104
|
-
template<>
|
|
105
|
-
{
|
|
106
|
-
return
|
|
254
|
+
template <>
|
|
255
|
+
EIGEN_STRONG_INLINE Packet1cf por<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
256
|
+
return Packet1cf(vreinterpret_f32_u32(vorr_u32(vreinterpret_u32_f32(a.v), vreinterpret_u32_f32(b.v))));
|
|
107
257
|
}
|
|
108
|
-
template<>
|
|
109
|
-
{
|
|
110
|
-
return Packet2cf(vreinterpretq_f32_u32(vorrq_u32(vreinterpretq_u32_f32(a.v),vreinterpretq_u32_f32(b.v))));
|
|
258
|
+
template <>
|
|
259
|
+
EIGEN_STRONG_INLINE Packet2cf por<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
260
|
+
return Packet2cf(vreinterpretq_f32_u32(vorrq_u32(vreinterpretq_u32_f32(a.v), vreinterpretq_u32_f32(b.v))));
|
|
111
261
|
}
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
262
|
+
|
|
263
|
+
template <>
|
|
264
|
+
EIGEN_STRONG_INLINE Packet1cf pxor<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
265
|
+
return Packet1cf(vreinterpret_f32_u32(veor_u32(vreinterpret_u32_f32(a.v), vreinterpret_u32_f32(b.v))));
|
|
115
266
|
}
|
|
116
|
-
template<>
|
|
117
|
-
{
|
|
118
|
-
return Packet2cf(vreinterpretq_f32_u32(
|
|
267
|
+
template <>
|
|
268
|
+
EIGEN_STRONG_INLINE Packet2cf pxor<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
269
|
+
return Packet2cf(vreinterpretq_f32_u32(veorq_u32(vreinterpretq_u32_f32(a.v), vreinterpretq_u32_f32(b.v))));
|
|
119
270
|
}
|
|
120
271
|
|
|
121
|
-
template<>
|
|
122
|
-
|
|
272
|
+
template <>
|
|
273
|
+
EIGEN_STRONG_INLINE Packet1cf pandnot<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
274
|
+
return Packet1cf(vreinterpret_f32_u32(vbic_u32(vreinterpret_u32_f32(a.v), vreinterpret_u32_f32(b.v))));
|
|
275
|
+
}
|
|
276
|
+
template <>
|
|
277
|
+
EIGEN_STRONG_INLINE Packet2cf pandnot<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
278
|
+
return Packet2cf(vreinterpretq_f32_u32(vbicq_u32(vreinterpretq_u32_f32(a.v), vreinterpretq_u32_f32(b.v))));
|
|
279
|
+
}
|
|
123
280
|
|
|
124
|
-
template<>
|
|
281
|
+
template <>
|
|
282
|
+
EIGEN_STRONG_INLINE Packet1cf pload<Packet1cf>(const std::complex<float>* from) {
|
|
283
|
+
EIGEN_DEBUG_ALIGNED_LOAD return Packet1cf(
|
|
284
|
+
pload<Packet2f>(assume_aligned<unpacket_traits<Packet1cf>::alignment>(reinterpret_cast<const float*>(from))));
|
|
285
|
+
}
|
|
286
|
+
template <>
|
|
287
|
+
EIGEN_STRONG_INLINE Packet2cf pload<Packet2cf>(const std::complex<float>* from) {
|
|
288
|
+
EIGEN_DEBUG_ALIGNED_LOAD return Packet2cf(
|
|
289
|
+
pload<Packet4f>(assume_aligned<unpacket_traits<Packet2cf>::alignment>(reinterpret_cast<const float*>(from))));
|
|
290
|
+
}
|
|
125
291
|
|
|
126
|
-
template<>
|
|
127
|
-
|
|
292
|
+
template <>
|
|
293
|
+
EIGEN_STRONG_INLINE Packet1cf ploadu<Packet1cf>(const std::complex<float>* from) {
|
|
294
|
+
EIGEN_DEBUG_UNALIGNED_LOAD return Packet1cf(ploadu<Packet2f>((const float*)from));
|
|
295
|
+
}
|
|
296
|
+
template <>
|
|
297
|
+
EIGEN_STRONG_INLINE Packet2cf ploadu<Packet2cf>(const std::complex<float>* from) {
|
|
298
|
+
EIGEN_DEBUG_UNALIGNED_LOAD return Packet2cf(ploadu<Packet4f>(reinterpret_cast<const float*>(from)));
|
|
299
|
+
}
|
|
128
300
|
|
|
129
|
-
template<>
|
|
130
|
-
{
|
|
131
|
-
|
|
132
|
-
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
return Packet2cf(res);
|
|
301
|
+
template <>
|
|
302
|
+
EIGEN_STRONG_INLINE Packet1cf ploaddup<Packet1cf>(const std::complex<float>* from) {
|
|
303
|
+
return pset1<Packet1cf>(*from);
|
|
304
|
+
}
|
|
305
|
+
template <>
|
|
306
|
+
EIGEN_STRONG_INLINE Packet2cf ploaddup<Packet2cf>(const std::complex<float>* from) {
|
|
307
|
+
return pset1<Packet2cf>(*from);
|
|
137
308
|
}
|
|
138
309
|
|
|
139
|
-
template<>
|
|
140
|
-
{
|
|
141
|
-
|
|
142
|
-
|
|
310
|
+
template <>
|
|
311
|
+
EIGEN_STRONG_INLINE void pstore<std::complex<float>>(std::complex<float>* to, const Packet1cf& from) {
|
|
312
|
+
EIGEN_DEBUG_ALIGNED_STORE pstore(assume_aligned<unpacket_traits<Packet1cf>::alignment>(reinterpret_cast<float*>(to)),
|
|
313
|
+
from.v);
|
|
314
|
+
}
|
|
315
|
+
template <>
|
|
316
|
+
EIGEN_STRONG_INLINE void pstore<std::complex<float>>(std::complex<float>* to, const Packet2cf& from) {
|
|
317
|
+
EIGEN_DEBUG_ALIGNED_STORE pstore(assume_aligned<unpacket_traits<Packet2cf>::alignment>(reinterpret_cast<float*>(to)),
|
|
318
|
+
from.v);
|
|
143
319
|
}
|
|
144
320
|
|
|
145
|
-
template<>
|
|
321
|
+
template <>
|
|
322
|
+
EIGEN_STRONG_INLINE void pstoreu<std::complex<float>>(std::complex<float>* to, const Packet1cf& from) {
|
|
323
|
+
EIGEN_DEBUG_UNALIGNED_STORE pstoreu((float*)to, from.v);
|
|
324
|
+
}
|
|
325
|
+
template <>
|
|
326
|
+
EIGEN_STRONG_INLINE void pstoreu<std::complex<float>>(std::complex<float>* to, const Packet2cf& from) {
|
|
327
|
+
EIGEN_DEBUG_UNALIGNED_STORE pstoreu(reinterpret_cast<float*>(to), from.v);
|
|
328
|
+
}
|
|
146
329
|
|
|
147
|
-
template<>
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
return
|
|
330
|
+
template <>
|
|
331
|
+
EIGEN_DEVICE_FUNC inline Packet1cf pgather<std::complex<float>, Packet1cf>(const std::complex<float>* from,
|
|
332
|
+
Index stride) {
|
|
333
|
+
const Packet2f tmp = vdup_n_f32(std::real(from[0 * stride]));
|
|
334
|
+
return Packet1cf(vset_lane_f32(std::imag(from[0 * stride]), tmp, 1));
|
|
335
|
+
}
|
|
336
|
+
template <>
|
|
337
|
+
EIGEN_DEVICE_FUNC inline Packet2cf pgather<std::complex<float>, Packet2cf>(const std::complex<float>* from,
|
|
338
|
+
Index stride) {
|
|
339
|
+
Packet4f res = vdupq_n_f32(std::real(from[0 * stride]));
|
|
340
|
+
res = vsetq_lane_f32(std::imag(from[0 * stride]), res, 1);
|
|
341
|
+
res = vsetq_lane_f32(std::real(from[1 * stride]), res, 2);
|
|
342
|
+
res = vsetq_lane_f32(std::imag(from[1 * stride]), res, 3);
|
|
343
|
+
return Packet2cf(res);
|
|
152
344
|
}
|
|
153
345
|
|
|
154
|
-
template<>
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
346
|
+
template <>
|
|
347
|
+
EIGEN_DEVICE_FUNC inline void pscatter<std::complex<float>, Packet1cf>(std::complex<float>* to, const Packet1cf& from,
|
|
348
|
+
Index stride) {
|
|
349
|
+
to[stride * 0] = std::complex<float>(vget_lane_f32(from.v, 0), vget_lane_f32(from.v, 1));
|
|
350
|
+
}
|
|
351
|
+
template <>
|
|
352
|
+
EIGEN_DEVICE_FUNC inline void pscatter<std::complex<float>, Packet2cf>(std::complex<float>* to, const Packet2cf& from,
|
|
353
|
+
Index stride) {
|
|
354
|
+
to[stride * 0] = std::complex<float>(vgetq_lane_f32(from.v, 0), vgetq_lane_f32(from.v, 1));
|
|
355
|
+
to[stride * 1] = std::complex<float>(vgetq_lane_f32(from.v, 2), vgetq_lane_f32(from.v, 3));
|
|
356
|
+
}
|
|
357
|
+
|
|
358
|
+
template <>
|
|
359
|
+
EIGEN_STRONG_INLINE void prefetch<std::complex<float>>(const std::complex<float>* addr) {
|
|
360
|
+
EIGEN_ARM_PREFETCH(reinterpret_cast<const float*>(addr));
|
|
361
|
+
}
|
|
158
362
|
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
|
|
363
|
+
template <>
|
|
364
|
+
EIGEN_STRONG_INLINE std::complex<float> pfirst<Packet1cf>(const Packet1cf& a) {
|
|
365
|
+
EIGEN_ALIGN16 std::complex<float> x;
|
|
366
|
+
vst1_f32(reinterpret_cast<float*>(&x), a.v);
|
|
367
|
+
return x;
|
|
368
|
+
}
|
|
369
|
+
template <>
|
|
370
|
+
EIGEN_STRONG_INLINE std::complex<float> pfirst<Packet2cf>(const Packet2cf& a) {
|
|
371
|
+
EIGEN_ALIGN16 std::complex<float> x[2];
|
|
372
|
+
vst1q_f32(reinterpret_cast<float*>(x), a.v);
|
|
373
|
+
return x[0];
|
|
374
|
+
}
|
|
162
375
|
|
|
163
|
-
|
|
376
|
+
template <>
|
|
377
|
+
EIGEN_STRONG_INLINE Packet1cf preverse(const Packet1cf& a) {
|
|
378
|
+
return a;
|
|
379
|
+
}
|
|
380
|
+
template <>
|
|
381
|
+
EIGEN_STRONG_INLINE Packet2cf preverse(const Packet2cf& a) {
|
|
382
|
+
return Packet2cf(vcombine_f32(vget_high_f32(a.v), vget_low_f32(a.v)));
|
|
164
383
|
}
|
|
165
384
|
|
|
166
|
-
template<>
|
|
167
|
-
{
|
|
385
|
+
template <>
|
|
386
|
+
EIGEN_STRONG_INLINE Packet1cf pcplxflip<Packet1cf>(const Packet1cf& a) {
|
|
387
|
+
return Packet1cf(vrev64_f32(a.v));
|
|
388
|
+
}
|
|
389
|
+
template <>
|
|
390
|
+
EIGEN_STRONG_INLINE Packet2cf pcplxflip<Packet2cf>(const Packet2cf& a) {
|
|
168
391
|
return Packet2cf(vrev64q_f32(a.v));
|
|
169
392
|
}
|
|
170
393
|
|
|
171
|
-
template<>
|
|
172
|
-
{
|
|
173
|
-
float32x2_t a1, a2;
|
|
394
|
+
template <>
|
|
395
|
+
EIGEN_STRONG_INLINE std::complex<float> predux<Packet1cf>(const Packet1cf& a) {
|
|
174
396
|
std::complex<float> s;
|
|
175
|
-
|
|
176
|
-
a1 = vget_low_f32(a.v);
|
|
177
|
-
a2 = vget_high_f32(a.v);
|
|
178
|
-
a2 = vadd_f32(a1, a2);
|
|
179
|
-
vst1_f32((float *)&s, a2);
|
|
180
|
-
|
|
397
|
+
vst1_f32((float*)&s, a.v);
|
|
181
398
|
return s;
|
|
182
399
|
}
|
|
183
|
-
|
|
184
|
-
|
|
185
|
-
|
|
186
|
-
|
|
187
|
-
|
|
188
|
-
// Add the first two 64-bit float32x2_t of vecs[0]
|
|
189
|
-
sum1 = vcombine_f32(vget_low_f32(vecs[0].v), vget_low_f32(vecs[1].v));
|
|
190
|
-
sum2 = vcombine_f32(vget_high_f32(vecs[0].v), vget_high_f32(vecs[1].v));
|
|
191
|
-
sum = vaddq_f32(sum1, sum2);
|
|
192
|
-
|
|
193
|
-
return Packet2cf(sum);
|
|
400
|
+
template <>
|
|
401
|
+
EIGEN_STRONG_INLINE std::complex<float> predux<Packet2cf>(const Packet2cf& a) {
|
|
402
|
+
std::complex<float> s;
|
|
403
|
+
vst1_f32(reinterpret_cast<float*>(&s), vadd_f32(vget_low_f32(a.v), vget_high_f32(a.v)));
|
|
404
|
+
return s;
|
|
194
405
|
}
|
|
195
406
|
|
|
196
|
-
template<>
|
|
197
|
-
{
|
|
407
|
+
template <>
|
|
408
|
+
EIGEN_STRONG_INLINE std::complex<float> predux_mul<Packet1cf>(const Packet1cf& a) {
|
|
409
|
+
std::complex<float> s;
|
|
410
|
+
vst1_f32((float*)&s, a.v);
|
|
411
|
+
return s;
|
|
412
|
+
}
|
|
413
|
+
template <>
|
|
414
|
+
EIGEN_STRONG_INLINE std::complex<float> predux_mul<Packet2cf>(const Packet2cf& a) {
|
|
198
415
|
float32x2_t a1, a2, v1, v2, prod;
|
|
199
416
|
std::complex<float> s;
|
|
200
417
|
|
|
201
418
|
a1 = vget_low_f32(a.v);
|
|
202
419
|
a2 = vget_high_f32(a.v);
|
|
203
|
-
|
|
420
|
+
// Get the real values of a | a1_re | a1_re | a2_re | a2_re |
|
|
204
421
|
v1 = vdup_lane_f32(a1, 0);
|
|
205
422
|
// Get the real values of a | a1_im | a1_im | a2_im | a2_im |
|
|
206
423
|
v2 = vdup_lane_f32(a1, 1);
|
|
@@ -208,144 +425,171 @@ template<> EIGEN_STRONG_INLINE std::complex<float> predux_mul<Packet2cf>(const P
|
|
|
208
425
|
v1 = vmul_f32(v1, a2);
|
|
209
426
|
// Multiply the imag a with b
|
|
210
427
|
v2 = vmul_f32(v2, a2);
|
|
211
|
-
// Conjugate v2
|
|
428
|
+
// Conjugate v2
|
|
212
429
|
v2 = vreinterpret_f32_u32(veor_u32(vreinterpret_u32_f32(v2), p2ui_CONJ_XOR()));
|
|
213
430
|
// Swap real/imag elements in v2.
|
|
214
431
|
v2 = vrev64_f32(v2);
|
|
215
432
|
// Add v1, v2
|
|
216
433
|
prod = vadd_f32(v1, v2);
|
|
217
434
|
|
|
218
|
-
vst1_f32((
|
|
435
|
+
vst1_f32(reinterpret_cast<float*>(&s), prod);
|
|
219
436
|
|
|
220
437
|
return s;
|
|
221
438
|
}
|
|
222
439
|
|
|
223
|
-
|
|
224
|
-
|
|
225
|
-
{
|
|
226
|
-
EIGEN_STRONG_INLINE static void run(Packet2cf& first, const Packet2cf& second)
|
|
227
|
-
{
|
|
228
|
-
if (Offset==1)
|
|
229
|
-
{
|
|
230
|
-
first.v = vextq_f32(first.v, second.v, 2);
|
|
231
|
-
}
|
|
232
|
-
}
|
|
233
|
-
};
|
|
234
|
-
|
|
235
|
-
template<> struct conj_helper<Packet2cf, Packet2cf, false,true>
|
|
236
|
-
{
|
|
237
|
-
EIGEN_STRONG_INLINE Packet2cf pmadd(const Packet2cf& x, const Packet2cf& y, const Packet2cf& c) const
|
|
238
|
-
{ return padd(pmul(x,y),c); }
|
|
440
|
+
EIGEN_MAKE_CONJ_HELPER_CPLX_REAL(Packet1cf, Packet2f)
|
|
441
|
+
EIGEN_MAKE_CONJ_HELPER_CPLX_REAL(Packet2cf, Packet4f)
|
|
239
442
|
|
|
240
|
-
|
|
241
|
-
|
|
242
|
-
|
|
243
|
-
|
|
244
|
-
|
|
245
|
-
|
|
246
|
-
|
|
247
|
-
|
|
248
|
-
EIGEN_STRONG_INLINE Packet2cf pmadd(const Packet2cf& x, const Packet2cf& y, const Packet2cf& c) const
|
|
249
|
-
{ return padd(pmul(x,y),c); }
|
|
250
|
-
|
|
251
|
-
EIGEN_STRONG_INLINE Packet2cf pmul(const Packet2cf& a, const Packet2cf& b) const
|
|
252
|
-
{
|
|
253
|
-
return internal::pmul(pconj(a), b);
|
|
254
|
-
}
|
|
255
|
-
};
|
|
443
|
+
template <>
|
|
444
|
+
EIGEN_STRONG_INLINE Packet1cf pdiv<Packet1cf>(const Packet1cf& a, const Packet1cf& b) {
|
|
445
|
+
return pdiv_complex(a, b);
|
|
446
|
+
}
|
|
447
|
+
template <>
|
|
448
|
+
EIGEN_STRONG_INLINE Packet2cf pdiv<Packet2cf>(const Packet2cf& a, const Packet2cf& b) {
|
|
449
|
+
return pdiv_complex(a, b);
|
|
450
|
+
}
|
|
256
451
|
|
|
257
|
-
|
|
258
|
-
{
|
|
259
|
-
|
|
260
|
-
|
|
452
|
+
EIGEN_DEVICE_FUNC inline void ptranspose(PacketBlock<Packet1cf, 1>& /*kernel*/) {}
|
|
453
|
+
EIGEN_DEVICE_FUNC inline void ptranspose(PacketBlock<Packet2cf, 2>& kernel) {
|
|
454
|
+
Packet4f tmp = vcombine_f32(vget_high_f32(kernel.packet[0].v), vget_high_f32(kernel.packet[1].v));
|
|
455
|
+
kernel.packet[0].v = vcombine_f32(vget_low_f32(kernel.packet[0].v), vget_low_f32(kernel.packet[1].v));
|
|
456
|
+
kernel.packet[1].v = tmp;
|
|
457
|
+
}
|
|
261
458
|
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
|
|
265
|
-
|
|
266
|
-
};
|
|
459
|
+
template <>
|
|
460
|
+
EIGEN_STRONG_INLINE Packet1cf psqrt<Packet1cf>(const Packet1cf& a) {
|
|
461
|
+
return psqrt_complex<Packet1cf>(a);
|
|
462
|
+
}
|
|
267
463
|
|
|
268
|
-
|
|
464
|
+
template <>
|
|
465
|
+
EIGEN_STRONG_INLINE Packet2cf psqrt<Packet2cf>(const Packet2cf& a) {
|
|
466
|
+
return psqrt_complex<Packet2cf>(a);
|
|
467
|
+
}
|
|
269
468
|
|
|
270
|
-
template<>
|
|
271
|
-
{
|
|
272
|
-
|
|
273
|
-
|
|
274
|
-
Packet4f s, rev_s;
|
|
469
|
+
template <>
|
|
470
|
+
EIGEN_STRONG_INLINE Packet1cf plog<Packet1cf>(const Packet1cf& a) {
|
|
471
|
+
return plog_complex(a);
|
|
472
|
+
}
|
|
275
473
|
|
|
276
|
-
|
|
277
|
-
|
|
278
|
-
|
|
474
|
+
template <>
|
|
475
|
+
EIGEN_STRONG_INLINE Packet2cf plog<Packet2cf>(const Packet2cf& a) {
|
|
476
|
+
return plog_complex(a);
|
|
477
|
+
}
|
|
279
478
|
|
|
280
|
-
|
|
479
|
+
template <>
|
|
480
|
+
EIGEN_STRONG_INLINE Packet1cf pexp<Packet1cf>(const Packet1cf& a) {
|
|
481
|
+
return pexp_complex(a);
|
|
281
482
|
}
|
|
282
483
|
|
|
283
|
-
|
|
284
|
-
|
|
285
|
-
|
|
286
|
-
kernel.packet[0].v = vcombine_f32(vget_low_f32(kernel.packet[0].v), vget_low_f32(kernel.packet[1].v));
|
|
287
|
-
kernel.packet[1].v = tmp;
|
|
484
|
+
template <>
|
|
485
|
+
EIGEN_STRONG_INLINE Packet2cf pexp<Packet2cf>(const Packet2cf& a) {
|
|
486
|
+
return pexp_complex(a);
|
|
288
487
|
}
|
|
289
488
|
|
|
290
489
|
//---------- double ----------
|
|
291
490
|
#if EIGEN_ARCH_ARM64 && !EIGEN_APPLE_DOUBLE_NEON_BUG
|
|
292
491
|
|
|
293
|
-
|
|
294
|
-
|
|
295
|
-
|
|
296
|
-
|
|
297
|
-
const uint64_t p2ul_conj_XOR_DATA[] = { 0x0, 0x8000000000000000 };
|
|
298
|
-
static uint64x2_t p2ul_CONJ_XOR = vld1q_u64( p2ul_conj_XOR_DATA );
|
|
299
|
-
#endif
|
|
492
|
+
inline uint64x2_t p2ul_CONJ_XOR() {
|
|
493
|
+
static const uint64_t p2ul_conj_XOR_DATA[] = {0x0, 0x8000000000000000};
|
|
494
|
+
return vld1q_u64(p2ul_conj_XOR_DATA);
|
|
495
|
+
}
|
|
300
496
|
|
|
301
|
-
struct Packet1cd
|
|
302
|
-
{
|
|
497
|
+
struct Packet1cd {
|
|
303
498
|
EIGEN_STRONG_INLINE Packet1cd() {}
|
|
304
499
|
EIGEN_STRONG_INLINE explicit Packet1cd(const Packet2d& a) : v(a) {}
|
|
305
500
|
Packet2d v;
|
|
306
501
|
};
|
|
307
502
|
|
|
308
|
-
template<>
|
|
309
|
-
{
|
|
503
|
+
template <>
|
|
504
|
+
struct packet_traits<std::complex<double>> : default_packet_traits {
|
|
310
505
|
typedef Packet1cd type;
|
|
311
506
|
typedef Packet1cd half;
|
|
312
507
|
enum {
|
|
313
508
|
Vectorizable = 1,
|
|
314
509
|
AlignedOnScalar = 0,
|
|
315
510
|
size = 1,
|
|
316
|
-
HasHalfPacket = 0,
|
|
317
511
|
|
|
318
|
-
HasAdd
|
|
319
|
-
HasSub
|
|
320
|
-
HasMul
|
|
321
|
-
HasDiv
|
|
512
|
+
HasAdd = 1,
|
|
513
|
+
HasSub = 1,
|
|
514
|
+
HasMul = 1,
|
|
515
|
+
HasDiv = 1,
|
|
322
516
|
HasNegate = 1,
|
|
323
|
-
|
|
324
|
-
|
|
325
|
-
|
|
326
|
-
|
|
517
|
+
HasSqrt = 1,
|
|
518
|
+
HasLog = 1,
|
|
519
|
+
HasAbs = 0,
|
|
520
|
+
HasAbs2 = 0,
|
|
521
|
+
HasMin = 0,
|
|
522
|
+
HasMax = 0,
|
|
327
523
|
HasSetLinear = 0
|
|
328
524
|
};
|
|
329
525
|
};
|
|
330
526
|
|
|
331
|
-
template<>
|
|
527
|
+
template <>
|
|
528
|
+
struct unpacket_traits<Packet1cd> : neon_unpacket_default<Packet1cd, std::complex<double>> {
|
|
529
|
+
using as_real = Packet2d;
|
|
530
|
+
};
|
|
531
|
+
|
|
532
|
+
template <>
|
|
533
|
+
EIGEN_STRONG_INLINE Packet1cd pload<Packet1cd>(const std::complex<double>* from) {
|
|
534
|
+
EIGEN_DEBUG_ALIGNED_LOAD return Packet1cd(
|
|
535
|
+
pload<Packet2d>(assume_aligned<unpacket_traits<Packet1cd>::alignment>(reinterpret_cast<const double*>(from))));
|
|
536
|
+
}
|
|
537
|
+
|
|
538
|
+
template <>
|
|
539
|
+
EIGEN_STRONG_INLINE Packet1cd ploadu<Packet1cd>(const std::complex<double>* from) {
|
|
540
|
+
EIGEN_DEBUG_UNALIGNED_LOAD return Packet1cd(ploadu<Packet2d>(reinterpret_cast<const double*>(from)));
|
|
541
|
+
}
|
|
542
|
+
|
|
543
|
+
template <>
|
|
544
|
+
EIGEN_STRONG_INLINE Packet1cd pzero<Packet1cd>(const Packet1cd& /*a*/) {
|
|
545
|
+
return Packet1cd(vdupq_n_f64(0.0));
|
|
546
|
+
}
|
|
547
|
+
|
|
548
|
+
template <>
|
|
549
|
+
EIGEN_STRONG_INLINE Packet1cd pset1<Packet1cd>(const std::complex<double>& from) {
|
|
550
|
+
/* here we really have to use unaligned loads :( */
|
|
551
|
+
return ploadu<Packet1cd>(&from);
|
|
552
|
+
}
|
|
332
553
|
|
|
333
|
-
template<>
|
|
334
|
-
|
|
554
|
+
template <>
|
|
555
|
+
EIGEN_STRONG_INLINE Packet1cd padd<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
556
|
+
return Packet1cd(padd<Packet2d>(a.v, b.v));
|
|
557
|
+
}
|
|
335
558
|
|
|
336
|
-
template<>
|
|
337
|
-
|
|
559
|
+
template <>
|
|
560
|
+
EIGEN_STRONG_INLINE Packet1cd psub<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
561
|
+
return Packet1cd(psub<Packet2d>(a.v, b.v));
|
|
562
|
+
}
|
|
338
563
|
|
|
339
|
-
template<>
|
|
340
|
-
|
|
341
|
-
|
|
342
|
-
|
|
564
|
+
template <>
|
|
565
|
+
EIGEN_STRONG_INLINE Packet1cd pnegate(const Packet1cd& a) {
|
|
566
|
+
return Packet1cd(pnegate<Packet2d>(a.v));
|
|
567
|
+
}
|
|
343
568
|
|
|
344
|
-
template<>
|
|
345
|
-
{
|
|
569
|
+
template <>
|
|
570
|
+
EIGEN_STRONG_INLINE Packet1cd pconj(const Packet1cd& a) {
|
|
571
|
+
return Packet1cd(vreinterpretq_f64_u64(veorq_u64(vreinterpretq_u64_f64(a.v), p2ul_CONJ_XOR())));
|
|
572
|
+
}
|
|
573
|
+
|
|
574
|
+
#ifdef __ARM_FEATURE_COMPLEX
|
|
575
|
+
template <>
|
|
576
|
+
EIGEN_STRONG_INLINE Packet1cd pmadd<Packet1cd>(const Packet1cd& a, const Packet1cd& b, const Packet1cd& c) {
|
|
577
|
+
Packet1cd result;
|
|
578
|
+
result.v = vcmlaq_f64(c.v, a.v, b.v);
|
|
579
|
+
result.v = vcmlaq_rot90_f64(result.v, a.v, b.v);
|
|
580
|
+
return result;
|
|
581
|
+
}
|
|
582
|
+
|
|
583
|
+
template <>
|
|
584
|
+
EIGEN_STRONG_INLINE Packet1cd pmul<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
585
|
+
return pmadd(a, b, pzero(a));
|
|
586
|
+
}
|
|
587
|
+
#else
|
|
588
|
+
template <>
|
|
589
|
+
EIGEN_STRONG_INLINE Packet1cd pmul<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
346
590
|
Packet2d v1, v2;
|
|
347
591
|
|
|
348
|
-
// Get the real values of a
|
|
592
|
+
// Get the real values of a
|
|
349
593
|
v1 = vdupq_lane_f64(vget_low_f64(a.v), 0);
|
|
350
594
|
// Get the imag values of a
|
|
351
595
|
v2 = vdupq_lane_f64(vget_high_f64(a.v), 0);
|
|
@@ -353,138 +597,136 @@ template<> EIGEN_STRONG_INLINE Packet1cd pmul<Packet1cd>(const Packet1cd& a, con
|
|
|
353
597
|
v1 = vmulq_f64(v1, b.v);
|
|
354
598
|
// Multiply the imag a with b
|
|
355
599
|
v2 = vmulq_f64(v2, b.v);
|
|
356
|
-
// Conjugate v2
|
|
357
|
-
v2 = vreinterpretq_f64_u64(veorq_u64(vreinterpretq_u64_f64(v2), p2ul_CONJ_XOR));
|
|
600
|
+
// Conjugate v2
|
|
601
|
+
v2 = vreinterpretq_f64_u64(veorq_u64(vreinterpretq_u64_f64(v2), p2ul_CONJ_XOR()));
|
|
358
602
|
// Swap real/imag elements in v2.
|
|
359
603
|
v2 = preverse<Packet2d>(v2);
|
|
360
604
|
// Add and return the result
|
|
361
605
|
return Packet1cd(vaddq_f64(v1, v2));
|
|
362
606
|
}
|
|
607
|
+
#endif
|
|
608
|
+
|
|
609
|
+
template <>
|
|
610
|
+
EIGEN_STRONG_INLINE Packet1cd pcmp_eq(const Packet1cd& a, const Packet1cd& b) {
|
|
611
|
+
// Compare real and imaginary parts of a and b to get the mask vector:
|
|
612
|
+
// [re(a)==re(b), im(a)==im(b)]
|
|
613
|
+
Packet2d eq = pcmp_eq<Packet2d>(a.v, b.v);
|
|
614
|
+
// Swap real/imag elements in the mask in to get:
|
|
615
|
+
// [im(a)==im(b), re(a)==re(b)]
|
|
616
|
+
Packet2d eq_swapped = vreinterpretq_f64_u32(vrev64q_u32(vreinterpretq_u32_f64(eq)));
|
|
617
|
+
// Return re(a)==re(b) & im(a)==im(b) by computing bitwise AND of eq and eq_swapped
|
|
618
|
+
return Packet1cd(pand<Packet2d>(eq, eq_swapped));
|
|
619
|
+
}
|
|
620
|
+
|
|
621
|
+
template <>
|
|
622
|
+
EIGEN_STRONG_INLINE Packet1cd pand<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
623
|
+
return Packet1cd(vreinterpretq_f64_u64(vandq_u64(vreinterpretq_u64_f64(a.v), vreinterpretq_u64_f64(b.v))));
|
|
624
|
+
}
|
|
363
625
|
|
|
364
|
-
template<>
|
|
365
|
-
{
|
|
366
|
-
return Packet1cd(vreinterpretq_f64_u64(
|
|
626
|
+
template <>
|
|
627
|
+
EIGEN_STRONG_INLINE Packet1cd por<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
628
|
+
return Packet1cd(vreinterpretq_f64_u64(vorrq_u64(vreinterpretq_u64_f64(a.v), vreinterpretq_u64_f64(b.v))));
|
|
367
629
|
}
|
|
368
|
-
|
|
369
|
-
|
|
370
|
-
|
|
630
|
+
|
|
631
|
+
template <>
|
|
632
|
+
EIGEN_STRONG_INLINE Packet1cd pxor<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
633
|
+
return Packet1cd(vreinterpretq_f64_u64(veorq_u64(vreinterpretq_u64_f64(a.v), vreinterpretq_u64_f64(b.v))));
|
|
371
634
|
}
|
|
372
|
-
|
|
373
|
-
|
|
374
|
-
|
|
635
|
+
|
|
636
|
+
template <>
|
|
637
|
+
EIGEN_STRONG_INLINE Packet1cd pandnot<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
638
|
+
return Packet1cd(vreinterpretq_f64_u64(vbicq_u64(vreinterpretq_u64_f64(a.v), vreinterpretq_u64_f64(b.v))));
|
|
375
639
|
}
|
|
376
|
-
|
|
377
|
-
|
|
378
|
-
|
|
640
|
+
|
|
641
|
+
template <>
|
|
642
|
+
EIGEN_STRONG_INLINE Packet1cd ploaddup<Packet1cd>(const std::complex<double>* from) {
|
|
643
|
+
return pset1<Packet1cd>(*from);
|
|
379
644
|
}
|
|
380
645
|
|
|
381
|
-
template<>
|
|
646
|
+
template <>
|
|
647
|
+
EIGEN_STRONG_INLINE void pstore<std::complex<double>>(std::complex<double>* to, const Packet1cd& from) {
|
|
648
|
+
EIGEN_DEBUG_ALIGNED_STORE pstore(assume_aligned<unpacket_traits<Packet1cd>::alignment>(reinterpret_cast<double*>(to)),
|
|
649
|
+
from.v);
|
|
650
|
+
}
|
|
382
651
|
|
|
383
|
-
template<>
|
|
384
|
-
|
|
652
|
+
template <>
|
|
653
|
+
EIGEN_STRONG_INLINE void pstoreu<std::complex<double>>(std::complex<double>* to, const Packet1cd& from) {
|
|
654
|
+
EIGEN_DEBUG_UNALIGNED_STORE pstoreu(reinterpret_cast<double*>(to), from.v);
|
|
655
|
+
}
|
|
385
656
|
|
|
386
|
-
template<>
|
|
657
|
+
template <>
|
|
658
|
+
EIGEN_STRONG_INLINE void prefetch<std::complex<double>>(const std::complex<double>* addr) {
|
|
659
|
+
EIGEN_ARM_PREFETCH(reinterpret_cast<const double*>(addr));
|
|
660
|
+
}
|
|
387
661
|
|
|
388
|
-
template<>
|
|
389
|
-
|
|
662
|
+
template <>
|
|
663
|
+
EIGEN_DEVICE_FUNC inline Packet1cd pgather<std::complex<double>, Packet1cd>(const std::complex<double>* from,
|
|
664
|
+
Index stride) {
|
|
390
665
|
Packet2d res = pset1<Packet2d>(0.0);
|
|
391
|
-
res = vsetq_lane_f64(std::real(from[0*stride]), res, 0);
|
|
392
|
-
res = vsetq_lane_f64(std::imag(from[0*stride]), res, 1);
|
|
666
|
+
res = vsetq_lane_f64(std::real(from[0 * stride]), res, 0);
|
|
667
|
+
res = vsetq_lane_f64(std::imag(from[0 * stride]), res, 1);
|
|
393
668
|
return Packet1cd(res);
|
|
394
669
|
}
|
|
395
670
|
|
|
396
|
-
template<>
|
|
397
|
-
|
|
398
|
-
|
|
671
|
+
template <>
|
|
672
|
+
EIGEN_DEVICE_FUNC inline void pscatter<std::complex<double>, Packet1cd>(std::complex<double>* to, const Packet1cd& from,
|
|
673
|
+
Index stride) {
|
|
674
|
+
to[stride * 0] = std::complex<double>(vgetq_lane_f64(from.v, 0), vgetq_lane_f64(from.v, 1));
|
|
399
675
|
}
|
|
400
676
|
|
|
401
|
-
|
|
402
|
-
|
|
403
|
-
|
|
404
|
-
std::complex<double
|
|
405
|
-
pstore<std::complex<double> >(&res, a);
|
|
406
|
-
|
|
677
|
+
template <>
|
|
678
|
+
EIGEN_STRONG_INLINE std::complex<double> pfirst<Packet1cd>(const Packet1cd& a) {
|
|
679
|
+
EIGEN_ALIGN16 std::complex<double> res;
|
|
680
|
+
pstore<std::complex<double>>(&res, a);
|
|
407
681
|
return res;
|
|
408
682
|
}
|
|
409
683
|
|
|
410
|
-
template<>
|
|
411
|
-
|
|
412
|
-
|
|
413
|
-
|
|
414
|
-
template<> EIGEN_STRONG_INLINE Packet1cd preduxp<Packet1cd>(const Packet1cd* vecs) { return vecs[0]; }
|
|
415
|
-
|
|
416
|
-
template<> EIGEN_STRONG_INLINE std::complex<double> predux_mul<Packet1cd>(const Packet1cd& a) { return pfirst(a); }
|
|
417
|
-
|
|
418
|
-
template<int Offset>
|
|
419
|
-
struct palign_impl<Offset,Packet1cd>
|
|
420
|
-
{
|
|
421
|
-
static EIGEN_STRONG_INLINE void run(Packet1cd& /*first*/, const Packet1cd& /*second*/)
|
|
422
|
-
{
|
|
423
|
-
// FIXME is it sure we never have to align a Packet1cd?
|
|
424
|
-
// Even though a std::complex<double> has 16 bytes, it is not necessarily aligned on a 16 bytes boundary...
|
|
425
|
-
}
|
|
426
|
-
};
|
|
427
|
-
|
|
428
|
-
template<> struct conj_helper<Packet1cd, Packet1cd, false,true>
|
|
429
|
-
{
|
|
430
|
-
EIGEN_STRONG_INLINE Packet1cd pmadd(const Packet1cd& x, const Packet1cd& y, const Packet1cd& c) const
|
|
431
|
-
{ return padd(pmul(x,y),c); }
|
|
432
|
-
|
|
433
|
-
EIGEN_STRONG_INLINE Packet1cd pmul(const Packet1cd& a, const Packet1cd& b) const
|
|
434
|
-
{
|
|
435
|
-
return internal::pmul(a, pconj(b));
|
|
436
|
-
}
|
|
437
|
-
};
|
|
438
|
-
|
|
439
|
-
template<> struct conj_helper<Packet1cd, Packet1cd, true,false>
|
|
440
|
-
{
|
|
441
|
-
EIGEN_STRONG_INLINE Packet1cd pmadd(const Packet1cd& x, const Packet1cd& y, const Packet1cd& c) const
|
|
442
|
-
{ return padd(pmul(x,y),c); }
|
|
443
|
-
|
|
444
|
-
EIGEN_STRONG_INLINE Packet1cd pmul(const Packet1cd& a, const Packet1cd& b) const
|
|
445
|
-
{
|
|
446
|
-
return internal::pmul(pconj(a), b);
|
|
447
|
-
}
|
|
448
|
-
};
|
|
449
|
-
|
|
450
|
-
template<> struct conj_helper<Packet1cd, Packet1cd, true,true>
|
|
451
|
-
{
|
|
452
|
-
EIGEN_STRONG_INLINE Packet1cd pmadd(const Packet1cd& x, const Packet1cd& y, const Packet1cd& c) const
|
|
453
|
-
{ return padd(pmul(x,y),c); }
|
|
684
|
+
template <>
|
|
685
|
+
EIGEN_STRONG_INLINE Packet1cd preverse(const Packet1cd& a) {
|
|
686
|
+
return a;
|
|
687
|
+
}
|
|
454
688
|
|
|
455
|
-
|
|
456
|
-
|
|
457
|
-
|
|
458
|
-
|
|
459
|
-
};
|
|
689
|
+
template <>
|
|
690
|
+
EIGEN_STRONG_INLINE std::complex<double> predux<Packet1cd>(const Packet1cd& a) {
|
|
691
|
+
return pfirst(a);
|
|
692
|
+
}
|
|
460
693
|
|
|
461
|
-
|
|
694
|
+
template <>
|
|
695
|
+
EIGEN_STRONG_INLINE std::complex<double> predux_mul<Packet1cd>(const Packet1cd& a) {
|
|
696
|
+
return pfirst(a);
|
|
697
|
+
}
|
|
462
698
|
|
|
463
|
-
|
|
464
|
-
{
|
|
465
|
-
// TODO optimize it for NEON
|
|
466
|
-
Packet1cd res = conj_helper<Packet1cd,Packet1cd,false,true>().pmul(a,b);
|
|
467
|
-
Packet2d s = pmul<Packet2d>(b.v, b.v);
|
|
468
|
-
Packet2d rev_s = preverse<Packet2d>(s);
|
|
699
|
+
EIGEN_MAKE_CONJ_HELPER_CPLX_REAL(Packet1cd, Packet2d)
|
|
469
700
|
|
|
470
|
-
|
|
701
|
+
template <>
|
|
702
|
+
EIGEN_STRONG_INLINE Packet1cd pdiv<Packet1cd>(const Packet1cd& a, const Packet1cd& b) {
|
|
703
|
+
return pdiv_complex(a, b);
|
|
471
704
|
}
|
|
472
705
|
|
|
473
|
-
EIGEN_STRONG_INLINE Packet1cd pcplxflip/*<Packet1cd>*/(const Packet1cd& x)
|
|
474
|
-
{
|
|
706
|
+
EIGEN_STRONG_INLINE Packet1cd pcplxflip /*<Packet1cd>*/ (const Packet1cd& x) {
|
|
475
707
|
return Packet1cd(preverse(Packet2d(x.v)));
|
|
476
708
|
}
|
|
477
709
|
|
|
478
|
-
EIGEN_STRONG_INLINE void ptranspose(PacketBlock<Packet1cd,2>& kernel)
|
|
479
|
-
{
|
|
710
|
+
EIGEN_STRONG_INLINE void ptranspose(PacketBlock<Packet1cd, 2>& kernel) {
|
|
480
711
|
Packet2d tmp = vcombine_f64(vget_high_f64(kernel.packet[0].v), vget_high_f64(kernel.packet[1].v));
|
|
481
712
|
kernel.packet[0].v = vcombine_f64(vget_low_f64(kernel.packet[0].v), vget_low_f64(kernel.packet[1].v));
|
|
482
713
|
kernel.packet[1].v = tmp;
|
|
483
714
|
}
|
|
484
|
-
#endif // EIGEN_ARCH_ARM64
|
|
485
715
|
|
|
486
|
-
|
|
716
|
+
template <>
|
|
717
|
+
EIGEN_STRONG_INLINE Packet1cd psqrt<Packet1cd>(const Packet1cd& a) {
|
|
718
|
+
return psqrt_complex<Packet1cd>(a);
|
|
719
|
+
}
|
|
720
|
+
|
|
721
|
+
template <>
|
|
722
|
+
EIGEN_STRONG_INLINE Packet1cd plog<Packet1cd>(const Packet1cd& a) {
|
|
723
|
+
return plog_complex(a);
|
|
724
|
+
}
|
|
725
|
+
|
|
726
|
+
#endif // EIGEN_ARCH_ARM64
|
|
727
|
+
|
|
728
|
+
} // end namespace internal
|
|
487
729
|
|
|
488
|
-
}
|
|
730
|
+
} // end namespace Eigen
|
|
489
731
|
|
|
490
|
-
#endif
|
|
732
|
+
#endif // EIGEN_COMPLEX_NEON_H
|