tomoto 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/CHANGELOG.md +3 -0
- data/LICENSE.txt +22 -0
- data/README.md +123 -0
- data/ext/tomoto/ext.cpp +245 -0
- data/ext/tomoto/extconf.rb +28 -0
- data/lib/tomoto.rb +12 -0
- data/lib/tomoto/ct.rb +11 -0
- data/lib/tomoto/hdp.rb +11 -0
- data/lib/tomoto/lda.rb +67 -0
- data/lib/tomoto/version.rb +3 -0
- data/vendor/EigenRand/EigenRand/Core.h +1139 -0
- data/vendor/EigenRand/EigenRand/Dists/Basic.h +111 -0
- data/vendor/EigenRand/EigenRand/Dists/Discrete.h +877 -0
- data/vendor/EigenRand/EigenRand/Dists/GammaPoisson.h +108 -0
- data/vendor/EigenRand/EigenRand/Dists/NormalExp.h +626 -0
- data/vendor/EigenRand/EigenRand/EigenRand +19 -0
- data/vendor/EigenRand/EigenRand/Macro.h +24 -0
- data/vendor/EigenRand/EigenRand/MorePacketMath.h +978 -0
- data/vendor/EigenRand/EigenRand/PacketFilter.h +286 -0
- data/vendor/EigenRand/EigenRand/PacketRandomEngine.h +624 -0
- data/vendor/EigenRand/EigenRand/RandUtils.h +413 -0
- data/vendor/EigenRand/EigenRand/doc.h +220 -0
- data/vendor/EigenRand/LICENSE +21 -0
- data/vendor/EigenRand/README.md +288 -0
- data/vendor/eigen/COPYING.BSD +26 -0
- data/vendor/eigen/COPYING.GPL +674 -0
- data/vendor/eigen/COPYING.LGPL +502 -0
- data/vendor/eigen/COPYING.MINPACK +52 -0
- data/vendor/eigen/COPYING.MPL2 +373 -0
- data/vendor/eigen/COPYING.README +18 -0
- data/vendor/eigen/Eigen/CMakeLists.txt +19 -0
- data/vendor/eigen/Eigen/Cholesky +46 -0
- data/vendor/eigen/Eigen/CholmodSupport +48 -0
- data/vendor/eigen/Eigen/Core +537 -0
- data/vendor/eigen/Eigen/Dense +7 -0
- data/vendor/eigen/Eigen/Eigen +2 -0
- data/vendor/eigen/Eigen/Eigenvalues +61 -0
- data/vendor/eigen/Eigen/Geometry +62 -0
- data/vendor/eigen/Eigen/Householder +30 -0
- data/vendor/eigen/Eigen/IterativeLinearSolvers +48 -0
- data/vendor/eigen/Eigen/Jacobi +33 -0
- data/vendor/eigen/Eigen/LU +50 -0
- data/vendor/eigen/Eigen/MetisSupport +35 -0
- data/vendor/eigen/Eigen/OrderingMethods +73 -0
- data/vendor/eigen/Eigen/PaStiXSupport +48 -0
- data/vendor/eigen/Eigen/PardisoSupport +35 -0
- data/vendor/eigen/Eigen/QR +51 -0
- data/vendor/eigen/Eigen/QtAlignedMalloc +40 -0
- data/vendor/eigen/Eigen/SPQRSupport +34 -0
- data/vendor/eigen/Eigen/SVD +51 -0
- data/vendor/eigen/Eigen/Sparse +36 -0
- data/vendor/eigen/Eigen/SparseCholesky +45 -0
- data/vendor/eigen/Eigen/SparseCore +69 -0
- data/vendor/eigen/Eigen/SparseLU +46 -0
- data/vendor/eigen/Eigen/SparseQR +37 -0
- data/vendor/eigen/Eigen/StdDeque +27 -0
- data/vendor/eigen/Eigen/StdList +26 -0
- data/vendor/eigen/Eigen/StdVector +27 -0
- data/vendor/eigen/Eigen/SuperLUSupport +64 -0
- data/vendor/eigen/Eigen/UmfPackSupport +40 -0
- data/vendor/eigen/Eigen/src/Cholesky/LDLT.h +673 -0
- data/vendor/eigen/Eigen/src/Cholesky/LLT.h +542 -0
- data/vendor/eigen/Eigen/src/Cholesky/LLT_LAPACKE.h +99 -0
- data/vendor/eigen/Eigen/src/CholmodSupport/CholmodSupport.h +639 -0
- data/vendor/eigen/Eigen/src/Core/Array.h +329 -0
- data/vendor/eigen/Eigen/src/Core/ArrayBase.h +226 -0
- data/vendor/eigen/Eigen/src/Core/ArrayWrapper.h +209 -0
- data/vendor/eigen/Eigen/src/Core/Assign.h +90 -0
- data/vendor/eigen/Eigen/src/Core/AssignEvaluator.h +935 -0
- data/vendor/eigen/Eigen/src/Core/Assign_MKL.h +178 -0
- data/vendor/eigen/Eigen/src/Core/BandMatrix.h +353 -0
- data/vendor/eigen/Eigen/src/Core/Block.h +452 -0
- data/vendor/eigen/Eigen/src/Core/BooleanRedux.h +164 -0
- data/vendor/eigen/Eigen/src/Core/CommaInitializer.h +160 -0
- data/vendor/eigen/Eigen/src/Core/ConditionEstimator.h +175 -0
- data/vendor/eigen/Eigen/src/Core/CoreEvaluators.h +1688 -0
- data/vendor/eigen/Eigen/src/Core/CoreIterators.h +127 -0
- data/vendor/eigen/Eigen/src/Core/CwiseBinaryOp.h +184 -0
- data/vendor/eigen/Eigen/src/Core/CwiseNullaryOp.h +866 -0
- data/vendor/eigen/Eigen/src/Core/CwiseTernaryOp.h +197 -0
- data/vendor/eigen/Eigen/src/Core/CwiseUnaryOp.h +103 -0
- data/vendor/eigen/Eigen/src/Core/CwiseUnaryView.h +128 -0
- data/vendor/eigen/Eigen/src/Core/DenseBase.h +611 -0
- data/vendor/eigen/Eigen/src/Core/DenseCoeffsBase.h +681 -0
- data/vendor/eigen/Eigen/src/Core/DenseStorage.h +570 -0
- data/vendor/eigen/Eigen/src/Core/Diagonal.h +260 -0
- data/vendor/eigen/Eigen/src/Core/DiagonalMatrix.h +343 -0
- data/vendor/eigen/Eigen/src/Core/DiagonalProduct.h +28 -0
- data/vendor/eigen/Eigen/src/Core/Dot.h +318 -0
- data/vendor/eigen/Eigen/src/Core/EigenBase.h +159 -0
- data/vendor/eigen/Eigen/src/Core/ForceAlignedAccess.h +146 -0
- data/vendor/eigen/Eigen/src/Core/Fuzzy.h +155 -0
- data/vendor/eigen/Eigen/src/Core/GeneralProduct.h +455 -0
- data/vendor/eigen/Eigen/src/Core/GenericPacketMath.h +593 -0
- data/vendor/eigen/Eigen/src/Core/GlobalFunctions.h +187 -0
- data/vendor/eigen/Eigen/src/Core/IO.h +225 -0
- data/vendor/eigen/Eigen/src/Core/Inverse.h +118 -0
- data/vendor/eigen/Eigen/src/Core/Map.h +171 -0
- data/vendor/eigen/Eigen/src/Core/MapBase.h +303 -0
- data/vendor/eigen/Eigen/src/Core/MathFunctions.h +1415 -0
- data/vendor/eigen/Eigen/src/Core/MathFunctionsImpl.h +101 -0
- data/vendor/eigen/Eigen/src/Core/Matrix.h +459 -0
- data/vendor/eigen/Eigen/src/Core/MatrixBase.h +529 -0
- data/vendor/eigen/Eigen/src/Core/NestByValue.h +110 -0
- data/vendor/eigen/Eigen/src/Core/NoAlias.h +108 -0
- data/vendor/eigen/Eigen/src/Core/NumTraits.h +248 -0
- data/vendor/eigen/Eigen/src/Core/PermutationMatrix.h +633 -0
- data/vendor/eigen/Eigen/src/Core/PlainObjectBase.h +1035 -0
- data/vendor/eigen/Eigen/src/Core/Product.h +186 -0
- data/vendor/eigen/Eigen/src/Core/ProductEvaluators.h +1112 -0
- data/vendor/eigen/Eigen/src/Core/Random.h +182 -0
- data/vendor/eigen/Eigen/src/Core/Redux.h +505 -0
- data/vendor/eigen/Eigen/src/Core/Ref.h +283 -0
- data/vendor/eigen/Eigen/src/Core/Replicate.h +142 -0
- data/vendor/eigen/Eigen/src/Core/ReturnByValue.h +117 -0
- data/vendor/eigen/Eigen/src/Core/Reverse.h +211 -0
- data/vendor/eigen/Eigen/src/Core/Select.h +162 -0
- data/vendor/eigen/Eigen/src/Core/SelfAdjointView.h +352 -0
- data/vendor/eigen/Eigen/src/Core/SelfCwiseBinaryOp.h +47 -0
- data/vendor/eigen/Eigen/src/Core/Solve.h +188 -0
- data/vendor/eigen/Eigen/src/Core/SolveTriangular.h +235 -0
- data/vendor/eigen/Eigen/src/Core/SolverBase.h +130 -0
- data/vendor/eigen/Eigen/src/Core/StableNorm.h +221 -0
- data/vendor/eigen/Eigen/src/Core/Stride.h +111 -0
- data/vendor/eigen/Eigen/src/Core/Swap.h +67 -0
- data/vendor/eigen/Eigen/src/Core/Transpose.h +403 -0
- data/vendor/eigen/Eigen/src/Core/Transpositions.h +407 -0
- data/vendor/eigen/Eigen/src/Core/TriangularMatrix.h +983 -0
- data/vendor/eigen/Eigen/src/Core/VectorBlock.h +96 -0
- data/vendor/eigen/Eigen/src/Core/VectorwiseOp.h +695 -0
- data/vendor/eigen/Eigen/src/Core/Visitor.h +273 -0
- data/vendor/eigen/Eigen/src/Core/arch/AVX/Complex.h +451 -0
- data/vendor/eigen/Eigen/src/Core/arch/AVX/MathFunctions.h +439 -0
- data/vendor/eigen/Eigen/src/Core/arch/AVX/PacketMath.h +637 -0
- data/vendor/eigen/Eigen/src/Core/arch/AVX/TypeCasting.h +51 -0
- data/vendor/eigen/Eigen/src/Core/arch/AVX512/MathFunctions.h +391 -0
- data/vendor/eigen/Eigen/src/Core/arch/AVX512/PacketMath.h +1316 -0
- data/vendor/eigen/Eigen/src/Core/arch/AltiVec/Complex.h +430 -0
- data/vendor/eigen/Eigen/src/Core/arch/AltiVec/MathFunctions.h +322 -0
- data/vendor/eigen/Eigen/src/Core/arch/AltiVec/PacketMath.h +1061 -0
- data/vendor/eigen/Eigen/src/Core/arch/CUDA/Complex.h +103 -0
- data/vendor/eigen/Eigen/src/Core/arch/CUDA/Half.h +674 -0
- data/vendor/eigen/Eigen/src/Core/arch/CUDA/MathFunctions.h +91 -0
- data/vendor/eigen/Eigen/src/Core/arch/CUDA/PacketMath.h +333 -0
- data/vendor/eigen/Eigen/src/Core/arch/CUDA/PacketMathHalf.h +1124 -0
- data/vendor/eigen/Eigen/src/Core/arch/CUDA/TypeCasting.h +212 -0
- data/vendor/eigen/Eigen/src/Core/arch/Default/ConjHelper.h +29 -0
- data/vendor/eigen/Eigen/src/Core/arch/Default/Settings.h +49 -0
- data/vendor/eigen/Eigen/src/Core/arch/NEON/Complex.h +490 -0
- data/vendor/eigen/Eigen/src/Core/arch/NEON/MathFunctions.h +91 -0
- data/vendor/eigen/Eigen/src/Core/arch/NEON/PacketMath.h +760 -0
- data/vendor/eigen/Eigen/src/Core/arch/SSE/Complex.h +471 -0
- data/vendor/eigen/Eigen/src/Core/arch/SSE/MathFunctions.h +562 -0
- data/vendor/eigen/Eigen/src/Core/arch/SSE/PacketMath.h +895 -0
- data/vendor/eigen/Eigen/src/Core/arch/SSE/TypeCasting.h +77 -0
- data/vendor/eigen/Eigen/src/Core/arch/ZVector/Complex.h +397 -0
- data/vendor/eigen/Eigen/src/Core/arch/ZVector/MathFunctions.h +137 -0
- data/vendor/eigen/Eigen/src/Core/arch/ZVector/PacketMath.h +945 -0
- data/vendor/eigen/Eigen/src/Core/functors/AssignmentFunctors.h +168 -0
- data/vendor/eigen/Eigen/src/Core/functors/BinaryFunctors.h +475 -0
- data/vendor/eigen/Eigen/src/Core/functors/NullaryFunctors.h +188 -0
- data/vendor/eigen/Eigen/src/Core/functors/StlFunctors.h +136 -0
- data/vendor/eigen/Eigen/src/Core/functors/TernaryFunctors.h +25 -0
- data/vendor/eigen/Eigen/src/Core/functors/UnaryFunctors.h +792 -0
- data/vendor/eigen/Eigen/src/Core/products/GeneralBlockPanelKernel.h +2156 -0
- data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrix.h +492 -0
- data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular.h +311 -0
- data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular_BLAS.h +145 -0
- data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrix_BLAS.h +122 -0
- data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixVector.h +619 -0
- data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixVector_BLAS.h +136 -0
- data/vendor/eigen/Eigen/src/Core/products/Parallelizer.h +163 -0
- data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix.h +521 -0
- data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix_BLAS.h +287 -0
- data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixVector.h +260 -0
- data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixVector_BLAS.h +118 -0
- data/vendor/eigen/Eigen/src/Core/products/SelfadjointProduct.h +133 -0
- data/vendor/eigen/Eigen/src/Core/products/SelfadjointRank2Update.h +93 -0
- data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixMatrix.h +466 -0
- data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixMatrix_BLAS.h +315 -0
- data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixVector.h +350 -0
- data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixVector_BLAS.h +255 -0
- data/vendor/eigen/Eigen/src/Core/products/TriangularSolverMatrix.h +335 -0
- data/vendor/eigen/Eigen/src/Core/products/TriangularSolverMatrix_BLAS.h +163 -0
- data/vendor/eigen/Eigen/src/Core/products/TriangularSolverVector.h +145 -0
- data/vendor/eigen/Eigen/src/Core/util/BlasUtil.h +398 -0
- data/vendor/eigen/Eigen/src/Core/util/Constants.h +547 -0
- data/vendor/eigen/Eigen/src/Core/util/DisableStupidWarnings.h +83 -0
- data/vendor/eigen/Eigen/src/Core/util/ForwardDeclarations.h +302 -0
- data/vendor/eigen/Eigen/src/Core/util/MKL_support.h +130 -0
- data/vendor/eigen/Eigen/src/Core/util/Macros.h +1001 -0
- data/vendor/eigen/Eigen/src/Core/util/Memory.h +993 -0
- data/vendor/eigen/Eigen/src/Core/util/Meta.h +534 -0
- data/vendor/eigen/Eigen/src/Core/util/NonMPL2.h +3 -0
- data/vendor/eigen/Eigen/src/Core/util/ReenableStupidWarnings.h +27 -0
- data/vendor/eigen/Eigen/src/Core/util/StaticAssert.h +218 -0
- data/vendor/eigen/Eigen/src/Core/util/XprHelper.h +821 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/ComplexEigenSolver.h +346 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/ComplexSchur.h +459 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/ComplexSchur_LAPACKE.h +91 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/EigenSolver.h +622 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/GeneralizedEigenSolver.h +418 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/GeneralizedSelfAdjointEigenSolver.h +226 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/HessenbergDecomposition.h +374 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/MatrixBaseEigenvalues.h +158 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/RealQZ.h +654 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/RealSchur.h +546 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/RealSchur_LAPACKE.h +77 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h +870 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver_LAPACKE.h +87 -0
- data/vendor/eigen/Eigen/src/Eigenvalues/Tridiagonalization.h +556 -0
- data/vendor/eigen/Eigen/src/Geometry/AlignedBox.h +392 -0
- data/vendor/eigen/Eigen/src/Geometry/AngleAxis.h +247 -0
- data/vendor/eigen/Eigen/src/Geometry/EulerAngles.h +114 -0
- data/vendor/eigen/Eigen/src/Geometry/Homogeneous.h +497 -0
- data/vendor/eigen/Eigen/src/Geometry/Hyperplane.h +282 -0
- data/vendor/eigen/Eigen/src/Geometry/OrthoMethods.h +234 -0
- data/vendor/eigen/Eigen/src/Geometry/ParametrizedLine.h +195 -0
- data/vendor/eigen/Eigen/src/Geometry/Quaternion.h +814 -0
- data/vendor/eigen/Eigen/src/Geometry/Rotation2D.h +199 -0
- data/vendor/eigen/Eigen/src/Geometry/RotationBase.h +206 -0
- data/vendor/eigen/Eigen/src/Geometry/Scaling.h +170 -0
- data/vendor/eigen/Eigen/src/Geometry/Transform.h +1542 -0
- data/vendor/eigen/Eigen/src/Geometry/Translation.h +208 -0
- data/vendor/eigen/Eigen/src/Geometry/Umeyama.h +166 -0
- data/vendor/eigen/Eigen/src/Geometry/arch/Geometry_SSE.h +161 -0
- data/vendor/eigen/Eigen/src/Householder/BlockHouseholder.h +103 -0
- data/vendor/eigen/Eigen/src/Householder/Householder.h +172 -0
- data/vendor/eigen/Eigen/src/Householder/HouseholderSequence.h +470 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/BasicPreconditioners.h +226 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/BiCGSTAB.h +228 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/ConjugateGradient.h +246 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/IncompleteCholesky.h +400 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/IncompleteLUT.h +462 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/IterativeSolverBase.h +394 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/LeastSquareConjugateGradient.h +216 -0
- data/vendor/eigen/Eigen/src/IterativeLinearSolvers/SolveWithGuess.h +115 -0
- data/vendor/eigen/Eigen/src/Jacobi/Jacobi.h +462 -0
- data/vendor/eigen/Eigen/src/LU/Determinant.h +101 -0
- data/vendor/eigen/Eigen/src/LU/FullPivLU.h +891 -0
- data/vendor/eigen/Eigen/src/LU/InverseImpl.h +415 -0
- data/vendor/eigen/Eigen/src/LU/PartialPivLU.h +611 -0
- data/vendor/eigen/Eigen/src/LU/PartialPivLU_LAPACKE.h +83 -0
- data/vendor/eigen/Eigen/src/LU/arch/Inverse_SSE.h +338 -0
- data/vendor/eigen/Eigen/src/MetisSupport/MetisSupport.h +137 -0
- data/vendor/eigen/Eigen/src/OrderingMethods/Amd.h +445 -0
- data/vendor/eigen/Eigen/src/OrderingMethods/Eigen_Colamd.h +1843 -0
- data/vendor/eigen/Eigen/src/OrderingMethods/Ordering.h +157 -0
- data/vendor/eigen/Eigen/src/PaStiXSupport/PaStiXSupport.h +678 -0
- data/vendor/eigen/Eigen/src/PardisoSupport/PardisoSupport.h +543 -0
- data/vendor/eigen/Eigen/src/QR/ColPivHouseholderQR.h +653 -0
- data/vendor/eigen/Eigen/src/QR/ColPivHouseholderQR_LAPACKE.h +97 -0
- data/vendor/eigen/Eigen/src/QR/CompleteOrthogonalDecomposition.h +562 -0
- data/vendor/eigen/Eigen/src/QR/FullPivHouseholderQR.h +676 -0
- data/vendor/eigen/Eigen/src/QR/HouseholderQR.h +409 -0
- data/vendor/eigen/Eigen/src/QR/HouseholderQR_LAPACKE.h +68 -0
- data/vendor/eigen/Eigen/src/SPQRSupport/SuiteSparseQRSupport.h +313 -0
- data/vendor/eigen/Eigen/src/SVD/BDCSVD.h +1246 -0
- data/vendor/eigen/Eigen/src/SVD/JacobiSVD.h +804 -0
- data/vendor/eigen/Eigen/src/SVD/JacobiSVD_LAPACKE.h +91 -0
- data/vendor/eigen/Eigen/src/SVD/SVDBase.h +315 -0
- data/vendor/eigen/Eigen/src/SVD/UpperBidiagonalization.h +414 -0
- data/vendor/eigen/Eigen/src/SparseCholesky/SimplicialCholesky.h +689 -0
- data/vendor/eigen/Eigen/src/SparseCholesky/SimplicialCholesky_impl.h +199 -0
- data/vendor/eigen/Eigen/src/SparseCore/AmbiVector.h +377 -0
- data/vendor/eigen/Eigen/src/SparseCore/CompressedStorage.h +258 -0
- data/vendor/eigen/Eigen/src/SparseCore/ConservativeSparseSparseProduct.h +352 -0
- data/vendor/eigen/Eigen/src/SparseCore/MappedSparseMatrix.h +67 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseAssign.h +216 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseBlock.h +603 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseColEtree.h +206 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseCompressedBase.h +341 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseCwiseBinaryOp.h +726 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseCwiseUnaryOp.h +148 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseDenseProduct.h +320 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseDiagonalProduct.h +138 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseDot.h +98 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseFuzzy.h +29 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseMap.h +305 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseMatrix.h +1403 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseMatrixBase.h +405 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparsePermutation.h +178 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseProduct.h +169 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseRedux.h +49 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseRef.h +397 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseSelfAdjointView.h +656 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseSolverBase.h +124 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseSparseProductWithPruning.h +198 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseTranspose.h +92 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseTriangularView.h +189 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseUtil.h +178 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseVector.h +478 -0
- data/vendor/eigen/Eigen/src/SparseCore/SparseView.h +253 -0
- data/vendor/eigen/Eigen/src/SparseCore/TriangularSolver.h +315 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU.h +773 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLUImpl.h +66 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_Memory.h +226 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_Structs.h +110 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_SupernodalMatrix.h +301 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_Utils.h +80 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_column_bmod.h +181 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_column_dfs.h +179 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_copy_to_ucol.h +107 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_gemm_kernel.h +280 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_heap_relax_snode.h +126 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_kernel_bmod.h +130 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_panel_bmod.h +223 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_panel_dfs.h +258 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_pivotL.h +137 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_pruneL.h +136 -0
- data/vendor/eigen/Eigen/src/SparseLU/SparseLU_relax_snode.h +83 -0
- data/vendor/eigen/Eigen/src/SparseQR/SparseQR.h +745 -0
- data/vendor/eigen/Eigen/src/StlSupport/StdDeque.h +126 -0
- data/vendor/eigen/Eigen/src/StlSupport/StdList.h +106 -0
- data/vendor/eigen/Eigen/src/StlSupport/StdVector.h +131 -0
- data/vendor/eigen/Eigen/src/StlSupport/details.h +84 -0
- data/vendor/eigen/Eigen/src/SuperLUSupport/SuperLUSupport.h +1027 -0
- data/vendor/eigen/Eigen/src/UmfPackSupport/UmfPackSupport.h +506 -0
- data/vendor/eigen/Eigen/src/misc/Image.h +82 -0
- data/vendor/eigen/Eigen/src/misc/Kernel.h +79 -0
- data/vendor/eigen/Eigen/src/misc/RealSvd2x2.h +55 -0
- data/vendor/eigen/Eigen/src/misc/blas.h +440 -0
- data/vendor/eigen/Eigen/src/misc/lapack.h +152 -0
- data/vendor/eigen/Eigen/src/misc/lapacke.h +16291 -0
- data/vendor/eigen/Eigen/src/misc/lapacke_mangling.h +17 -0
- data/vendor/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.h +332 -0
- data/vendor/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.h +552 -0
- data/vendor/eigen/Eigen/src/plugins/BlockMethods.h +1058 -0
- data/vendor/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.h +115 -0
- data/vendor/eigen/Eigen/src/plugins/CommonCwiseUnaryOps.h +163 -0
- data/vendor/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.h +152 -0
- data/vendor/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.h +85 -0
- data/vendor/eigen/README.md +3 -0
- data/vendor/eigen/bench/README.txt +55 -0
- data/vendor/eigen/bench/btl/COPYING +340 -0
- data/vendor/eigen/bench/btl/README +154 -0
- data/vendor/eigen/bench/tensors/README +21 -0
- data/vendor/eigen/blas/README.txt +6 -0
- data/vendor/eigen/demos/mandelbrot/README +10 -0
- data/vendor/eigen/demos/mix_eigen_and_c/README +9 -0
- data/vendor/eigen/demos/opengl/README +13 -0
- data/vendor/eigen/unsupported/Eigen/CXX11/src/Tensor/README.md +1760 -0
- data/vendor/eigen/unsupported/README.txt +50 -0
- data/vendor/tomotopy/LICENSE +21 -0
- data/vendor/tomotopy/README.kr.rst +375 -0
- data/vendor/tomotopy/README.rst +382 -0
- data/vendor/tomotopy/src/Labeling/FoRelevance.cpp +362 -0
- data/vendor/tomotopy/src/Labeling/FoRelevance.h +88 -0
- data/vendor/tomotopy/src/Labeling/Labeler.h +50 -0
- data/vendor/tomotopy/src/TopicModel/CT.h +37 -0
- data/vendor/tomotopy/src/TopicModel/CTModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/CTModel.hpp +293 -0
- data/vendor/tomotopy/src/TopicModel/DMR.h +51 -0
- data/vendor/tomotopy/src/TopicModel/DMRModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/DMRModel.hpp +374 -0
- data/vendor/tomotopy/src/TopicModel/DT.h +65 -0
- data/vendor/tomotopy/src/TopicModel/DTM.h +22 -0
- data/vendor/tomotopy/src/TopicModel/DTModel.cpp +15 -0
- data/vendor/tomotopy/src/TopicModel/DTModel.hpp +572 -0
- data/vendor/tomotopy/src/TopicModel/GDMR.h +37 -0
- data/vendor/tomotopy/src/TopicModel/GDMRModel.cpp +14 -0
- data/vendor/tomotopy/src/TopicModel/GDMRModel.hpp +485 -0
- data/vendor/tomotopy/src/TopicModel/HDP.h +74 -0
- data/vendor/tomotopy/src/TopicModel/HDPModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/HDPModel.hpp +592 -0
- data/vendor/tomotopy/src/TopicModel/HLDA.h +40 -0
- data/vendor/tomotopy/src/TopicModel/HLDAModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/HLDAModel.hpp +681 -0
- data/vendor/tomotopy/src/TopicModel/HPA.h +27 -0
- data/vendor/tomotopy/src/TopicModel/HPAModel.cpp +21 -0
- data/vendor/tomotopy/src/TopicModel/HPAModel.hpp +588 -0
- data/vendor/tomotopy/src/TopicModel/LDA.h +144 -0
- data/vendor/tomotopy/src/TopicModel/LDACVB0Model.hpp +442 -0
- data/vendor/tomotopy/src/TopicModel/LDAModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/LDAModel.hpp +1058 -0
- data/vendor/tomotopy/src/TopicModel/LLDA.h +45 -0
- data/vendor/tomotopy/src/TopicModel/LLDAModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/LLDAModel.hpp +203 -0
- data/vendor/tomotopy/src/TopicModel/MGLDA.h +63 -0
- data/vendor/tomotopy/src/TopicModel/MGLDAModel.cpp +17 -0
- data/vendor/tomotopy/src/TopicModel/MGLDAModel.hpp +558 -0
- data/vendor/tomotopy/src/TopicModel/PA.h +43 -0
- data/vendor/tomotopy/src/TopicModel/PAModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/PAModel.hpp +467 -0
- data/vendor/tomotopy/src/TopicModel/PLDA.h +17 -0
- data/vendor/tomotopy/src/TopicModel/PLDAModel.cpp +13 -0
- data/vendor/tomotopy/src/TopicModel/PLDAModel.hpp +214 -0
- data/vendor/tomotopy/src/TopicModel/SLDA.h +54 -0
- data/vendor/tomotopy/src/TopicModel/SLDAModel.cpp +17 -0
- data/vendor/tomotopy/src/TopicModel/SLDAModel.hpp +456 -0
- data/vendor/tomotopy/src/TopicModel/TopicModel.hpp +692 -0
- data/vendor/tomotopy/src/Utils/AliasMethod.hpp +169 -0
- data/vendor/tomotopy/src/Utils/Dictionary.h +80 -0
- data/vendor/tomotopy/src/Utils/EigenAddonOps.hpp +181 -0
- data/vendor/tomotopy/src/Utils/LBFGS.h +202 -0
- data/vendor/tomotopy/src/Utils/LBFGS/LineSearchBacktracking.h +120 -0
- data/vendor/tomotopy/src/Utils/LBFGS/LineSearchBracketing.h +122 -0
- data/vendor/tomotopy/src/Utils/LBFGS/Param.h +213 -0
- data/vendor/tomotopy/src/Utils/LUT.hpp +82 -0
- data/vendor/tomotopy/src/Utils/MultiNormalDistribution.hpp +69 -0
- data/vendor/tomotopy/src/Utils/PolyaGamma.hpp +200 -0
- data/vendor/tomotopy/src/Utils/PolyaGammaHybrid.hpp +672 -0
- data/vendor/tomotopy/src/Utils/ThreadPool.hpp +150 -0
- data/vendor/tomotopy/src/Utils/Trie.hpp +220 -0
- data/vendor/tomotopy/src/Utils/TruncMultiNormal.hpp +94 -0
- data/vendor/tomotopy/src/Utils/Utils.hpp +337 -0
- data/vendor/tomotopy/src/Utils/avx_gamma.h +46 -0
- data/vendor/tomotopy/src/Utils/avx_mathfun.h +736 -0
- data/vendor/tomotopy/src/Utils/exception.h +28 -0
- data/vendor/tomotopy/src/Utils/math.h +281 -0
- data/vendor/tomotopy/src/Utils/rtnorm.hpp +2690 -0
- data/vendor/tomotopy/src/Utils/sample.hpp +192 -0
- data/vendor/tomotopy/src/Utils/serializer.hpp +695 -0
- data/vendor/tomotopy/src/Utils/slp.hpp +131 -0
- data/vendor/tomotopy/src/Utils/sse_gamma.h +48 -0
- data/vendor/tomotopy/src/Utils/sse_mathfun.h +710 -0
- data/vendor/tomotopy/src/Utils/text.hpp +49 -0
- data/vendor/tomotopy/src/Utils/tvector.hpp +543 -0
- metadata +531 -0
|
@@ -0,0 +1,273 @@
|
|
|
1
|
+
// This file is part of Eigen, a lightweight C++ template library
|
|
2
|
+
// for linear algebra.
|
|
3
|
+
//
|
|
4
|
+
// Copyright (C) 2008 Gael Guennebaud <gael.guennebaud@inria.fr>
|
|
5
|
+
//
|
|
6
|
+
// This Source Code Form is subject to the terms of the Mozilla
|
|
7
|
+
// Public License v. 2.0. If a copy of the MPL was not distributed
|
|
8
|
+
// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
9
|
+
|
|
10
|
+
#ifndef EIGEN_VISITOR_H
|
|
11
|
+
#define EIGEN_VISITOR_H
|
|
12
|
+
|
|
13
|
+
namespace Eigen {
|
|
14
|
+
|
|
15
|
+
namespace internal {
|
|
16
|
+
|
|
17
|
+
template<typename Visitor, typename Derived, int UnrollCount>
|
|
18
|
+
struct visitor_impl
|
|
19
|
+
{
|
|
20
|
+
enum {
|
|
21
|
+
col = (UnrollCount-1) / Derived::RowsAtCompileTime,
|
|
22
|
+
row = (UnrollCount-1) % Derived::RowsAtCompileTime
|
|
23
|
+
};
|
|
24
|
+
|
|
25
|
+
EIGEN_DEVICE_FUNC
|
|
26
|
+
static inline void run(const Derived &mat, Visitor& visitor)
|
|
27
|
+
{
|
|
28
|
+
visitor_impl<Visitor, Derived, UnrollCount-1>::run(mat, visitor);
|
|
29
|
+
visitor(mat.coeff(row, col), row, col);
|
|
30
|
+
}
|
|
31
|
+
};
|
|
32
|
+
|
|
33
|
+
template<typename Visitor, typename Derived>
|
|
34
|
+
struct visitor_impl<Visitor, Derived, 1>
|
|
35
|
+
{
|
|
36
|
+
EIGEN_DEVICE_FUNC
|
|
37
|
+
static inline void run(const Derived &mat, Visitor& visitor)
|
|
38
|
+
{
|
|
39
|
+
return visitor.init(mat.coeff(0, 0), 0, 0);
|
|
40
|
+
}
|
|
41
|
+
};
|
|
42
|
+
|
|
43
|
+
template<typename Visitor, typename Derived>
|
|
44
|
+
struct visitor_impl<Visitor, Derived, Dynamic>
|
|
45
|
+
{
|
|
46
|
+
EIGEN_DEVICE_FUNC
|
|
47
|
+
static inline void run(const Derived& mat, Visitor& visitor)
|
|
48
|
+
{
|
|
49
|
+
visitor.init(mat.coeff(0,0), 0, 0);
|
|
50
|
+
for(Index i = 1; i < mat.rows(); ++i)
|
|
51
|
+
visitor(mat.coeff(i, 0), i, 0);
|
|
52
|
+
for(Index j = 1; j < mat.cols(); ++j)
|
|
53
|
+
for(Index i = 0; i < mat.rows(); ++i)
|
|
54
|
+
visitor(mat.coeff(i, j), i, j);
|
|
55
|
+
}
|
|
56
|
+
};
|
|
57
|
+
|
|
58
|
+
// evaluator adaptor
|
|
59
|
+
template<typename XprType>
|
|
60
|
+
class visitor_evaluator
|
|
61
|
+
{
|
|
62
|
+
public:
|
|
63
|
+
EIGEN_DEVICE_FUNC
|
|
64
|
+
explicit visitor_evaluator(const XprType &xpr) : m_evaluator(xpr), m_xpr(xpr) {}
|
|
65
|
+
|
|
66
|
+
typedef typename XprType::Scalar Scalar;
|
|
67
|
+
typedef typename XprType::CoeffReturnType CoeffReturnType;
|
|
68
|
+
|
|
69
|
+
enum {
|
|
70
|
+
RowsAtCompileTime = XprType::RowsAtCompileTime,
|
|
71
|
+
CoeffReadCost = internal::evaluator<XprType>::CoeffReadCost
|
|
72
|
+
};
|
|
73
|
+
|
|
74
|
+
EIGEN_DEVICE_FUNC Index rows() const { return m_xpr.rows(); }
|
|
75
|
+
EIGEN_DEVICE_FUNC Index cols() const { return m_xpr.cols(); }
|
|
76
|
+
EIGEN_DEVICE_FUNC Index size() const { return m_xpr.size(); }
|
|
77
|
+
|
|
78
|
+
EIGEN_DEVICE_FUNC CoeffReturnType coeff(Index row, Index col) const
|
|
79
|
+
{ return m_evaluator.coeff(row, col); }
|
|
80
|
+
|
|
81
|
+
protected:
|
|
82
|
+
internal::evaluator<XprType> m_evaluator;
|
|
83
|
+
const XprType &m_xpr;
|
|
84
|
+
};
|
|
85
|
+
} // end namespace internal
|
|
86
|
+
|
|
87
|
+
/** Applies the visitor \a visitor to the whole coefficients of the matrix or vector.
|
|
88
|
+
*
|
|
89
|
+
* The template parameter \a Visitor is the type of the visitor and provides the following interface:
|
|
90
|
+
* \code
|
|
91
|
+
* struct MyVisitor {
|
|
92
|
+
* // called for the first coefficient
|
|
93
|
+
* void init(const Scalar& value, Index i, Index j);
|
|
94
|
+
* // called for all other coefficients
|
|
95
|
+
* void operator() (const Scalar& value, Index i, Index j);
|
|
96
|
+
* };
|
|
97
|
+
* \endcode
|
|
98
|
+
*
|
|
99
|
+
* \note compared to one or two \em for \em loops, visitors offer automatic
|
|
100
|
+
* unrolling for small fixed size matrix.
|
|
101
|
+
*
|
|
102
|
+
* \sa minCoeff(Index*,Index*), maxCoeff(Index*,Index*), DenseBase::redux()
|
|
103
|
+
*/
|
|
104
|
+
template<typename Derived>
|
|
105
|
+
template<typename Visitor>
|
|
106
|
+
EIGEN_DEVICE_FUNC
|
|
107
|
+
void DenseBase<Derived>::visit(Visitor& visitor) const
|
|
108
|
+
{
|
|
109
|
+
typedef typename internal::visitor_evaluator<Derived> ThisEvaluator;
|
|
110
|
+
ThisEvaluator thisEval(derived());
|
|
111
|
+
|
|
112
|
+
enum {
|
|
113
|
+
unroll = SizeAtCompileTime != Dynamic
|
|
114
|
+
&& SizeAtCompileTime * ThisEvaluator::CoeffReadCost + (SizeAtCompileTime-1) * internal::functor_traits<Visitor>::Cost <= EIGEN_UNROLLING_LIMIT
|
|
115
|
+
};
|
|
116
|
+
return internal::visitor_impl<Visitor, ThisEvaluator, unroll ? int(SizeAtCompileTime) : Dynamic>::run(thisEval, visitor);
|
|
117
|
+
}
|
|
118
|
+
|
|
119
|
+
namespace internal {
|
|
120
|
+
|
|
121
|
+
/** \internal
|
|
122
|
+
* \brief Base class to implement min and max visitors
|
|
123
|
+
*/
|
|
124
|
+
template <typename Derived>
|
|
125
|
+
struct coeff_visitor
|
|
126
|
+
{
|
|
127
|
+
typedef typename Derived::Scalar Scalar;
|
|
128
|
+
Index row, col;
|
|
129
|
+
Scalar res;
|
|
130
|
+
EIGEN_DEVICE_FUNC
|
|
131
|
+
inline void init(const Scalar& value, Index i, Index j)
|
|
132
|
+
{
|
|
133
|
+
res = value;
|
|
134
|
+
row = i;
|
|
135
|
+
col = j;
|
|
136
|
+
}
|
|
137
|
+
};
|
|
138
|
+
|
|
139
|
+
/** \internal
|
|
140
|
+
* \brief Visitor computing the min coefficient with its value and coordinates
|
|
141
|
+
*
|
|
142
|
+
* \sa DenseBase::minCoeff(Index*, Index*)
|
|
143
|
+
*/
|
|
144
|
+
template <typename Derived>
|
|
145
|
+
struct min_coeff_visitor : coeff_visitor<Derived>
|
|
146
|
+
{
|
|
147
|
+
typedef typename Derived::Scalar Scalar;
|
|
148
|
+
EIGEN_DEVICE_FUNC
|
|
149
|
+
void operator() (const Scalar& value, Index i, Index j)
|
|
150
|
+
{
|
|
151
|
+
if(value < this->res)
|
|
152
|
+
{
|
|
153
|
+
this->res = value;
|
|
154
|
+
this->row = i;
|
|
155
|
+
this->col = j;
|
|
156
|
+
}
|
|
157
|
+
}
|
|
158
|
+
};
|
|
159
|
+
|
|
160
|
+
template<typename Scalar>
|
|
161
|
+
struct functor_traits<min_coeff_visitor<Scalar> > {
|
|
162
|
+
enum {
|
|
163
|
+
Cost = NumTraits<Scalar>::AddCost
|
|
164
|
+
};
|
|
165
|
+
};
|
|
166
|
+
|
|
167
|
+
/** \internal
|
|
168
|
+
* \brief Visitor computing the max coefficient with its value and coordinates
|
|
169
|
+
*
|
|
170
|
+
* \sa DenseBase::maxCoeff(Index*, Index*)
|
|
171
|
+
*/
|
|
172
|
+
template <typename Derived>
|
|
173
|
+
struct max_coeff_visitor : coeff_visitor<Derived>
|
|
174
|
+
{
|
|
175
|
+
typedef typename Derived::Scalar Scalar;
|
|
176
|
+
EIGEN_DEVICE_FUNC
|
|
177
|
+
void operator() (const Scalar& value, Index i, Index j)
|
|
178
|
+
{
|
|
179
|
+
if(value > this->res)
|
|
180
|
+
{
|
|
181
|
+
this->res = value;
|
|
182
|
+
this->row = i;
|
|
183
|
+
this->col = j;
|
|
184
|
+
}
|
|
185
|
+
}
|
|
186
|
+
};
|
|
187
|
+
|
|
188
|
+
template<typename Scalar>
|
|
189
|
+
struct functor_traits<max_coeff_visitor<Scalar> > {
|
|
190
|
+
enum {
|
|
191
|
+
Cost = NumTraits<Scalar>::AddCost
|
|
192
|
+
};
|
|
193
|
+
};
|
|
194
|
+
|
|
195
|
+
} // end namespace internal
|
|
196
|
+
|
|
197
|
+
/** \fn DenseBase<Derived>::minCoeff(IndexType* rowId, IndexType* colId) const
|
|
198
|
+
* \returns the minimum of all coefficients of *this and puts in *row and *col its location.
|
|
199
|
+
* \warning the result is undefined if \c *this contains NaN.
|
|
200
|
+
*
|
|
201
|
+
* \sa DenseBase::minCoeff(Index*), DenseBase::maxCoeff(Index*,Index*), DenseBase::visit(), DenseBase::minCoeff()
|
|
202
|
+
*/
|
|
203
|
+
template<typename Derived>
|
|
204
|
+
template<typename IndexType>
|
|
205
|
+
EIGEN_DEVICE_FUNC
|
|
206
|
+
typename internal::traits<Derived>::Scalar
|
|
207
|
+
DenseBase<Derived>::minCoeff(IndexType* rowId, IndexType* colId) const
|
|
208
|
+
{
|
|
209
|
+
internal::min_coeff_visitor<Derived> minVisitor;
|
|
210
|
+
this->visit(minVisitor);
|
|
211
|
+
*rowId = minVisitor.row;
|
|
212
|
+
if (colId) *colId = minVisitor.col;
|
|
213
|
+
return minVisitor.res;
|
|
214
|
+
}
|
|
215
|
+
|
|
216
|
+
/** \returns the minimum of all coefficients of *this and puts in *index its location.
|
|
217
|
+
* \warning the result is undefined if \c *this contains NaN.
|
|
218
|
+
*
|
|
219
|
+
* \sa DenseBase::minCoeff(IndexType*,IndexType*), DenseBase::maxCoeff(IndexType*,IndexType*), DenseBase::visit(), DenseBase::minCoeff()
|
|
220
|
+
*/
|
|
221
|
+
template<typename Derived>
|
|
222
|
+
template<typename IndexType>
|
|
223
|
+
EIGEN_DEVICE_FUNC
|
|
224
|
+
typename internal::traits<Derived>::Scalar
|
|
225
|
+
DenseBase<Derived>::minCoeff(IndexType* index) const
|
|
226
|
+
{
|
|
227
|
+
EIGEN_STATIC_ASSERT_VECTOR_ONLY(Derived)
|
|
228
|
+
internal::min_coeff_visitor<Derived> minVisitor;
|
|
229
|
+
this->visit(minVisitor);
|
|
230
|
+
*index = IndexType((RowsAtCompileTime==1) ? minVisitor.col : minVisitor.row);
|
|
231
|
+
return minVisitor.res;
|
|
232
|
+
}
|
|
233
|
+
|
|
234
|
+
/** \fn DenseBase<Derived>::maxCoeff(IndexType* rowId, IndexType* colId) const
|
|
235
|
+
* \returns the maximum of all coefficients of *this and puts in *row and *col its location.
|
|
236
|
+
* \warning the result is undefined if \c *this contains NaN.
|
|
237
|
+
*
|
|
238
|
+
* \sa DenseBase::minCoeff(IndexType*,IndexType*), DenseBase::visit(), DenseBase::maxCoeff()
|
|
239
|
+
*/
|
|
240
|
+
template<typename Derived>
|
|
241
|
+
template<typename IndexType>
|
|
242
|
+
EIGEN_DEVICE_FUNC
|
|
243
|
+
typename internal::traits<Derived>::Scalar
|
|
244
|
+
DenseBase<Derived>::maxCoeff(IndexType* rowPtr, IndexType* colPtr) const
|
|
245
|
+
{
|
|
246
|
+
internal::max_coeff_visitor<Derived> maxVisitor;
|
|
247
|
+
this->visit(maxVisitor);
|
|
248
|
+
*rowPtr = maxVisitor.row;
|
|
249
|
+
if (colPtr) *colPtr = maxVisitor.col;
|
|
250
|
+
return maxVisitor.res;
|
|
251
|
+
}
|
|
252
|
+
|
|
253
|
+
/** \returns the maximum of all coefficients of *this and puts in *index its location.
|
|
254
|
+
* \warning the result is undefined if \c *this contains NaN.
|
|
255
|
+
*
|
|
256
|
+
* \sa DenseBase::maxCoeff(IndexType*,IndexType*), DenseBase::minCoeff(IndexType*,IndexType*), DenseBase::visitor(), DenseBase::maxCoeff()
|
|
257
|
+
*/
|
|
258
|
+
template<typename Derived>
|
|
259
|
+
template<typename IndexType>
|
|
260
|
+
EIGEN_DEVICE_FUNC
|
|
261
|
+
typename internal::traits<Derived>::Scalar
|
|
262
|
+
DenseBase<Derived>::maxCoeff(IndexType* index) const
|
|
263
|
+
{
|
|
264
|
+
EIGEN_STATIC_ASSERT_VECTOR_ONLY(Derived)
|
|
265
|
+
internal::max_coeff_visitor<Derived> maxVisitor;
|
|
266
|
+
this->visit(maxVisitor);
|
|
267
|
+
*index = (RowsAtCompileTime==1) ? maxVisitor.col : maxVisitor.row;
|
|
268
|
+
return maxVisitor.res;
|
|
269
|
+
}
|
|
270
|
+
|
|
271
|
+
} // end namespace Eigen
|
|
272
|
+
|
|
273
|
+
#endif // EIGEN_VISITOR_H
|
|
@@ -0,0 +1,451 @@
|
|
|
1
|
+
// This file is part of Eigen, a lightweight C++ template library
|
|
2
|
+
// for linear algebra.
|
|
3
|
+
//
|
|
4
|
+
// Copyright (C) 2014 Benoit Steiner (benoit.steiner.goog@gmail.com)
|
|
5
|
+
//
|
|
6
|
+
// This Source Code Form is subject to the terms of the Mozilla
|
|
7
|
+
// Public License v. 2.0. If a copy of the MPL was not distributed
|
|
8
|
+
// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
9
|
+
|
|
10
|
+
#ifndef EIGEN_COMPLEX_AVX_H
|
|
11
|
+
#define EIGEN_COMPLEX_AVX_H
|
|
12
|
+
|
|
13
|
+
namespace Eigen {
|
|
14
|
+
|
|
15
|
+
namespace internal {
|
|
16
|
+
|
|
17
|
+
//---------- float ----------
|
|
18
|
+
struct Packet4cf
|
|
19
|
+
{
|
|
20
|
+
EIGEN_STRONG_INLINE Packet4cf() {}
|
|
21
|
+
EIGEN_STRONG_INLINE explicit Packet4cf(const __m256& a) : v(a) {}
|
|
22
|
+
__m256 v;
|
|
23
|
+
};
|
|
24
|
+
|
|
25
|
+
// Vectorization traits of std::complex<float> for this (AVX) backend.
template<> struct packet_traits<std::complex<float> > : default_packet_traits
{
  typedef Packet4cf type;   // full packet
  typedef Packet2cf half;   // half packet
  enum {
    // General properties.
    Vectorizable    = 1,
    AlignedOnScalar = 1,
    size            = 4,
    HasHalfPacket   = 1,

    // Operations advertised as available.
    HasAdd    = 1,
    HasSub    = 1,
    HasMul    = 1,
    HasDiv    = 1,
    HasNegate = 1,

    // Operations advertised as unavailable.
    HasAbs       = 0,
    HasAbs2      = 0,
    HasMin       = 0,
    HasMax       = 0,
    HasSetLinear = 0
  };
};
|
|
47
|
+
|
|
48
|
+
// Reverse mapping: from the Packet4cf packet type back to its scalar type.
template<> struct unpacket_traits<Packet4cf>
{
  typedef std::complex<float> type;
  typedef Packet2cf half;
  enum {
    size = 4,
    alignment = Aligned32
  };
};
|
|
49
|
+
|
|
50
|
+
// Complex addition is plain lane-wise float addition.
template<> EIGEN_STRONG_INLINE Packet4cf padd<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  return Packet4cf(_mm256_add_ps(a.v, b.v));
}
|
|
51
|
+
// Complex subtraction is plain lane-wise float subtraction.
template<> EIGEN_STRONG_INLINE Packet4cf psub<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  return Packet4cf(_mm256_sub_ps(a.v, b.v));
}
|
|
52
|
+
// Negation: delegates to the pnegate overload for the underlying register.
template<> EIGEN_STRONG_INLINE Packet4cf pnegate(const Packet4cf& a)
{
  return Packet4cf(pnegate(a.v));
}
|
|
56
|
+
// Complex conjugate: XOR with a mask whose sign bit is set in every odd
// (imaginary) float lane and clear in every even (real) lane.
template<> EIGEN_STRONG_INLINE Packet4cf pconj(const Packet4cf& a)
{
  const __m256 imag_sign_bits = _mm256_castsi256_ps(_mm256_setr_epi32(0x00000000,0x80000000,0x00000000,0x80000000,0x00000000,0x80000000,0x00000000,0x80000000));
  return Packet4cf(_mm256_xor_ps(a.v, imag_sign_bits));
}
|
|
61
|
+
|
|
62
|
+
// Complex product (ar + i*ai) * (br + i*bi), four values at a time.
template<> EIGEN_STRONG_INLINE Packet4cf pmul<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  // [ar*br, ar*bi] : real parts of a duplicated into both lanes of each pair.
  const __m256 real_terms = _mm256_mul_ps(_mm256_moveldup_ps(a.v), b.v);
  // [ai*bi, ai*br] : imaginary parts of a duplicated, b with re/im swapped.
  const __m256 imag_terms = _mm256_mul_ps(_mm256_movehdup_ps(a.v), _mm256_permute_ps(b.v, _MM_SHUFFLE(2,3,0,1)));
  // addsub subtracts in even lanes and adds in odd lanes:
  // [ar*br - ai*bi, ar*bi + ai*br].
  return Packet4cf(_mm256_addsub_ps(real_terms, imag_terms));
}
|
|
69
|
+
|
|
70
|
+
// Bitwise AND of the two registers.
template<> EIGEN_STRONG_INLINE Packet4cf pand<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  return Packet4cf(_mm256_and_ps(a.v, b.v));
}
|
|
71
|
+
// Bitwise OR of the two registers.
template<> EIGEN_STRONG_INLINE Packet4cf por<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  return Packet4cf(_mm256_or_ps(a.v, b.v));
}
|
|
72
|
+
// Bitwise XOR of the two registers.
template<> EIGEN_STRONG_INLINE Packet4cf pxor<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  return Packet4cf(_mm256_xor_ps(a.v, b.v));
}
|
|
73
|
+
// Forwards to _mm256_andnot_ps, which computes (~a.v) & b.v.
// NOTE(review): confirm that complementing the FIRST operand is what callers
// of pandnot expect.
template<> EIGEN_STRONG_INLINE Packet4cf pandnot<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  return Packet4cf(_mm256_andnot_ps(a.v, b.v));
}
|
|
74
|
+
|
|
75
|
+
// Aligned load: the complex array is read as a flat float array starting at
// the real part of *from.
template<> EIGEN_STRONG_INLINE Packet4cf pload<Packet4cf>(const std::complex<float>* from)
{
  EIGEN_DEBUG_ALIGNED_LOAD
  return Packet4cf(pload<Packet8f>(&numext::real_ref(*from)));
}
|
|
76
|
+
// Unaligned load: the complex array is read as a flat float array starting at
// the real part of *from.
template<> EIGEN_STRONG_INLINE Packet4cf ploadu<Packet4cf>(const std::complex<float>* from)
{
  EIGEN_DEBUG_UNALIGNED_LOAD
  return Packet4cf(ploadu<Packet8f>(&numext::real_ref(*from)));
}
|
|
77
|
+
|
|
78
|
+
|
|
79
|
+
// Broadcasts one complex<float> to all four slots by viewing its 8 bytes as a
// single double and broadcasting that 64-bit pattern.
template<> EIGEN_STRONG_INLINE Packet4cf pset1<Packet4cf>(const std::complex<float>& from)
{
  const double* as_double = (const double*)(const void*)&from;
  return Packet4cf(_mm256_castpd_ps(_mm256_broadcast_sd(as_double)));
}
|
|
83
|
+
|
|
84
|
+
// Builds the packet from two half-packets: ploaddup<Packet2cf>(from) goes to
// the lower 128 bits and ploaddup<Packet2cf>(from+1) to the upper 128 bits.
template<> EIGEN_STRONG_INLINE Packet4cf ploaddup<Packet4cf>(const std::complex<float>* from)
{
  // FIXME The following might be optimized using _mm256_movedup_pd
  const Packet2cf lower = ploaddup<Packet2cf>(from);
  const Packet2cf upper = ploaddup<Packet2cf>(from+1);
  return Packet4cf(_mm256_insertf128_ps(_mm256_castps128_ps256(lower.v), upper.v, 1));
}
|
|
91
|
+
|
|
92
|
+
// Aligned store: writes the register as flat floats starting at the real part
// of *to.
template<> EIGEN_STRONG_INLINE void pstore<std::complex<float> >(std::complex<float>* to, const Packet4cf& from)
{
  EIGEN_DEBUG_ALIGNED_STORE
  pstore(&numext::real_ref(*to), from.v);
}
|
|
93
|
+
// Unaligned store: writes the register as flat floats starting at the real
// part of *to.
template<> EIGEN_STRONG_INLINE void pstoreu<std::complex<float> >(std::complex<float>* to, const Packet4cf& from)
{
  EIGEN_DEBUG_UNALIGNED_STORE
  pstoreu(&numext::real_ref(*to), from.v);
}
|
|
94
|
+
|
|
95
|
+
// Strided gather of four complex values: from[0], from[stride],
// from[2*stride], from[3*stride].
template<> EIGEN_DEVICE_FUNC inline Packet4cf pgather<std::complex<float>, Packet4cf>(const std::complex<float>* from, Index stride)
{
  const std::complex<float>& c0 = from[0*stride];
  const std::complex<float>& c1 = from[1*stride];
  const std::complex<float>& c2 = from[2*stride];
  const std::complex<float>& c3 = from[3*stride];
  // _mm256_set_ps lists lanes from highest to lowest, hence the reversed order.
  return Packet4cf(_mm256_set_ps(std::imag(c3), std::real(c3),
                                 std::imag(c2), std::real(c2),
                                 std::imag(c1), std::real(c1),
                                 std::imag(c0), std::real(c0)));
}
|
|
102
|
+
|
|
103
|
+
// Strided scatter of four complex values to to[0], to[stride], to[2*stride],
// to[3*stride]. _mm_shuffle_ps(x, x, k) moves element k of x into lane 0, from
// where _mm_cvtss_f32 reads it.
template<> EIGEN_DEVICE_FUNC inline void pscatter<std::complex<float>, Packet4cf>(std::complex<float>* to, const Packet4cf& from, Index stride)
{
  // Lower 128 bits hold complex values 0 and 1.
  const __m128 lower = _mm256_extractf128_ps(from.v, 0);
  to[stride*0] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(lower, lower, 0)),
                                     _mm_cvtss_f32(_mm_shuffle_ps(lower, lower, 1)));
  to[stride*1] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(lower, lower, 2)),
                                     _mm_cvtss_f32(_mm_shuffle_ps(lower, lower, 3)));

  // Upper 128 bits hold complex values 2 and 3.
  const __m128 upper = _mm256_extractf128_ps(from.v, 1);
  to[stride*2] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(upper, upper, 0)),
                                     _mm_cvtss_f32(_mm_shuffle_ps(upper, upper, 1)));
  to[stride*3] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(upper, upper, 2)),
                                     _mm_cvtss_f32(_mm_shuffle_ps(upper, upper, 3)));
}
|
|
118
|
+
|
|
119
|
+
// First complex value: take the lower 128 bits as a Packet2cf and ask it for
// its first element.
template<> EIGEN_STRONG_INLINE std::complex<float> pfirst<Packet4cf>(const Packet4cf& a)
{
  const Packet2cf lower(_mm256_castps256_ps128(a.v));
  return pfirst(lower);
}
|
|
123
|
+
|
|
124
|
+
// Reverses the order of the four complex values. Each complex<float> is
// handled as one 64-bit unit: the two units inside each 128-bit half are
// swapped, then the halves themselves are exchanged.
template<> EIGEN_STRONG_INLINE Packet4cf preverse(const Packet4cf& a) {
  const __m128d lower_units = _mm_castps_pd(_mm256_extractf128_ps(a.v, 0));
  const __m128d upper_units = _mm_castps_pd(_mm256_extractf128_ps(a.v, 1));
  const __m128 lower_swapped = _mm_castpd_ps(_mm_shuffle_pd(lower_units, lower_units, 0x1));
  const __m128 upper_swapped = _mm_castpd_ps(_mm_shuffle_pd(upper_units, upper_units, 0x1));

  __m256 reversed = _mm256_setzero_ps();
  reversed = _mm256_insertf128_ps(reversed, lower_swapped, 1);
  reversed = _mm256_insertf128_ps(reversed, upper_swapped, 0);
  return Packet4cf(reversed);
}
|
|
136
|
+
|
|
137
|
+
// Sum of the four complex values: add the two 128-bit halves, then reduce the
// resulting Packet2cf.
template<> EIGEN_STRONG_INLINE std::complex<float> predux<Packet4cf>(const Packet4cf& a)
{
  const Packet2cf lower(_mm256_extractf128_ps(a.v,0));
  const Packet2cf upper(_mm256_extractf128_ps(a.v,1));
  return predux(padd(lower, upper));
}
|
|
142
|
+
|
|
143
|
+
// Reduces four packets at once: complex slot i of the result is the sum of the
// four complex values held in vecs[i].
template<> EIGEN_STRONG_INLINE Packet4cf preduxp<Packet4cf>(const Packet4cf* vecs)
{
  // Within each 128-bit half, regroup [re0,im0,re1,im1] as [re0,re1,im0,im1]
  // so that a horizontal add pairs real with real and imag with imag.
  const Packet8f grouped0 = _mm256_shuffle_ps(vecs[0].v, vecs[0].v, _MM_SHUFFLE(3, 1, 2 ,0));
  const Packet8f grouped1 = _mm256_shuffle_ps(vecs[1].v, vecs[1].v, _MM_SHUFFLE(3, 1, 2 ,0));
  const Packet8f grouped2 = _mm256_shuffle_ps(vecs[2].v, vecs[2].v, _MM_SHUFFLE(3, 1, 2 ,0));
  const Packet8f grouped3 = _mm256_shuffle_ps(vecs[3].v, vecs[3].v, _MM_SHUFFLE(3, 1, 2 ,0));

  // Per half: partial sums of vecs[0]/vecs[1], resp. vecs[2]/vecs[3].
  const Packet8f partial01 = _mm256_hadd_ps(grouped0, grouped1);
  const Packet8f partial23 = _mm256_hadd_ps(grouped2, grouped3);

  // Collect the lower halves and the upper halves, then add them together.
  const Packet8f lower_halves = _mm256_permute2f128_ps(partial01, partial23, 0 + (2<<4));
  const Packet8f upper_halves = _mm256_permute2f128_ps(partial01, partial23, 1 + (3<<4));

  return Packet4cf(_mm256_add_ps(lower_halves, upper_halves));
}
|
|
157
|
+
|
|
158
|
+
// Product of the four complex values: multiply the two 128-bit halves as
// Packet2cf, then reduce that product.
template<> EIGEN_STRONG_INLINE std::complex<float> predux_mul<Packet4cf>(const Packet4cf& a)
{
  const Packet2cf lower(_mm256_extractf128_ps(a.v, 0));
  const Packet2cf upper(_mm256_extractf128_ps(a.v, 1));
  return predux_mul(pmul(lower, upper));
}
|
|
163
|
+
|
|
164
|
+
template<int Offset>
|
|
165
|
+
struct palign_impl<Offset,Packet4cf>
|
|
166
|
+
{
|
|
167
|
+
static EIGEN_STRONG_INLINE void run(Packet4cf& first, const Packet4cf& second)
|
|
168
|
+
{
|
|
169
|
+
if (Offset==0) return;
|
|
170
|
+
palign_impl<Offset*2,Packet8f>::run(first.v, second.v);
|
|
171
|
+
}
|
|
172
|
+
};
|
|
173
|
+
|
|
174
|
+
template<> struct conj_helper<Packet4cf, Packet4cf, false,true>
|
|
175
|
+
{
|
|
176
|
+
EIGEN_STRONG_INLINE Packet4cf pmadd(const Packet4cf& x, const Packet4cf& y, const Packet4cf& c) const
|
|
177
|
+
{ return padd(pmul(x,y),c); }
|
|
178
|
+
|
|
179
|
+
EIGEN_STRONG_INLINE Packet4cf pmul(const Packet4cf& a, const Packet4cf& b) const
|
|
180
|
+
{
|
|
181
|
+
return internal::pmul(a, pconj(b));
|
|
182
|
+
}
|
|
183
|
+
};
|
|
184
|
+
|
|
185
|
+
template<> struct conj_helper<Packet4cf, Packet4cf, true,false>
|
|
186
|
+
{
|
|
187
|
+
EIGEN_STRONG_INLINE Packet4cf pmadd(const Packet4cf& x, const Packet4cf& y, const Packet4cf& c) const
|
|
188
|
+
{ return padd(pmul(x,y),c); }
|
|
189
|
+
|
|
190
|
+
EIGEN_STRONG_INLINE Packet4cf pmul(const Packet4cf& a, const Packet4cf& b) const
|
|
191
|
+
{
|
|
192
|
+
return internal::pmul(pconj(a), b);
|
|
193
|
+
}
|
|
194
|
+
};
|
|
195
|
+
|
|
196
|
+
template<> struct conj_helper<Packet4cf, Packet4cf, true,true>
|
|
197
|
+
{
|
|
198
|
+
EIGEN_STRONG_INLINE Packet4cf pmadd(const Packet4cf& x, const Packet4cf& y, const Packet4cf& c) const
|
|
199
|
+
{ return padd(pmul(x,y),c); }
|
|
200
|
+
|
|
201
|
+
EIGEN_STRONG_INLINE Packet4cf pmul(const Packet4cf& a, const Packet4cf& b) const
|
|
202
|
+
{
|
|
203
|
+
return pconj(internal::pmul(a, b));
|
|
204
|
+
}
|
|
205
|
+
};
|
|
206
|
+
|
|
207
|
+
// NOTE(review): macro defined elsewhere; presumably emits the conj_helper
// specializations mixing Packet4cf with the real packet Packet8f -- confirm.
EIGEN_MAKE_CONJ_HELPER_CPLX_REAL(Packet4cf,Packet8f)
|
|
208
|
+
|
|
209
|
+
// Complex division a / b computed as (a * conj(b)) / |b|^2.
template<> EIGEN_STRONG_INLINE Packet4cf pdiv<Packet4cf>(const Packet4cf& a, const Packet4cf& b)
{
  const Packet4cf numerator = pmul(a, pconj(b));
  // [br^2, bi^2] per complex value.
  const __m256 squares = _mm256_mul_ps(b.v, b.v);
  // 0xB1 swaps the two floats of every pair: [bi^2, br^2].
  const __m256 squares_swapped = _mm256_shuffle_ps(squares, squares, 0xB1);
  // |b|^2 replicated in both lanes of every pair.
  const __m256 norm2 = _mm256_add_ps(squares, squares_swapped);
  return Packet4cf(_mm256_div_ps(numerator.v, norm2));
}
|
|
217
|
+
|
|
218
|
+
// Swaps the real and imaginary part of every complex value.
template<> EIGEN_STRONG_INLINE Packet4cf pcplxflip<Packet4cf>(const Packet4cf& x)
{
  const __m256 flipped = _mm256_shuffle_ps(x.v, x.v, _MM_SHUFFLE(2, 3, 0 ,1));
  return Packet4cf(flipped);
}
|
|
222
|
+
|
|
223
|
+
//---------- double ----------
|
|
224
|
+
struct Packet2cd
|
|
225
|
+
{
|
|
226
|
+
EIGEN_STRONG_INLINE Packet2cd() {}
|
|
227
|
+
EIGEN_STRONG_INLINE explicit Packet2cd(const __m256d& a) : v(a) {}
|
|
228
|
+
__m256d v;
|
|
229
|
+
};
|
|
230
|
+
|
|
231
|
+
// Vectorization traits of std::complex<double> for this (AVX) backend.
template<> struct packet_traits<std::complex<double> > : default_packet_traits
{
  typedef Packet2cd type;   // full packet
  typedef Packet1cd half;   // half packet
  enum {
    // General properties.
    Vectorizable    = 1,
    AlignedOnScalar = 0,
    size            = 2,
    HasHalfPacket   = 1,

    // Operations advertised as available.
    HasAdd    = 1,
    HasSub    = 1,
    HasMul    = 1,
    HasDiv    = 1,
    HasNegate = 1,

    // Operations advertised as unavailable.
    HasAbs       = 0,
    HasAbs2      = 0,
    HasMin       = 0,
    HasMax       = 0,
    HasSetLinear = 0
  };
};
|
|
253
|
+
|
|
254
|
+
// Reverse mapping: from the Packet2cd packet type back to its scalar type.
template<> struct unpacket_traits<Packet2cd>
{
  typedef std::complex<double> type;
  typedef Packet1cd half;
  enum {
    size = 2,
    alignment = Aligned32
  };
};
|
|
255
|
+
|
|
256
|
+
// Complex addition is plain lane-wise double addition.
template<> EIGEN_STRONG_INLINE Packet2cd padd<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  return Packet2cd(_mm256_add_pd(a.v, b.v));
}
|
|
257
|
+
// Complex subtraction is plain lane-wise double subtraction.
template<> EIGEN_STRONG_INLINE Packet2cd psub<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  return Packet2cd(_mm256_sub_pd(a.v, b.v));
}
|
|
258
|
+
// Negation: delegates to the pnegate overload for the underlying register.
template<> EIGEN_STRONG_INLINE Packet2cd pnegate(const Packet2cd& a)
{
  return Packet2cd(pnegate(a.v));
}
|
|
259
|
+
// Complex conjugate: XOR with a mask that has only the sign bit of each
// imaginary double set. _mm256_set_epi32 lists 32-bit words from highest to
// lowest, so 0x80000000 lands in the top word of doubles 3 and 1.
template<> EIGEN_STRONG_INLINE Packet2cd pconj(const Packet2cd& a)
{
  const __m256d imag_sign_bits = _mm256_castsi256_pd(_mm256_set_epi32(0x80000000,0x0,0x0,0x0,0x80000000,0x0,0x0,0x0));
  return Packet2cd(_mm256_xor_pd(a.v, imag_sign_bits));
}
|
|
264
|
+
|
|
265
|
+
// Complex product (ar + i*ai) * (br + i*bi), two values at a time.
template<> EIGEN_STRONG_INLINE Packet2cd pmul<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  // [ar, ar] per complex value, times b: [ar*br, ar*bi].
  const __m256d a_real = _mm256_shuffle_pd(a.v,a.v,0x0);
  const __m256d real_terms = _mm256_mul_pd(a_real, b.v);
  // [ai, ai] times b with re/im swapped: [ai*bi, ai*br].
  const __m256d a_imag = _mm256_shuffle_pd(a.v,a.v,0xF);
  const __m256d b_flipped = _mm256_shuffle_pd(b.v,b.v,0x5);
  const __m256d imag_terms = _mm256_mul_pd(a_imag, b_flipped);
  // addsub subtracts in even lanes and adds in odd lanes.
  return Packet2cd(_mm256_addsub_pd(real_terms, imag_terms));
}
|
|
274
|
+
|
|
275
|
+
// Bitwise AND of the two registers.
template<> EIGEN_STRONG_INLINE Packet2cd pand<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  return Packet2cd(_mm256_and_pd(a.v, b.v));
}
|
|
276
|
+
// Bitwise OR of the two registers.
template<> EIGEN_STRONG_INLINE Packet2cd por<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  return Packet2cd(_mm256_or_pd(a.v, b.v));
}
|
|
277
|
+
// Bitwise XOR of the two registers.
template<> EIGEN_STRONG_INLINE Packet2cd pxor<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  return Packet2cd(_mm256_xor_pd(a.v, b.v));
}
|
|
278
|
+
// Forwards to _mm256_andnot_pd, which computes (~a.v) & b.v.
// NOTE(review): confirm that complementing the FIRST operand is what callers
// of pandnot expect.
template<> EIGEN_STRONG_INLINE Packet2cd pandnot<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  return Packet2cd(_mm256_andnot_pd(a.v, b.v));
}
|
|
279
|
+
|
|
280
|
+
// Aligned load: the complex array is read as a flat array of doubles.
template<> EIGEN_STRONG_INLINE Packet2cd pload<Packet2cd>(const std::complex<double>* from)
{
  EIGEN_DEBUG_ALIGNED_LOAD
  return Packet2cd(pload<Packet4d>((const double*)from));
}
|
|
282
|
+
// Unaligned load: the complex array is read as a flat array of doubles.
template<> EIGEN_STRONG_INLINE Packet2cd ploadu<Packet2cd>(const std::complex<double>* from)
{
  EIGEN_DEBUG_UNALIGNED_LOAD
  return Packet2cd(ploadu<Packet4d>((const double*)from));
}
|
|
284
|
+
|
|
285
|
+
// Broadcasts one complex<double> (16 bytes) to both 128-bit halves.
template<> EIGEN_STRONG_INLINE Packet2cd pset1<Packet2cd>(const std::complex<double>& from)
{
  // The address of 'from' is reinterpreted as a __m128d*. Should that cast turn
  // out to be unsafe, a (much slower) fallback is:
  //   return Packet2cd(_mm256_loadu2_m128d((const double*)&from,(const double*)&from));
  const __m128d* as_m128d = (const __m128d*)(const void*)&from;
  return Packet2cd(_mm256_broadcast_pd(as_m128d));
}
|
|
291
|
+
|
|
292
|
+
// With two slots per packet, duplicating the first element is the same as
// broadcasting *from.
template<> EIGEN_STRONG_INLINE Packet2cd ploaddup<Packet2cd>(const std::complex<double>* from)
{
  return pset1<Packet2cd>(*from);
}
|
|
293
|
+
|
|
294
|
+
// Aligned store: writes the register as a flat array of doubles.
template<> EIGEN_STRONG_INLINE void pstore<std::complex<double> >(std::complex<double> * to, const Packet2cd& from)
{
  EIGEN_DEBUG_ALIGNED_STORE
  pstore((double*)to, from.v);
}
|
|
295
|
+
// Unaligned store: writes the register as a flat array of doubles.
template<> EIGEN_STRONG_INLINE void pstoreu<std::complex<double> >(std::complex<double> * to, const Packet2cd& from)
{
  EIGEN_DEBUG_UNALIGNED_STORE
  pstoreu((double*)to, from.v);
}
|
|
296
|
+
|
|
297
|
+
// Strided gather of two complex values: from[0] and from[stride].
template<> EIGEN_DEVICE_FUNC inline Packet2cd pgather<std::complex<double>, Packet2cd>(const std::complex<double>* from, Index stride)
{
  const std::complex<double>& c0 = from[0*stride];
  const std::complex<double>& c1 = from[1*stride];
  // _mm256_set_pd lists lanes from highest to lowest, hence the reversed order.
  return Packet2cd(_mm256_set_pd(std::imag(c1), std::real(c1),
                                 std::imag(c0), std::real(c0)));
}
|
|
302
|
+
|
|
303
|
+
// Strided scatter of two complex values to to[0] and to[stride].
// _mm_cvtsd_f64 reads lane 0; shuffling with immediate 1 brings lane 1 there.
template<> EIGEN_DEVICE_FUNC inline void pscatter<std::complex<double>, Packet2cd>(std::complex<double>* to, const Packet2cd& from, Index stride)
{
  const __m128d first = _mm256_extractf128_pd(from.v, 0);
  to[stride*0] = std::complex<double>(_mm_cvtsd_f64(first), _mm_cvtsd_f64(_mm_shuffle_pd(first, first, 1)));

  const __m128d second = _mm256_extractf128_pd(from.v, 1);
  to[stride*1] = std::complex<double>(_mm_cvtsd_f64(second), _mm_cvtsd_f64(_mm_shuffle_pd(second, second, 1)));
}
|
|
310
|
+
|
|
311
|
+
// First complex value: spill the lower 128 bits to a 16-byte aligned buffer
// and rebuild the complex number from its two doubles.
template<> EIGEN_STRONG_INLINE std::complex<double> pfirst<Packet2cd>(const Packet2cd& a)
{
  EIGEN_ALIGN16 double parts[2];
  _mm_store_pd(parts, _mm256_extractf128_pd(a.v, 0));
  return std::complex<double>(parts[0], parts[1]);
}
|
|
318
|
+
|
|
319
|
+
// Reverses the two complex values by exchanging the 128-bit halves.
template<> EIGEN_STRONG_INLINE Packet2cd preverse(const Packet2cd& a) {
  return Packet2cd(_mm256_permute2f128_pd(a.v, a.v, 1));
}
|
|
323
|
+
|
|
324
|
+
// Sum of the two complex values: add the two 128-bit halves as Packet1cd,
// then reduce the result.
template<> EIGEN_STRONG_INLINE std::complex<double> predux<Packet2cd>(const Packet2cd& a)
{
  const Packet1cd lower(_mm256_extractf128_pd(a.v,0));
  const Packet1cd upper(_mm256_extractf128_pd(a.v,1));
  return predux(padd(lower, upper));
}
|
|
329
|
+
|
|
330
|
+
// Reduces two packets at once: complex slot i of the result is the sum of the
// two complex values held in vecs[i].
template<> EIGEN_STRONG_INLINE Packet2cd preduxp<Packet2cd>(const Packet2cd* vecs)
{
  // [vecs[0] lower half, vecs[1] lower half]
  const Packet4d lower_halves = _mm256_permute2f128_pd(vecs[0].v,vecs[1].v, 0 + (2<<4));
  // [vecs[0] upper half, vecs[1] upper half]
  const Packet4d upper_halves = _mm256_permute2f128_pd(vecs[0].v,vecs[1].v, 1 + (3<<4));

  return Packet2cd(_mm256_add_pd(lower_halves, upper_halves));
}
|
|
337
|
+
|
|
338
|
+
// Product of the two complex values: multiply the two 128-bit halves as
// Packet1cd and pass the single-value product through predux.
template<> EIGEN_STRONG_INLINE std::complex<double> predux_mul<Packet2cd>(const Packet2cd& a)
{
  const Packet1cd lower(_mm256_extractf128_pd(a.v,0));
  const Packet1cd upper(_mm256_extractf128_pd(a.v,1));
  return predux(pmul(lower, upper));
}
|
|
343
|
+
|
|
344
|
+
template<int Offset>
|
|
345
|
+
struct palign_impl<Offset,Packet2cd>
|
|
346
|
+
{
|
|
347
|
+
static EIGEN_STRONG_INLINE void run(Packet2cd& first, const Packet2cd& second)
|
|
348
|
+
{
|
|
349
|
+
if (Offset==0) return;
|
|
350
|
+
palign_impl<Offset*2,Packet4d>::run(first.v, second.v);
|
|
351
|
+
}
|
|
352
|
+
};
|
|
353
|
+
|
|
354
|
+
template<> struct conj_helper<Packet2cd, Packet2cd, false,true>
|
|
355
|
+
{
|
|
356
|
+
EIGEN_STRONG_INLINE Packet2cd pmadd(const Packet2cd& x, const Packet2cd& y, const Packet2cd& c) const
|
|
357
|
+
{ return padd(pmul(x,y),c); }
|
|
358
|
+
|
|
359
|
+
EIGEN_STRONG_INLINE Packet2cd pmul(const Packet2cd& a, const Packet2cd& b) const
|
|
360
|
+
{
|
|
361
|
+
return internal::pmul(a, pconj(b));
|
|
362
|
+
}
|
|
363
|
+
};
|
|
364
|
+
|
|
365
|
+
template<> struct conj_helper<Packet2cd, Packet2cd, true,false>
|
|
366
|
+
{
|
|
367
|
+
EIGEN_STRONG_INLINE Packet2cd pmadd(const Packet2cd& x, const Packet2cd& y, const Packet2cd& c) const
|
|
368
|
+
{ return padd(pmul(x,y),c); }
|
|
369
|
+
|
|
370
|
+
EIGEN_STRONG_INLINE Packet2cd pmul(const Packet2cd& a, const Packet2cd& b) const
|
|
371
|
+
{
|
|
372
|
+
return internal::pmul(pconj(a), b);
|
|
373
|
+
}
|
|
374
|
+
};
|
|
375
|
+
|
|
376
|
+
template<> struct conj_helper<Packet2cd, Packet2cd, true,true>
|
|
377
|
+
{
|
|
378
|
+
EIGEN_STRONG_INLINE Packet2cd pmadd(const Packet2cd& x, const Packet2cd& y, const Packet2cd& c) const
|
|
379
|
+
{ return padd(pmul(x,y),c); }
|
|
380
|
+
|
|
381
|
+
EIGEN_STRONG_INLINE Packet2cd pmul(const Packet2cd& a, const Packet2cd& b) const
|
|
382
|
+
{
|
|
383
|
+
return pconj(internal::pmul(a, b));
|
|
384
|
+
}
|
|
385
|
+
};
|
|
386
|
+
|
|
387
|
+
// NOTE(review): macro defined elsewhere; presumably emits the conj_helper
// specializations mixing Packet2cd with the real packet Packet4d -- confirm.
EIGEN_MAKE_CONJ_HELPER_CPLX_REAL(Packet2cd,Packet4d)
|
|
388
|
+
|
|
389
|
+
// Complex division a / b computed as (a * conj(b)) / |b|^2.
template<> EIGEN_STRONG_INLINE Packet2cd pdiv<Packet2cd>(const Packet2cd& a, const Packet2cd& b)
{
  const Packet2cd numerator = pmul(a, pconj(b));
  // [br^2, bi^2] per complex value.
  const __m256d squares = _mm256_mul_pd(b.v, b.v);
  // Horizontal add of the register with itself: |b|^2 in both lanes of a pair.
  const __m256d norm2 = _mm256_hadd_pd(squares, squares);
  return Packet2cd(_mm256_div_pd(numerator.v, norm2));
}
|
|
396
|
+
|
|
397
|
+
// Swaps the real and imaginary part of every complex value.
template<> EIGEN_STRONG_INLINE Packet2cd pcplxflip<Packet2cd>(const Packet2cd& x)
{
  const __m256d flipped = _mm256_shuffle_pd(x.v, x.v, 0x5);
  return Packet2cd(flipped);
}
|
|
401
|
+
|
|
402
|
+
// In-place transpose of a 4x4 block of complex<float>. Every complex value is
// moved as one 64-bit unit, so the work is done on the registers viewed as
// four doubles each.
EIGEN_DEVICE_FUNC inline void
ptranspose(PacketBlock<Packet4cf,4>& kernel) {
  const __m256d row0 = _mm256_castps_pd(kernel.packet[0].v);
  const __m256d row1 = _mm256_castps_pd(kernel.packet[1].v);
  const __m256d row2 = _mm256_castps_pd(kernel.packet[2].v);
  const __m256d row3 = _mm256_castps_pd(kernel.packet[3].v);

  // Interleave pairs of rows: immediate 0 picks the even units of each
  // 128-bit half, immediate 15 picks the odd units.
  const __m256d even01 = _mm256_shuffle_pd(row0, row1, 0);
  const __m256d odd01  = _mm256_shuffle_pd(row0, row1, 15);
  const __m256d even23 = _mm256_shuffle_pd(row2, row3, 0);
  const __m256d odd23  = _mm256_shuffle_pd(row2, row3, 15);

  // 32 joins the lower halves of both operands, 49 joins the upper halves.
  kernel.packet[0].v = _mm256_castpd_ps(_mm256_permute2f128_pd(even01, even23, 32));
  kernel.packet[1].v = _mm256_castpd_ps(_mm256_permute2f128_pd(odd01, odd23, 32));
  kernel.packet[2].v = _mm256_castpd_ps(_mm256_permute2f128_pd(even01, even23, 49));
  kernel.packet[3].v = _mm256_castpd_ps(_mm256_permute2f128_pd(odd01, odd23, 49));
}
|
|
419
|
+
|
|
420
|
+
// In-place transpose of a 2x2 block of complex<double>: the new first packet
// joins the lower halves of both inputs, the new second packet the upper halves.
EIGEN_DEVICE_FUNC inline void
ptranspose(PacketBlock<Packet2cd,2>& kernel) {
  // Compute both results from the untouched inputs before writing anything back.
  const __m256d lower_halves = _mm256_permute2f128_pd(kernel.packet[0].v, kernel.packet[1].v, 0+(2<<4));
  const __m256d upper_halves = _mm256_permute2f128_pd(kernel.packet[0].v, kernel.packet[1].v, 1+(3<<4));
  kernel.packet[0].v = lower_halves;
  kernel.packet[1].v = upper_halves;
}
|
|
426
|
+
|
|
427
|
+
// Returns a copy of a whose first complex value is replaced by b.
template<> EIGEN_STRONG_INLINE Packet4cf pinsertfirst(const Packet4cf& a, std::complex<float> b)
{
  const Packet4cf broadcast = pset1<Packet4cf>(b);
  // Blend mask bits 0 and 1 take float lanes 0 and 1 from the broadcast.
  return Packet4cf(_mm256_blend_ps(a.v, broadcast.v, 1|2));
}
|
|
431
|
+
|
|
432
|
+
// Returns a copy of a whose first complex value is replaced by b.
template<> EIGEN_STRONG_INLINE Packet2cd pinsertfirst(const Packet2cd& a, std::complex<double> b)
{
  const Packet2cd broadcast = pset1<Packet2cd>(b);
  // Blend mask bits 0 and 1 take double lanes 0 and 1 from the broadcast.
  return Packet2cd(_mm256_blend_pd(a.v, broadcast.v, 1|2));
}
|
|
436
|
+
|
|
437
|
+
// Returns a copy of a whose last complex value is replaced by b.
template<> EIGEN_STRONG_INLINE Packet4cf pinsertlast(const Packet4cf& a, std::complex<float> b)
{
  const Packet4cf broadcast = pset1<Packet4cf>(b);
  // Blend mask bits 6 and 7 take float lanes 6 and 7 from the broadcast.
  return Packet4cf(_mm256_blend_ps(a.v, broadcast.v, (1<<7)|(1<<6)));
}
|
|
441
|
+
|
|
442
|
+
// Returns a copy of a whose last complex value is replaced by b.
template<> EIGEN_STRONG_INLINE Packet2cd pinsertlast(const Packet2cd& a, std::complex<double> b)
{
  const Packet2cd broadcast = pset1<Packet2cd>(b);
  // Blend mask bits 2 and 3 take double lanes 2 and 3 from the broadcast.
  return Packet2cd(_mm256_blend_pd(a.v, broadcast.v, (1<<3)|(1<<2)));
}
|
|
446
|
+
|
|
447
|
+
} // end namespace internal
|
|
448
|
+
|
|
449
|
+
} // end namespace Eigen
|
|
450
|
+
|
|
451
|
+
#endif // EIGEN_COMPLEX_AVX_H
|