RubyGems - tomoto - Versions diffs - 0.1.0 - Mend

tomoto 0.1.0

Files changed (420) hide show

checksums.yaml +7 -0
data/CHANGELOG.md +3 -0
data/LICENSE.txt +22 -0
data/README.md +123 -0
data/ext/tomoto/ext.cpp +245 -0
data/ext/tomoto/extconf.rb +28 -0
data/lib/tomoto.rb +12 -0
data/lib/tomoto/ct.rb +11 -0
data/lib/tomoto/hdp.rb +11 -0
data/lib/tomoto/lda.rb +67 -0
data/lib/tomoto/version.rb +3 -0
data/vendor/EigenRand/EigenRand/Core.h +1139 -0
data/vendor/EigenRand/EigenRand/Dists/Basic.h +111 -0
data/vendor/EigenRand/EigenRand/Dists/Discrete.h +877 -0
data/vendor/EigenRand/EigenRand/Dists/GammaPoisson.h +108 -0
data/vendor/EigenRand/EigenRand/Dists/NormalExp.h +626 -0
data/vendor/EigenRand/EigenRand/EigenRand +19 -0
data/vendor/EigenRand/EigenRand/Macro.h +24 -0
data/vendor/EigenRand/EigenRand/MorePacketMath.h +978 -0
data/vendor/EigenRand/EigenRand/PacketFilter.h +286 -0
data/vendor/EigenRand/EigenRand/PacketRandomEngine.h +624 -0
data/vendor/EigenRand/EigenRand/RandUtils.h +413 -0
data/vendor/EigenRand/EigenRand/doc.h +220 -0
data/vendor/EigenRand/LICENSE +21 -0
data/vendor/EigenRand/README.md +288 -0
data/vendor/eigen/COPYING.BSD +26 -0
data/vendor/eigen/COPYING.GPL +674 -0
data/vendor/eigen/COPYING.LGPL +502 -0
data/vendor/eigen/COPYING.MINPACK +52 -0
data/vendor/eigen/COPYING.MPL2 +373 -0
data/vendor/eigen/COPYING.README +18 -0
data/vendor/eigen/Eigen/CMakeLists.txt +19 -0
data/vendor/eigen/Eigen/Cholesky +46 -0
data/vendor/eigen/Eigen/CholmodSupport +48 -0
data/vendor/eigen/Eigen/Core +537 -0
data/vendor/eigen/Eigen/Dense +7 -0
data/vendor/eigen/Eigen/Eigen +2 -0
data/vendor/eigen/Eigen/Eigenvalues +61 -0
data/vendor/eigen/Eigen/Geometry +62 -0
data/vendor/eigen/Eigen/Householder +30 -0
data/vendor/eigen/Eigen/IterativeLinearSolvers +48 -0
data/vendor/eigen/Eigen/Jacobi +33 -0
data/vendor/eigen/Eigen/LU +50 -0
data/vendor/eigen/Eigen/MetisSupport +35 -0
data/vendor/eigen/Eigen/OrderingMethods +73 -0
data/vendor/eigen/Eigen/PaStiXSupport +48 -0
data/vendor/eigen/Eigen/PardisoSupport +35 -0
data/vendor/eigen/Eigen/QR +51 -0
data/vendor/eigen/Eigen/QtAlignedMalloc +40 -0
data/vendor/eigen/Eigen/SPQRSupport +34 -0
data/vendor/eigen/Eigen/SVD +51 -0
data/vendor/eigen/Eigen/Sparse +36 -0
data/vendor/eigen/Eigen/SparseCholesky +45 -0
data/vendor/eigen/Eigen/SparseCore +69 -0
data/vendor/eigen/Eigen/SparseLU +46 -0
data/vendor/eigen/Eigen/SparseQR +37 -0
data/vendor/eigen/Eigen/StdDeque +27 -0
data/vendor/eigen/Eigen/StdList +26 -0
data/vendor/eigen/Eigen/StdVector +27 -0
data/vendor/eigen/Eigen/SuperLUSupport +64 -0
data/vendor/eigen/Eigen/UmfPackSupport +40 -0
data/vendor/eigen/Eigen/src/Cholesky/LDLT.h +673 -0
data/vendor/eigen/Eigen/src/Cholesky/LLT.h +542 -0
data/vendor/eigen/Eigen/src/Cholesky/LLT_LAPACKE.h +99 -0
data/vendor/eigen/Eigen/src/CholmodSupport/CholmodSupport.h +639 -0
data/vendor/eigen/Eigen/src/Core/Array.h +329 -0
data/vendor/eigen/Eigen/src/Core/ArrayBase.h +226 -0
data/vendor/eigen/Eigen/src/Core/ArrayWrapper.h +209 -0
data/vendor/eigen/Eigen/src/Core/Assign.h +90 -0
data/vendor/eigen/Eigen/src/Core/AssignEvaluator.h +935 -0
data/vendor/eigen/Eigen/src/Core/Assign_MKL.h +178 -0
data/vendor/eigen/Eigen/src/Core/BandMatrix.h +353 -0
data/vendor/eigen/Eigen/src/Core/Block.h +452 -0
data/vendor/eigen/Eigen/src/Core/BooleanRedux.h +164 -0
data/vendor/eigen/Eigen/src/Core/CommaInitializer.h +160 -0
data/vendor/eigen/Eigen/src/Core/ConditionEstimator.h +175 -0
data/vendor/eigen/Eigen/src/Core/CoreEvaluators.h +1688 -0
data/vendor/eigen/Eigen/src/Core/CoreIterators.h +127 -0
data/vendor/eigen/Eigen/src/Core/CwiseBinaryOp.h +184 -0
data/vendor/eigen/Eigen/src/Core/CwiseNullaryOp.h +866 -0
data/vendor/eigen/Eigen/src/Core/CwiseTernaryOp.h +197 -0
data/vendor/eigen/Eigen/src/Core/CwiseUnaryOp.h +103 -0
data/vendor/eigen/Eigen/src/Core/CwiseUnaryView.h +128 -0
data/vendor/eigen/Eigen/src/Core/DenseBase.h +611 -0
data/vendor/eigen/Eigen/src/Core/DenseCoeffsBase.h +681 -0
data/vendor/eigen/Eigen/src/Core/DenseStorage.h +570 -0
data/vendor/eigen/Eigen/src/Core/Diagonal.h +260 -0
data/vendor/eigen/Eigen/src/Core/DiagonalMatrix.h +343 -0
data/vendor/eigen/Eigen/src/Core/DiagonalProduct.h +28 -0
data/vendor/eigen/Eigen/src/Core/Dot.h +318 -0
data/vendor/eigen/Eigen/src/Core/EigenBase.h +159 -0
data/vendor/eigen/Eigen/src/Core/ForceAlignedAccess.h +146 -0
data/vendor/eigen/Eigen/src/Core/Fuzzy.h +155 -0
data/vendor/eigen/Eigen/src/Core/GeneralProduct.h +455 -0
data/vendor/eigen/Eigen/src/Core/GenericPacketMath.h +593 -0
data/vendor/eigen/Eigen/src/Core/GlobalFunctions.h +187 -0
data/vendor/eigen/Eigen/src/Core/IO.h +225 -0
data/vendor/eigen/Eigen/src/Core/Inverse.h +118 -0
data/vendor/eigen/Eigen/src/Core/Map.h +171 -0
data/vendor/eigen/Eigen/src/Core/MapBase.h +303 -0
data/vendor/eigen/Eigen/src/Core/MathFunctions.h +1415 -0
data/vendor/eigen/Eigen/src/Core/MathFunctionsImpl.h +101 -0
data/vendor/eigen/Eigen/src/Core/Matrix.h +459 -0
data/vendor/eigen/Eigen/src/Core/MatrixBase.h +529 -0
data/vendor/eigen/Eigen/src/Core/NestByValue.h +110 -0
data/vendor/eigen/Eigen/src/Core/NoAlias.h +108 -0
data/vendor/eigen/Eigen/src/Core/NumTraits.h +248 -0
data/vendor/eigen/Eigen/src/Core/PermutationMatrix.h +633 -0
data/vendor/eigen/Eigen/src/Core/PlainObjectBase.h +1035 -0
data/vendor/eigen/Eigen/src/Core/Product.h +186 -0
data/vendor/eigen/Eigen/src/Core/ProductEvaluators.h +1112 -0
data/vendor/eigen/Eigen/src/Core/Random.h +182 -0
data/vendor/eigen/Eigen/src/Core/Redux.h +505 -0
data/vendor/eigen/Eigen/src/Core/Ref.h +283 -0
data/vendor/eigen/Eigen/src/Core/Replicate.h +142 -0
data/vendor/eigen/Eigen/src/Core/ReturnByValue.h +117 -0
data/vendor/eigen/Eigen/src/Core/Reverse.h +211 -0
data/vendor/eigen/Eigen/src/Core/Select.h +162 -0
data/vendor/eigen/Eigen/src/Core/SelfAdjointView.h +352 -0
data/vendor/eigen/Eigen/src/Core/SelfCwiseBinaryOp.h +47 -0
data/vendor/eigen/Eigen/src/Core/Solve.h +188 -0
data/vendor/eigen/Eigen/src/Core/SolveTriangular.h +235 -0
data/vendor/eigen/Eigen/src/Core/SolverBase.h +130 -0
data/vendor/eigen/Eigen/src/Core/StableNorm.h +221 -0
data/vendor/eigen/Eigen/src/Core/Stride.h +111 -0
data/vendor/eigen/Eigen/src/Core/Swap.h +67 -0
data/vendor/eigen/Eigen/src/Core/Transpose.h +403 -0
data/vendor/eigen/Eigen/src/Core/Transpositions.h +407 -0
data/vendor/eigen/Eigen/src/Core/TriangularMatrix.h +983 -0
data/vendor/eigen/Eigen/src/Core/VectorBlock.h +96 -0
data/vendor/eigen/Eigen/src/Core/VectorwiseOp.h +695 -0
data/vendor/eigen/Eigen/src/Core/Visitor.h +273 -0
data/vendor/eigen/Eigen/src/Core/arch/AVX/Complex.h +451 -0
data/vendor/eigen/Eigen/src/Core/arch/AVX/MathFunctions.h +439 -0
data/vendor/eigen/Eigen/src/Core/arch/AVX/PacketMath.h +637 -0
data/vendor/eigen/Eigen/src/Core/arch/AVX/TypeCasting.h +51 -0
data/vendor/eigen/Eigen/src/Core/arch/AVX512/MathFunctions.h +391 -0
data/vendor/eigen/Eigen/src/Core/arch/AVX512/PacketMath.h +1316 -0
data/vendor/eigen/Eigen/src/Core/arch/AltiVec/Complex.h +430 -0
data/vendor/eigen/Eigen/src/Core/arch/AltiVec/MathFunctions.h +322 -0
data/vendor/eigen/Eigen/src/Core/arch/AltiVec/PacketMath.h +1061 -0
data/vendor/eigen/Eigen/src/Core/arch/CUDA/Complex.h +103 -0
data/vendor/eigen/Eigen/src/Core/arch/CUDA/Half.h +674 -0
data/vendor/eigen/Eigen/src/Core/arch/CUDA/MathFunctions.h +91 -0
data/vendor/eigen/Eigen/src/Core/arch/CUDA/PacketMath.h +333 -0
data/vendor/eigen/Eigen/src/Core/arch/CUDA/PacketMathHalf.h +1124 -0
data/vendor/eigen/Eigen/src/Core/arch/CUDA/TypeCasting.h +212 -0
data/vendor/eigen/Eigen/src/Core/arch/Default/ConjHelper.h +29 -0
data/vendor/eigen/Eigen/src/Core/arch/Default/Settings.h +49 -0
data/vendor/eigen/Eigen/src/Core/arch/NEON/Complex.h +490 -0
data/vendor/eigen/Eigen/src/Core/arch/NEON/MathFunctions.h +91 -0
data/vendor/eigen/Eigen/src/Core/arch/NEON/PacketMath.h +760 -0
data/vendor/eigen/Eigen/src/Core/arch/SSE/Complex.h +471 -0
data/vendor/eigen/Eigen/src/Core/arch/SSE/MathFunctions.h +562 -0
data/vendor/eigen/Eigen/src/Core/arch/SSE/PacketMath.h +895 -0
data/vendor/eigen/Eigen/src/Core/arch/SSE/TypeCasting.h +77 -0
data/vendor/eigen/Eigen/src/Core/arch/ZVector/Complex.h +397 -0
data/vendor/eigen/Eigen/src/Core/arch/ZVector/MathFunctions.h +137 -0
data/vendor/eigen/Eigen/src/Core/arch/ZVector/PacketMath.h +945 -0
data/vendor/eigen/Eigen/src/Core/functors/AssignmentFunctors.h +168 -0
data/vendor/eigen/Eigen/src/Core/functors/BinaryFunctors.h +475 -0
data/vendor/eigen/Eigen/src/Core/functors/NullaryFunctors.h +188 -0
data/vendor/eigen/Eigen/src/Core/functors/StlFunctors.h +136 -0
data/vendor/eigen/Eigen/src/Core/functors/TernaryFunctors.h +25 -0
data/vendor/eigen/Eigen/src/Core/functors/UnaryFunctors.h +792 -0
data/vendor/eigen/Eigen/src/Core/products/GeneralBlockPanelKernel.h +2156 -0
data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrix.h +492 -0
data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular.h +311 -0
data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrixTriangular_BLAS.h +145 -0
data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixMatrix_BLAS.h +122 -0
data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixVector.h +619 -0
data/vendor/eigen/Eigen/src/Core/products/GeneralMatrixVector_BLAS.h +136 -0
data/vendor/eigen/Eigen/src/Core/products/Parallelizer.h +163 -0
data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix.h +521 -0
data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixMatrix_BLAS.h +287 -0
data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixVector.h +260 -0
data/vendor/eigen/Eigen/src/Core/products/SelfadjointMatrixVector_BLAS.h +118 -0
data/vendor/eigen/Eigen/src/Core/products/SelfadjointProduct.h +133 -0
data/vendor/eigen/Eigen/src/Core/products/SelfadjointRank2Update.h +93 -0
data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixMatrix.h +466 -0
data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixMatrix_BLAS.h +315 -0
data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixVector.h +350 -0
data/vendor/eigen/Eigen/src/Core/products/TriangularMatrixVector_BLAS.h +255 -0
data/vendor/eigen/Eigen/src/Core/products/TriangularSolverMatrix.h +335 -0
data/vendor/eigen/Eigen/src/Core/products/TriangularSolverMatrix_BLAS.h +163 -0
data/vendor/eigen/Eigen/src/Core/products/TriangularSolverVector.h +145 -0
data/vendor/eigen/Eigen/src/Core/util/BlasUtil.h +398 -0
data/vendor/eigen/Eigen/src/Core/util/Constants.h +547 -0
data/vendor/eigen/Eigen/src/Core/util/DisableStupidWarnings.h +83 -0
data/vendor/eigen/Eigen/src/Core/util/ForwardDeclarations.h +302 -0
data/vendor/eigen/Eigen/src/Core/util/MKL_support.h +130 -0
data/vendor/eigen/Eigen/src/Core/util/Macros.h +1001 -0
data/vendor/eigen/Eigen/src/Core/util/Memory.h +993 -0
data/vendor/eigen/Eigen/src/Core/util/Meta.h +534 -0
data/vendor/eigen/Eigen/src/Core/util/NonMPL2.h +3 -0
data/vendor/eigen/Eigen/src/Core/util/ReenableStupidWarnings.h +27 -0
data/vendor/eigen/Eigen/src/Core/util/StaticAssert.h +218 -0
data/vendor/eigen/Eigen/src/Core/util/XprHelper.h +821 -0
data/vendor/eigen/Eigen/src/Eigenvalues/ComplexEigenSolver.h +346 -0
data/vendor/eigen/Eigen/src/Eigenvalues/ComplexSchur.h +459 -0
data/vendor/eigen/Eigen/src/Eigenvalues/ComplexSchur_LAPACKE.h +91 -0
data/vendor/eigen/Eigen/src/Eigenvalues/EigenSolver.h +622 -0
data/vendor/eigen/Eigen/src/Eigenvalues/GeneralizedEigenSolver.h +418 -0
data/vendor/eigen/Eigen/src/Eigenvalues/GeneralizedSelfAdjointEigenSolver.h +226 -0
data/vendor/eigen/Eigen/src/Eigenvalues/HessenbergDecomposition.h +374 -0
data/vendor/eigen/Eigen/src/Eigenvalues/MatrixBaseEigenvalues.h +158 -0
data/vendor/eigen/Eigen/src/Eigenvalues/RealQZ.h +654 -0
data/vendor/eigen/Eigen/src/Eigenvalues/RealSchur.h +546 -0
data/vendor/eigen/Eigen/src/Eigenvalues/RealSchur_LAPACKE.h +77 -0
data/vendor/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h +870 -0
data/vendor/eigen/Eigen/src/Eigenvalues/SelfAdjointEigenSolver_LAPACKE.h +87 -0
data/vendor/eigen/Eigen/src/Eigenvalues/Tridiagonalization.h +556 -0
data/vendor/eigen/Eigen/src/Geometry/AlignedBox.h +392 -0
data/vendor/eigen/Eigen/src/Geometry/AngleAxis.h +247 -0
data/vendor/eigen/Eigen/src/Geometry/EulerAngles.h +114 -0
data/vendor/eigen/Eigen/src/Geometry/Homogeneous.h +497 -0
data/vendor/eigen/Eigen/src/Geometry/Hyperplane.h +282 -0
data/vendor/eigen/Eigen/src/Geometry/OrthoMethods.h +234 -0
data/vendor/eigen/Eigen/src/Geometry/ParametrizedLine.h +195 -0
data/vendor/eigen/Eigen/src/Geometry/Quaternion.h +814 -0
data/vendor/eigen/Eigen/src/Geometry/Rotation2D.h +199 -0
data/vendor/eigen/Eigen/src/Geometry/RotationBase.h +206 -0
data/vendor/eigen/Eigen/src/Geometry/Scaling.h +170 -0
data/vendor/eigen/Eigen/src/Geometry/Transform.h +1542 -0
data/vendor/eigen/Eigen/src/Geometry/Translation.h +208 -0
data/vendor/eigen/Eigen/src/Geometry/Umeyama.h +166 -0
data/vendor/eigen/Eigen/src/Geometry/arch/Geometry_SSE.h +161 -0
data/vendor/eigen/Eigen/src/Householder/BlockHouseholder.h +103 -0
data/vendor/eigen/Eigen/src/Householder/Householder.h +172 -0
data/vendor/eigen/Eigen/src/Householder/HouseholderSequence.h +470 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/BasicPreconditioners.h +226 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/BiCGSTAB.h +228 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/ConjugateGradient.h +246 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/IncompleteCholesky.h +400 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/IncompleteLUT.h +462 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/IterativeSolverBase.h +394 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/LeastSquareConjugateGradient.h +216 -0
data/vendor/eigen/Eigen/src/IterativeLinearSolvers/SolveWithGuess.h +115 -0
data/vendor/eigen/Eigen/src/Jacobi/Jacobi.h +462 -0
data/vendor/eigen/Eigen/src/LU/Determinant.h +101 -0
data/vendor/eigen/Eigen/src/LU/FullPivLU.h +891 -0
data/vendor/eigen/Eigen/src/LU/InverseImpl.h +415 -0
data/vendor/eigen/Eigen/src/LU/PartialPivLU.h +611 -0
data/vendor/eigen/Eigen/src/LU/PartialPivLU_LAPACKE.h +83 -0
data/vendor/eigen/Eigen/src/LU/arch/Inverse_SSE.h +338 -0
data/vendor/eigen/Eigen/src/MetisSupport/MetisSupport.h +137 -0
data/vendor/eigen/Eigen/src/OrderingMethods/Amd.h +445 -0
data/vendor/eigen/Eigen/src/OrderingMethods/Eigen_Colamd.h +1843 -0
data/vendor/eigen/Eigen/src/OrderingMethods/Ordering.h +157 -0
data/vendor/eigen/Eigen/src/PaStiXSupport/PaStiXSupport.h +678 -0
data/vendor/eigen/Eigen/src/PardisoSupport/PardisoSupport.h +543 -0
data/vendor/eigen/Eigen/src/QR/ColPivHouseholderQR.h +653 -0
data/vendor/eigen/Eigen/src/QR/ColPivHouseholderQR_LAPACKE.h +97 -0
data/vendor/eigen/Eigen/src/QR/CompleteOrthogonalDecomposition.h +562 -0
data/vendor/eigen/Eigen/src/QR/FullPivHouseholderQR.h +676 -0
data/vendor/eigen/Eigen/src/QR/HouseholderQR.h +409 -0
data/vendor/eigen/Eigen/src/QR/HouseholderQR_LAPACKE.h +68 -0
data/vendor/eigen/Eigen/src/SPQRSupport/SuiteSparseQRSupport.h +313 -0
data/vendor/eigen/Eigen/src/SVD/BDCSVD.h +1246 -0
data/vendor/eigen/Eigen/src/SVD/JacobiSVD.h +804 -0
data/vendor/eigen/Eigen/src/SVD/JacobiSVD_LAPACKE.h +91 -0
data/vendor/eigen/Eigen/src/SVD/SVDBase.h +315 -0
data/vendor/eigen/Eigen/src/SVD/UpperBidiagonalization.h +414 -0
data/vendor/eigen/Eigen/src/SparseCholesky/SimplicialCholesky.h +689 -0
data/vendor/eigen/Eigen/src/SparseCholesky/SimplicialCholesky_impl.h +199 -0
data/vendor/eigen/Eigen/src/SparseCore/AmbiVector.h +377 -0
data/vendor/eigen/Eigen/src/SparseCore/CompressedStorage.h +258 -0
data/vendor/eigen/Eigen/src/SparseCore/ConservativeSparseSparseProduct.h +352 -0
data/vendor/eigen/Eigen/src/SparseCore/MappedSparseMatrix.h +67 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseAssign.h +216 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseBlock.h +603 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseColEtree.h +206 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseCompressedBase.h +341 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseCwiseBinaryOp.h +726 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseCwiseUnaryOp.h +148 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseDenseProduct.h +320 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseDiagonalProduct.h +138 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseDot.h +98 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseFuzzy.h +29 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseMap.h +305 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseMatrix.h +1403 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseMatrixBase.h +405 -0
data/vendor/eigen/Eigen/src/SparseCore/SparsePermutation.h +178 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseProduct.h +169 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseRedux.h +49 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseRef.h +397 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseSelfAdjointView.h +656 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseSolverBase.h +124 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseSparseProductWithPruning.h +198 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseTranspose.h +92 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseTriangularView.h +189 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseUtil.h +178 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseVector.h +478 -0
data/vendor/eigen/Eigen/src/SparseCore/SparseView.h +253 -0
data/vendor/eigen/Eigen/src/SparseCore/TriangularSolver.h +315 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU.h +773 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLUImpl.h +66 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_Memory.h +226 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_Structs.h +110 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_SupernodalMatrix.h +301 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_Utils.h +80 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_column_bmod.h +181 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_column_dfs.h +179 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_copy_to_ucol.h +107 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_gemm_kernel.h +280 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_heap_relax_snode.h +126 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_kernel_bmod.h +130 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_panel_bmod.h +223 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_panel_dfs.h +258 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_pivotL.h +137 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_pruneL.h +136 -0
data/vendor/eigen/Eigen/src/SparseLU/SparseLU_relax_snode.h +83 -0
data/vendor/eigen/Eigen/src/SparseQR/SparseQR.h +745 -0
data/vendor/eigen/Eigen/src/StlSupport/StdDeque.h +126 -0
data/vendor/eigen/Eigen/src/StlSupport/StdList.h +106 -0
data/vendor/eigen/Eigen/src/StlSupport/StdVector.h +131 -0
data/vendor/eigen/Eigen/src/StlSupport/details.h +84 -0
data/vendor/eigen/Eigen/src/SuperLUSupport/SuperLUSupport.h +1027 -0
data/vendor/eigen/Eigen/src/UmfPackSupport/UmfPackSupport.h +506 -0
data/vendor/eigen/Eigen/src/misc/Image.h +82 -0
data/vendor/eigen/Eigen/src/misc/Kernel.h +79 -0
data/vendor/eigen/Eigen/src/misc/RealSvd2x2.h +55 -0
data/vendor/eigen/Eigen/src/misc/blas.h +440 -0
data/vendor/eigen/Eigen/src/misc/lapack.h +152 -0
data/vendor/eigen/Eigen/src/misc/lapacke.h +16291 -0
data/vendor/eigen/Eigen/src/misc/lapacke_mangling.h +17 -0
data/vendor/eigen/Eigen/src/plugins/ArrayCwiseBinaryOps.h +332 -0
data/vendor/eigen/Eigen/src/plugins/ArrayCwiseUnaryOps.h +552 -0
data/vendor/eigen/Eigen/src/plugins/BlockMethods.h +1058 -0
data/vendor/eigen/Eigen/src/plugins/CommonCwiseBinaryOps.h +115 -0
data/vendor/eigen/Eigen/src/plugins/CommonCwiseUnaryOps.h +163 -0
data/vendor/eigen/Eigen/src/plugins/MatrixCwiseBinaryOps.h +152 -0
data/vendor/eigen/Eigen/src/plugins/MatrixCwiseUnaryOps.h +85 -0
data/vendor/eigen/README.md +3 -0
data/vendor/eigen/bench/README.txt +55 -0
data/vendor/eigen/bench/btl/COPYING +340 -0
data/vendor/eigen/bench/btl/README +154 -0
data/vendor/eigen/bench/tensors/README +21 -0
data/vendor/eigen/blas/README.txt +6 -0
data/vendor/eigen/demos/mandelbrot/README +10 -0
data/vendor/eigen/demos/mix_eigen_and_c/README +9 -0
data/vendor/eigen/demos/opengl/README +13 -0
data/vendor/eigen/unsupported/Eigen/CXX11/src/Tensor/README.md +1760 -0
data/vendor/eigen/unsupported/README.txt +50 -0
data/vendor/tomotopy/LICENSE +21 -0
data/vendor/tomotopy/README.kr.rst +375 -0
data/vendor/tomotopy/README.rst +382 -0
data/vendor/tomotopy/src/Labeling/FoRelevance.cpp +362 -0
data/vendor/tomotopy/src/Labeling/FoRelevance.h +88 -0
data/vendor/tomotopy/src/Labeling/Labeler.h +50 -0
data/vendor/tomotopy/src/TopicModel/CT.h +37 -0
data/vendor/tomotopy/src/TopicModel/CTModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/CTModel.hpp +293 -0
data/vendor/tomotopy/src/TopicModel/DMR.h +51 -0
data/vendor/tomotopy/src/TopicModel/DMRModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/DMRModel.hpp +374 -0
data/vendor/tomotopy/src/TopicModel/DT.h +65 -0
data/vendor/tomotopy/src/TopicModel/DTM.h +22 -0
data/vendor/tomotopy/src/TopicModel/DTModel.cpp +15 -0
data/vendor/tomotopy/src/TopicModel/DTModel.hpp +572 -0
data/vendor/tomotopy/src/TopicModel/GDMR.h +37 -0
data/vendor/tomotopy/src/TopicModel/GDMRModel.cpp +14 -0
data/vendor/tomotopy/src/TopicModel/GDMRModel.hpp +485 -0
data/vendor/tomotopy/src/TopicModel/HDP.h +74 -0
data/vendor/tomotopy/src/TopicModel/HDPModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/HDPModel.hpp +592 -0
data/vendor/tomotopy/src/TopicModel/HLDA.h +40 -0
data/vendor/tomotopy/src/TopicModel/HLDAModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/HLDAModel.hpp +681 -0
data/vendor/tomotopy/src/TopicModel/HPA.h +27 -0
data/vendor/tomotopy/src/TopicModel/HPAModel.cpp +21 -0
data/vendor/tomotopy/src/TopicModel/HPAModel.hpp +588 -0
data/vendor/tomotopy/src/TopicModel/LDA.h +144 -0
data/vendor/tomotopy/src/TopicModel/LDACVB0Model.hpp +442 -0
data/vendor/tomotopy/src/TopicModel/LDAModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/LDAModel.hpp +1058 -0
data/vendor/tomotopy/src/TopicModel/LLDA.h +45 -0
data/vendor/tomotopy/src/TopicModel/LLDAModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/LLDAModel.hpp +203 -0
data/vendor/tomotopy/src/TopicModel/MGLDA.h +63 -0
data/vendor/tomotopy/src/TopicModel/MGLDAModel.cpp +17 -0
data/vendor/tomotopy/src/TopicModel/MGLDAModel.hpp +558 -0
data/vendor/tomotopy/src/TopicModel/PA.h +43 -0
data/vendor/tomotopy/src/TopicModel/PAModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/PAModel.hpp +467 -0
data/vendor/tomotopy/src/TopicModel/PLDA.h +17 -0
data/vendor/tomotopy/src/TopicModel/PLDAModel.cpp +13 -0
data/vendor/tomotopy/src/TopicModel/PLDAModel.hpp +214 -0
data/vendor/tomotopy/src/TopicModel/SLDA.h +54 -0
data/vendor/tomotopy/src/TopicModel/SLDAModel.cpp +17 -0
data/vendor/tomotopy/src/TopicModel/SLDAModel.hpp +456 -0
data/vendor/tomotopy/src/TopicModel/TopicModel.hpp +692 -0
data/vendor/tomotopy/src/Utils/AliasMethod.hpp +169 -0
data/vendor/tomotopy/src/Utils/Dictionary.h +80 -0
data/vendor/tomotopy/src/Utils/EigenAddonOps.hpp +181 -0
data/vendor/tomotopy/src/Utils/LBFGS.h +202 -0
data/vendor/tomotopy/src/Utils/LBFGS/LineSearchBacktracking.h +120 -0
data/vendor/tomotopy/src/Utils/LBFGS/LineSearchBracketing.h +122 -0
data/vendor/tomotopy/src/Utils/LBFGS/Param.h +213 -0
data/vendor/tomotopy/src/Utils/LUT.hpp +82 -0
data/vendor/tomotopy/src/Utils/MultiNormalDistribution.hpp +69 -0
data/vendor/tomotopy/src/Utils/PolyaGamma.hpp +200 -0
data/vendor/tomotopy/src/Utils/PolyaGammaHybrid.hpp +672 -0
data/vendor/tomotopy/src/Utils/ThreadPool.hpp +150 -0
data/vendor/tomotopy/src/Utils/Trie.hpp +220 -0
data/vendor/tomotopy/src/Utils/TruncMultiNormal.hpp +94 -0
data/vendor/tomotopy/src/Utils/Utils.hpp +337 -0
data/vendor/tomotopy/src/Utils/avx_gamma.h +46 -0
data/vendor/tomotopy/src/Utils/avx_mathfun.h +736 -0
data/vendor/tomotopy/src/Utils/exception.h +28 -0
data/vendor/tomotopy/src/Utils/math.h +281 -0
data/vendor/tomotopy/src/Utils/rtnorm.hpp +2690 -0
data/vendor/tomotopy/src/Utils/sample.hpp +192 -0
data/vendor/tomotopy/src/Utils/serializer.hpp +695 -0
data/vendor/tomotopy/src/Utils/slp.hpp +131 -0
data/vendor/tomotopy/src/Utils/sse_gamma.h +48 -0
data/vendor/tomotopy/src/Utils/sse_mathfun.h +710 -0
data/vendor/tomotopy/src/Utils/text.hpp +49 -0
data/vendor/tomotopy/src/Utils/tvector.hpp +543 -0
metadata +531 -0

data/vendor/eigen/Eigen/src/Core/Product.h ADDED

@@ -0,0 +1,186 @@
+// This file is part of Eigen, a lightweight C++ template library
+// for linear algebra.
+//
+// Copyright (C) 2008-2011 Gael Guennebaud <gael.guennebaud@inria.fr>
+//
+// This Source Code Form is subject to the terms of the Mozilla
+// Public License v. 2.0. If a copy of the MPL was not distributed
+// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
+#ifndef EIGEN_PRODUCT_H
+#define EIGEN_PRODUCT_H
+namespace Eigen {
+template<typename Lhs, typename Rhs, int Option, typename StorageKind> class ProductImpl;
+namespace internal {
+template<typename Lhs, typename Rhs, int Option>
+struct traits<Product<Lhs, Rhs, Option> > // compile-time traits of a Product expression, all derived from the traits of its two operands
+{
+  typedef typename remove_all<Lhs>::type LhsCleaned; // operand types after internal remove_all
+  typedef typename remove_all<Rhs>::type RhsCleaned;
+  typedef traits<LhsCleaned> LhsTraits;
+  typedef traits<RhsCleaned> RhsTraits;
+  typedef MatrixXpr XprKind; // a product is always declared as a matrix expression here
+  typedef typename ScalarBinaryOpTraits<typename traits<LhsCleaned>::Scalar, typename traits<RhsCleaned>::Scalar>::ReturnType Scalar; // scalar type resulting from combining both operand scalars
+  typedef typename product_promote_storage_type<typename LhsTraits::StorageKind,
+                                                typename RhsTraits::StorageKind,
+                                                internal::product_type<Lhs,Rhs>::ret>::ret StorageKind; // depends on both storage kinds and on the product_type tag
+  typedef typename promote_index_type<typename LhsTraits::StorageIndex,
+                                      typename RhsTraits::StorageIndex>::type StorageIndex;
+  enum {
+    RowsAtCompileTime    = LhsTraits::RowsAtCompileTime, // row counts are taken from the left operand
+    ColsAtCompileTime    = RhsTraits::ColsAtCompileTime, // column counts are taken from the right operand
+    MaxRowsAtCompileTime = LhsTraits::MaxRowsAtCompileTime,
+    MaxColsAtCompileTime = RhsTraits::MaxColsAtCompileTime,
+    // FIXME: only needed by GeneralMatrixMatrixTriangular
+    InnerSize = EIGEN_SIZE_MIN_PREFER_FIXED(LhsTraits::ColsAtCompileTime, RhsTraits::RowsAtCompileTime), // computed from the lhs column count and the rhs row count
+    // The storage order is somewhat arbitrary here. The correct one will be determined through the evaluator.
+    Flags = (MaxRowsAtCompileTime==1 && MaxColsAtCompileTime!=1) ? RowMajorBit // at most one row but not at most one column: row-major
+          : (MaxColsAtCompileTime==1 && MaxRowsAtCompileTime!=1) ? 0 // at most one column but not at most one row: no flag set
+          : (   ((LhsTraits::Flags&NoPreferredStorageOrderBit) && (RhsTraits::Flags&RowMajorBit)) // one operand has no preferred order and the other is row-major
+             || ((RhsTraits::Flags&NoPreferredStorageOrderBit) && (LhsTraits::Flags&RowMajorBit)) ) ? RowMajorBit
+          : NoPreferredStorageOrderBit // every other case: no preferred storage order
+  };
+};
+} // end namespace internal
+/** \class Product
+  * \ingroup Core_Module
+  *
+  * \brief Expression of the product of two arbitrary matrices or vectors
+  *
+  * \tparam _Lhs the type of the left-hand side expression
+  * \tparam _Rhs the type of the right-hand side expression
+  *
+  * This class represents an expression of the product of two arbitrary matrices.
+  *
+  * The other template parameters are:
+  * \tparam Option     can be DefaultProduct, AliasFreeProduct, or LazyProduct
+  *
+  */
+template<typename _Lhs, typename _Rhs, int Option>
+class Product : public ProductImpl<_Lhs,_Rhs,Option, // the base is the ProductImpl selected by the promoted storage kind of both operands
+                                   typename internal::product_promote_storage_type<typename internal::traits<_Lhs>::StorageKind,
+                                                                                   typename internal::traits<_Rhs>::StorageKind,
+                                                                                   internal::product_type<_Lhs,_Rhs>::ret>::ret>
+{
+  public:
+    typedef _Lhs Lhs;
+    typedef _Rhs Rhs;
+    typedef typename ProductImpl< // Base is the nested Base typedef of the ProductImpl this class inherits from
+        Lhs, Rhs, Option,
+        typename internal::product_promote_storage_type<typename internal::traits<Lhs>::StorageKind,
+                                                        typename internal::traits<Rhs>::StorageKind,
+                                                        internal::product_type<Lhs,Rhs>::ret>::ret>::Base Base;
+    EIGEN_GENERIC_PUBLIC_INTERFACE(Product)
+    typedef typename internal::ref_selector<Lhs>::type LhsNested; // member types used to hold the operands, chosen by ref_selector
+    typedef typename internal::ref_selector<Rhs>::type RhsNested;
+    typedef typename internal::remove_all<LhsNested>::type LhsNestedCleaned; // types returned (by const reference) from lhs()/rhs()
+    typedef typename internal::remove_all<RhsNested>::type RhsNestedCleaned;
+    EIGEN_DEVICE_FUNC Product(const Lhs& lhs, const Rhs& rhs) : m_lhs(lhs), m_rhs(rhs) // stores both operands; no product is computed here
+    {
+      eigen_assert(lhs.cols() == rhs.rows() // inner dimensions must match
+        && "invalid matrix product" // string literals are always true; they only make the assertion text descriptive
+        && "if you wanted a coeff-wise or a dot product use the respective explicit functions");
+    }
+    EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Index rows() const { return m_lhs.rows(); } // rows of the left operand
+    EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Index cols() const { return m_rhs.cols(); } // columns of the right operand
+    EIGEN_DEVICE_FUNC const LhsNestedCleaned& lhs() const { return m_lhs; } // read-only access to the stored left operand
+    EIGEN_DEVICE_FUNC const RhsNestedCleaned& rhs() const { return m_rhs; } // read-only access to the stored right operand
+  protected:
+    LhsNested m_lhs;
+    RhsNested m_rhs;
+};
+namespace internal {
+template<typename Lhs, typename Rhs, int Option, int ProductTag = internal::product_type<Lhs,Rhs>::ret> // ProductTag defaults to the tag computed by product_type
+class dense_product_base // primary template: adds no members on top of the dense expression base
+ : public internal::dense_xpr_base<Product<Lhs,Rhs,Option> >::type
+{};
+/** Conversion to scalar for inner-products */
+template<typename Lhs, typename Rhs, int Option>
+class dense_product_base<Lhs, Rhs, Option, InnerProduct> // specialization selected when the product tag is InnerProduct
+ : public internal::dense_xpr_base<Product<Lhs,Rhs,Option> >::type
+{
+  typedef Product<Lhs,Rhs,Option> ProductXpr;
+  typedef typename internal::dense_xpr_base<ProductXpr>::type Base;
+public:
+  using Base::derived;
+  typedef typename Base::Scalar Scalar;
+  EIGEN_STRONG_INLINE operator const Scalar() const // non-explicit conversion of the product expression to its scalar type
+  {
+    return internal::evaluator<ProductXpr>(derived()).coeff(0,0); // builds an evaluator for the expression and returns coefficient (0,0)
+  }
+};
+} // namespace internal
+// Generic API dispatcher
+template<typename Lhs, typename Rhs, int Option, typename StorageKind>
+class ProductImpl : public internal::generic_xpr_base<Product<Lhs,Rhs,Option>, MatrixXpr, StorageKind>::type // generic case: inherits the expression base picked by generic_xpr_base for this StorageKind
+{
+  public:
+    typedef typename internal::generic_xpr_base<Product<Lhs,Rhs,Option>, MatrixXpr, StorageKind>::type Base; // same type as the base class; Product reads it as ProductImpl<...>::Base
+};
+template<typename Lhs, typename Rhs, int Option>
+class ProductImpl<Lhs,Rhs,Option,Dense> // specialization for the Dense storage kind; adds guarded coeff() accessors
+  : public internal::dense_product_base<Lhs,Rhs,Option>
+{
+    typedef Product<Lhs, Rhs, Option> Derived;
+  public:
+    typedef typename internal::dense_product_base<Lhs, Rhs, Option> Base;
+    EIGEN_DENSE_PUBLIC_INTERFACE(Derived)
+  protected:
+    enum {
+      IsOneByOne = (RowsAtCompileTime == 1 || RowsAtCompileTime == Dynamic) && // true when neither dimension is fixed to a size other than 1
+                   (ColsAtCompileTime == 1 || ColsAtCompileTime == Dynamic),
+      EnableCoeff = IsOneByOne || Option==LazyProduct // coeff() is allowed for possibly-1x1 products and for lazy products
+    };
+  public:
+    EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Scalar coeff(Index row, Index col) const // coefficient access by (row, col)
+    {
+      EIGEN_STATIC_ASSERT(EnableCoeff, THIS_METHOD_IS_ONLY_FOR_INNER_OR_LAZY_PRODUCTS); // compile-time rejection when EnableCoeff is false
+      eigen_assert( (Option==LazyProduct) || (this->rows() == 1 && this->cols() == 1) ); // a non-lazy product must really be 1x1 at run time
+      return internal::evaluator<Derived>(derived()).coeff(row,col); // constructs an evaluator for this expression on each call
+    }
+    EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Scalar coeff(Index i) const // coefficient access by a single index, with the same guards as above
+    {
+      EIGEN_STATIC_ASSERT(EnableCoeff, THIS_METHOD_IS_ONLY_FOR_INNER_OR_LAZY_PRODUCTS);
+      eigen_assert( (Option==LazyProduct) || (this->rows() == 1 && this->cols() == 1) );
+      return internal::evaluator<Derived>(derived()).coeff(i);
+    }
+};
+} // end namespace Eigen
+#endif // EIGEN_PRODUCT_H

data/vendor/eigen/Eigen/src/Core/ProductEvaluators.h ADDED

@@ -0,0 +1,1112 @@
+// This file is part of Eigen, a lightweight C++ template library
+// for linear algebra.
+//
+// Copyright (C) 2006-2008 Benoit Jacob <jacob.benoit.1@gmail.com>
+// Copyright (C) 2008-2010 Gael Guennebaud <gael.guennebaud@inria.fr>
+// Copyright (C) 2011 Jitse Niesen <jitse@maths.leeds.ac.uk>
+//
+// This Source Code Form is subject to the terms of the Mozilla
+// Public License v. 2.0. If a copy of the MPL was not distributed
+// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
+#ifndef EIGEN_PRODUCTEVALUATORS_H
+#define EIGEN_PRODUCTEVALUATORS_H
+namespace Eigen {
+namespace internal {
+/** \internal
+  * Evaluator of a product expression.
+  * Since products require special treatment to handle all possible cases,
+  * we simply defer the evaluation logic to a product_evaluator class
+  * which offers more partial specialization possibilities.
+  *
+  * This struct itself only forwards its constructor argument to that base class.
+  *
+  * \sa class product_evaluator
+  */
+template<typename Lhs, typename Rhs, int Options>
+struct evaluator<Product<Lhs, Rhs, Options> >
+ : public product_evaluator<Product<Lhs, Rhs, Options> >
+{
+  typedef Product<Lhs, Rhs, Options> XprType;
+  typedef product_evaluator<XprType> Base;
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE explicit evaluator(const XprType& xpr) : Base(xpr) {}
+};
+// Catch "scalar * ( A * B )" and transform it to "(A*scalar) * B"
+// TODO we should apply that rule only if that's really helpful
+template<typename Lhs, typename Rhs, typename Scalar1, typename Scalar2, typename Plain1>
+struct evaluator_assume_aliasing<CwiseBinaryOp<internal::scalar_product_op<Scalar1,Scalar2>,
+                                               const CwiseNullaryOp<internal::scalar_constant_op<Scalar1>, Plain1>,
+                                               const Product<Lhs, Rhs, DefaultProduct> > >
+{
+  static const bool value = true; // a scalar constant times a default product reports the same value as a bare default product
+};
+template<typename Lhs, typename Rhs, typename Scalar1, typename Scalar2, typename Plain1> /* Evaluator for "scalar * (A * B)".
+ * Instead of evaluating a coefficient-wise scaling of a product, it derives from
+ * the evaluator of the re-associated product "(scalar * A) * B" and builds that
+ * product expression in its constructor.
+ */
+struct evaluator<CwiseBinaryOp<internal::scalar_product_op<Scalar1,Scalar2>,
+                               const CwiseNullaryOp<internal::scalar_constant_op<Scalar1>, Plain1>,
+                               const Product<Lhs, Rhs, DefaultProduct> > >
+ : public evaluator<Product<EIGEN_SCALAR_BINARYOP_EXPR_RETURN_TYPE(Scalar1,Lhs,product), Rhs, DefaultProduct> >
+{
+  typedef CwiseBinaryOp<internal::scalar_product_op<Scalar1,Scalar2>,
+                               const CwiseNullaryOp<internal::scalar_constant_op<Scalar1>, Plain1>,
+                               const Product<Lhs, Rhs, DefaultProduct> > XprType;
+  typedef evaluator<Product<EIGEN_SCALAR_BINARYOP_EXPR_RETURN_TYPE(Scalar1,Lhs,product), Rhs, DefaultProduct> > Base;
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE explicit evaluator(const XprType& xpr)
+    : Base(xpr.lhs().functor().m_other * xpr.rhs().lhs() * xpr.rhs().rhs()) // m_other is read from the constant functor; '*' associates left, giving (scalar*A)*B
+  {}
+};
+template<typename Lhs, typename Rhs, int DiagIndex> /* Evaluator for a diagonal of a default product.
+ * It re-wraps the operands of the product in a LazyProduct and reuses the
+ * evaluator of the diagonal of that lazy product; xpr.index() is passed
+ * through unchanged.
+ */
+struct evaluator<Diagonal<const Product<Lhs, Rhs, DefaultProduct>, DiagIndex> >
+ : public evaluator<Diagonal<const Product<Lhs, Rhs, LazyProduct>, DiagIndex> >
+{
+  typedef Diagonal<const Product<Lhs, Rhs, DefaultProduct>, DiagIndex> XprType;
+  typedef evaluator<Diagonal<const Product<Lhs, Rhs, LazyProduct>, DiagIndex> > Base;
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE explicit evaluator(const XprType& xpr)
+    : Base(Diagonal<const Product<Lhs, Rhs, LazyProduct>, DiagIndex>(
+        Product<Lhs, Rhs, LazyProduct>(xpr.nestedExpression().lhs(), xpr.nestedExpression().rhs()),
+        xpr.index() ))
+  {}
+};
+// Helper class to perform a matrix product with the destination at hand.
+// Depending on the sizes of the factors, there are different evaluation strategies
+// as controlled by internal::product_type.
+template< typename Lhs, typename Rhs,
+          typename LhsShape = typename evaluator_traits<Lhs>::Shape, // defaults to the shape reported by evaluator_traits for Lhs
+          typename RhsShape = typename evaluator_traits<Rhs>::Shape, // defaults to the shape reported by evaluator_traits for Rhs
+          int ProductType = internal::product_type<Lhs,Rhs>::value> // defaults to the strategy selected by internal::product_type
+struct generic_product_impl; // declaration only; the implementations are partial specializations
+template<typename Lhs, typename Rhs> // Trait specialization for a Product carrying the DefaultProduct option
+struct evaluator_assume_aliasing<Product<Lhs, Rhs, DefaultProduct> > {
+  static const bool value = true; // only DefaultProduct is matched here; other product options are not covered by this specialization
+};
+// This is the default evaluator implementation for products:
+// It creates a temporary and calls generic_product_impl
+template<typename Lhs, typename Rhs, int Options, int ProductTag, typename LhsShape, typename RhsShape>
+struct product_evaluator<Product<Lhs, Rhs, Options>, ProductTag, LhsShape, RhsShape>
+  : public evaluator<typename Product<Lhs, Rhs, Options>::PlainObject>
+{
+  typedef Product<Lhs, Rhs, Options> XprType;
+  typedef typename XprType::PlainObject PlainObject;
+  typedef evaluator<PlainObject> Base;
+  enum {
+    Flags = Base::Flags | EvalBeforeNestingBit // flags of the plain-object evaluator, plus EvalBeforeNestingBit
+  };
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
+  explicit product_evaluator(const XprType& xpr)
+    : m_result(xpr.rows(), xpr.cols()) // temporary sized like the product; Base is not named in this initializer list
+  {
+    ::new (static_cast<Base*>(this)) Base(m_result); // construct the Base sub-object in place, now bound to m_result
+// FIXME shall we handle nested_eval here?,
+// if so, then we must take care at removing the call to nested_eval in the specializations (e.g., in permutation_matrix_product, transposition_matrix_product, etc.)
+//     typedef typename internal::nested_eval<Lhs,Rhs::ColsAtCompileTime>::type LhsNested;
+//     typedef typename internal::nested_eval<Rhs,Lhs::RowsAtCompileTime>::type RhsNested;
+//     typedef typename internal::remove_all<LhsNested>::type LhsNestedCleaned;
+//     typedef typename internal::remove_all<RhsNested>::type RhsNestedCleaned;
+//
+//     const LhsNested lhs(xpr.lhs());
+//     const RhsNested rhs(xpr.rhs());
+//
+//     generic_product_impl<LhsNestedCleaned, RhsNestedCleaned>::evalTo(m_result, lhs, rhs);
+    generic_product_impl<Lhs, Rhs, LhsShape, RhsShape, ProductTag>::evalTo(m_result, xpr.lhs(), xpr.rhs()); // the product is computed into the temporary right here, in the constructor
+  }
+protected:
+  PlainObject m_result; // owns the evaluated product that Base reads from
+};
+// The following three shortcuts are enabled only if the scalar types match exactly.
+// TODO: we could enable them for different scalar types when the product is not vectorized.
+// Dense = Product
+// Direct assignment of a default or alias-free product to a dense destination:
+// the destination is resized to the dimensions of the product when they differ,
+// then the product is evaluated straight into it.
+template< typename DstXprType, typename Lhs, typename Rhs, int Options, typename Scalar>
+struct Assignment<DstXprType, Product<Lhs,Rhs,Options>, internal::assign_op<Scalar,Scalar>, Dense2Dense,
+  typename enable_if<(Options==DefaultProduct || Options==AliasFreeProduct)>::type>
+{
+  typedef Product<Lhs,Rhs,Options> SrcXprType;
+  static EIGEN_STRONG_INLINE
+  void run(DstXprType &dst, const SrcXprType &src, const internal::assign_op<Scalar,Scalar> &)
+  {
+    const Index wantedRows = src.rows();
+    const Index wantedCols = src.cols();
+    const bool sameShape = (dst.rows()==wantedRows) && (dst.cols()==wantedCols);
+    if(!sameShape)
+    {
+      dst.resize(wantedRows, wantedCols);
+    }
+    // FIXME shall we handle nested_eval here?
+    generic_product_impl<Lhs, Rhs>::evalTo(dst, src.lhs(), src.rhs());
+  }
+};
+// Dense += Product (enabled for the DefaultProduct and AliasFreeProduct options only)
+template< typename DstXprType, typename Lhs, typename Rhs, int Options, typename Scalar>
+struct Assignment<DstXprType, Product<Lhs,Rhs,Options>, internal::add_assign_op<Scalar,Scalar>, Dense2Dense,
+  typename enable_if<(Options==DefaultProduct || Options==AliasFreeProduct)>::type>
+{
+  typedef Product<Lhs,Rhs,Options> SrcXprType;
+  static EIGEN_STRONG_INLINE
+  void run(DstXprType &dst, const SrcXprType &src, const internal::add_assign_op<Scalar,Scalar> &)
+  {
+    eigen_assert(dst.rows() == src.rows() && dst.cols() == src.cols()); // unlike plain assignment, the destination is never resized here
+    // FIXME shall we handle nested_eval here?
+    generic_product_impl<Lhs, Rhs>::addTo(dst, src.lhs(), src.rhs()); // accumulate the product into dst through the addTo entry point
+  }
+};
+// Dense -= Product (enabled for the DefaultProduct and AliasFreeProduct options only)
+template< typename DstXprType, typename Lhs, typename Rhs, int Options, typename Scalar>
+struct Assignment<DstXprType, Product<Lhs,Rhs,Options>, internal::sub_assign_op<Scalar,Scalar>, Dense2Dense,
+  typename enable_if<(Options==DefaultProduct || Options==AliasFreeProduct)>::type>
+{
+  typedef Product<Lhs,Rhs,Options> SrcXprType;
+  static EIGEN_STRONG_INLINE
+  void run(DstXprType &dst, const SrcXprType &src, const internal::sub_assign_op<Scalar,Scalar> &)
+  {
+    eigen_assert(dst.rows() == src.rows() && dst.cols() == src.cols()); // unlike plain assignment, the destination is never resized here
+    // FIXME shall we handle nested_eval here?
+    generic_product_impl<Lhs, Rhs>::subTo(dst, src.lhs(), src.rhs()); // subtract the product from dst through the subTo entry point
+  }
+};
+// Dense ?= scalar * Product
+// TODO we should apply that rule if that's really helpful
+// for instance, this is not good for inner products
+template< typename DstXprType, typename Lhs, typename Rhs, typename AssignFunc, typename Scalar, typename ScalarBis, typename Plain>
+struct Assignment<DstXprType, CwiseBinaryOp<internal::scalar_product_op<ScalarBis,Scalar>, const CwiseNullaryOp<internal::scalar_constant_op<ScalarBis>,Plain>,
+                                           const Product<Lhs,Rhs,DefaultProduct> >, AssignFunc, Dense2Dense>
+{
+  typedef CwiseBinaryOp<internal::scalar_product_op<ScalarBis,Scalar>,
+                        const CwiseNullaryOp<internal::scalar_constant_op<ScalarBis>,Plain>,
+                        const Product<Lhs,Rhs,DefaultProduct> > SrcXprType;
+  static EIGEN_STRONG_INLINE
+  void run(DstXprType &dst, const SrcXprType &src, const AssignFunc& func)
+  {
+    call_assignment_no_alias(dst, (src.lhs().functor().m_other * src.rhs().lhs())*src.rhs().rhs(), func); // re-associate as (scalar*A)*B and assign that product with the caller's functor
+  }
+};
+//----------------------------------------
+// Catch "Dense ?= xpr + Product<>" expression to save one temporary
+// FIXME we could probably enable these rules for any product, i.e., not only Dense and DefaultProduct
+template<typename OtherXpr, typename Lhs, typename Rhs>
+struct evaluator_assume_aliasing<CwiseBinaryOp<internal::scalar_sum_op<typename OtherXpr::Scalar,typename Product<Lhs,Rhs,DefaultProduct>::Scalar>, const OtherXpr,
+                                               const Product<Lhs,Rhs,DefaultProduct> >, DenseShape > {
+  static const bool value = true; // "xpr + default product" with a dense shape reports true for this trait
+};
+template<typename OtherXpr, typename Lhs, typename Rhs> // Same trait, for "xpr - default product" (scalar_difference_op instead of scalar_sum_op)
+struct evaluator_assume_aliasing<CwiseBinaryOp<internal::scalar_difference_op<typename OtherXpr::Scalar,typename Product<Lhs,Rhs,DefaultProduct>::Scalar>, const OtherXpr,
+                                               const Product<Lhs,Rhs,DefaultProduct> >, DenseShape > {
+  static const bool value = true;
+};
+template<typename DstXprType, typename OtherXpr, typename ProductType, typename Func1, typename Func2> /* Two-step assignment helper for "dst ?= other op product".
+ * run() first assigns src.lhs() to dst with a default-constructed Func1, then
+ * assigns src.rhs() to dst with a default-constructed Func2. Both steps go
+ * through call_assignment_no_alias. The functor passed by the caller is ignored.
+ */
+struct assignment_from_xpr_op_product
+{
+  template<typename SrcXprType, typename InitialFunc>
+  static EIGEN_STRONG_INLINE
+  void run(DstXprType &dst, const SrcXprType &src, const InitialFunc& /*func*/)
+  {
+    call_assignment_no_alias(dst, src.lhs(), Func1()); // step 1: the non-product operand
+    call_assignment_no_alias(dst, src.rhs(), Func2()); // step 2: the product operand, applied on top of step 1
+  }
+};
+#define EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(ASSIGN_OP,BINOP,ASSIGN_OP2) \
+  template< typename DstXprType, typename OtherXpr, typename Lhs, typename Rhs, typename DstScalar, typename SrcScalar, typename OtherScalar,typename ProdScalar> \
+  struct Assignment<DstXprType, CwiseBinaryOp<internal::BINOP<OtherScalar,ProdScalar>, const OtherXpr, \
+                                            const Product<Lhs,Rhs,DefaultProduct> >, internal::ASSIGN_OP<DstScalar,SrcScalar>, Dense2Dense> \
+    : assignment_from_xpr_op_product<DstXprType, OtherXpr, Product<Lhs,Rhs,DefaultProduct>, internal::ASSIGN_OP<DstScalar,OtherScalar>, internal::ASSIGN_OP2<DstScalar,ProdScalar> > \
+  {} // the generated Assignment inherits run() from assignment_from_xpr_op_product, with Func1 built from ASSIGN_OP and Func2 from ASSIGN_OP2
+EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(assign_op,    scalar_sum_op,add_assign_op); // dst  = xpr + prod  becomes  dst  = xpr; dst += prod
+EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(add_assign_op,scalar_sum_op,add_assign_op); // dst += xpr + prod  becomes  dst += xpr; dst += prod
+EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(sub_assign_op,scalar_sum_op,sub_assign_op); // dst -= xpr + prod  becomes  dst -= xpr; dst -= prod
+EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(assign_op,    scalar_difference_op,sub_assign_op); // dst  = xpr - prod  becomes  dst  = xpr; dst -= prod
+EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(add_assign_op,scalar_difference_op,sub_assign_op); // dst += xpr - prod  becomes  dst += xpr; dst -= prod
+EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(sub_assign_op,scalar_difference_op,add_assign_op); // dst -= xpr - prod  becomes  dst -= xpr; dst += prod
+//----------------------------------------
+// Inner product of two dense operands: the result is the single coefficient
+// dst(0,0), obtained as the sum of the coefficient-wise product of the
+// transposed lhs with rhs.
+template<typename Lhs, typename Rhs>
+struct generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,InnerProduct>
+{
+  // dst(0,0)  = lhs * rhs
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void evalTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  { dst.coeffRef(0,0) = (lhs.transpose().cwiseProduct(rhs)).sum(); }
+  // dst(0,0) += lhs * rhs
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void addTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  { dst.coeffRef(0,0) += (lhs.transpose().cwiseProduct(rhs)).sum(); }
+  // dst(0,0) -= lhs * rhs
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void subTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  { dst.coeffRef(0,0) -= (lhs.transpose().cwiseProduct(rhs)).sum(); }
+};
+/***********************************************************************
+*  Implementation of outer dense * dense vector product
+***********************************************************************/
+// Column major result: the destination is processed one column at a time;
+// for column j the functor receives dst.col(j) and rhs(0,j) * lhs.
+template<typename Dst, typename Lhs, typename Rhs, typename Func>
+void outer_product_selector_run(Dst& dst, const Lhs &lhs, const Rhs &rhs, const Func& func, const false_type&)
+{
+  evaluator<Rhs> rhsCoeffs(rhs);
+  typename nested_eval<Lhs,Rhs::SizeAtCompileTime>::type lhsVec(lhs);
+  // FIXME if cols is large enough, then it might be useful to make sure that lhs is sequentially stored
+  // FIXME not very good if rhs is real and lhs complex while alpha is real too
+  const Index colCount = dst.cols();
+  Index j = 0;
+  while (j < colCount)
+  {
+    func(dst.col(j), rhsCoeffs.coeff(Index(0),j) * lhsVec);
+    ++j;
+  }
+}
+// Row major result: the destination is processed one row at a time;
+// for row i the functor receives dst.row(i) and lhs(i,0) * rhs.
+template<typename Dst, typename Lhs, typename Rhs, typename Func>
+void outer_product_selector_run(Dst& dst, const Lhs &lhs, const Rhs &rhs, const Func& func, const true_type&)
+{
+  evaluator<Lhs> lhsCoeffs(lhs);
+  typename nested_eval<Rhs,Lhs::SizeAtCompileTime>::type rhsVec(rhs);
+  // FIXME if rows is large enough, then it might be useful to make sure that rhs is sequentially stored
+  // FIXME not very good if lhs is real and rhs complex while alpha is real too
+  const Index rowCount = dst.rows();
+  Index i = 0;
+  while (i < rowCount)
+  {
+    func(dst.row(i), lhsCoeffs.coeff(i,Index(0)) * rhsVec);
+    ++i;
+  }
+}
+template<typename Lhs, typename Rhs> // Outer product of dense operands: every entry point delegates to outer_product_selector_run with a small update functor
+struct generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,OuterProduct>
+{
+  template<typename T> struct is_row_major : internal::conditional<(int(T::Flags)&RowMajorBit), internal::true_type, internal::false_type>::type {}; // true_type when T::Flags has RowMajorBit set; used as the overload tag
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  // TODO it would be nice to be able to exploit our *_assign_op functors for that purpose
+  struct set  { template<typename Dst, typename Src> void operator()(const Dst& dst, const Src& src) const { dst.const_cast_derived()  = src; } }; // dst  = src; dst arrives by const reference (e.g. dst.col(j)) and is written through const_cast_derived()
+  struct add  { template<typename Dst, typename Src> void operator()(const Dst& dst, const Src& src) const { dst.const_cast_derived() += src; } }; // dst += src
+  struct sub  { template<typename Dst, typename Src> void operator()(const Dst& dst, const Src& src) const { dst.const_cast_derived() -= src; } }; // dst -= src
+  struct adds { // dst += m_scale * src
+    Scalar m_scale;
+    explicit adds(const Scalar& s) : m_scale(s) {}
+    template<typename Dst, typename Src> void operator()(const Dst& dst, const Src& src) const {
+      dst.const_cast_derived() += m_scale * src;
+    }
+  };
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void evalTo(Dst& dst, const Lhs& lhs, const Rhs& rhs) // dst = lhs * rhs
+  {
+    internal::outer_product_selector_run(dst, lhs, rhs, set(), is_row_major<Dst>());
+  }
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void addTo(Dst& dst, const Lhs& lhs, const Rhs& rhs) // dst += lhs * rhs
+  {
+    internal::outer_product_selector_run(dst, lhs, rhs, add(), is_row_major<Dst>());
+  }
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void subTo(Dst& dst, const Lhs& lhs, const Rhs& rhs) // dst -= lhs * rhs
+  {
+    internal::outer_product_selector_run(dst, lhs, rhs, sub(), is_row_major<Dst>());
+  }
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void scaleAndAddTo(Dst& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha) // dst += alpha * lhs * rhs
+  {
+    internal::outer_product_selector_run(dst, lhs, rhs, adds(alpha), is_row_major<Dst>());
+  }
+};
+// This base class provides default implementations for evalTo, addTo, subTo, in terms of scaleAndAddTo
+template<typename Lhs, typename Rhs, typename Derived>
+struct generic_product_impl_base
+{
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void evalTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  { dst.setZero(); scaleAndAddTo(dst, lhs, rhs, Scalar(1)); } // zero the destination first, then accumulate with alpha = 1
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void addTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  { scaleAndAddTo(dst,lhs, rhs, Scalar(1)); } // accumulate with alpha = 1
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void subTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  { scaleAndAddTo(dst, lhs, rhs, Scalar(-1)); } // accumulate with alpha = -1
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void scaleAndAddTo(Dst& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha)
+  { Derived::scaleAndAddTo(dst,lhs,rhs,alpha); } // static dispatch to the implementation supplied by Derived
+};
+template<typename Lhs, typename Rhs> /* Dense product handled by the GemvProduct strategy.
+ * Only scaleAndAddTo is defined here; evalTo, addTo and subTo come from
+ * generic_product_impl_base.
+ */
+struct generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,GemvProduct>
+  : generic_product_impl_base<Lhs,Rhs,generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,GemvProduct> >
+{
+  typedef typename nested_eval<Lhs,1>::type LhsNested;
+  typedef typename nested_eval<Rhs,1>::type RhsNested;
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  enum { Side = Lhs::IsVectorAtCompileTime ? OnTheLeft : OnTheRight }; // OnTheLeft when Lhs is a compile-time vector, OnTheRight otherwise
+  typedef typename internal::remove_all<typename internal::conditional<int(Side)==OnTheRight,LhsNested,RhsNested>::type>::type MatrixType; // cleaned nested type of Lhs when Side is OnTheRight, of Rhs otherwise
+  template<typename Dest>
+  static EIGEN_STRONG_INLINE void scaleAndAddTo(Dest& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha)
+  {
+    LhsNested actual_lhs(lhs);
+    RhsNested actual_rhs(rhs);
+    internal::gemv_dense_selector<Side,
+                            (int(MatrixType::Flags)&RowMajorBit) ? RowMajor : ColMajor,
+                            bool(internal::blas_traits<MatrixType>::HasUsableDirectAccess)
+                           >::run(actual_lhs, actual_rhs, dst, alpha); // kernel chosen from the side, the storage order of MatrixType and whether it offers usable direct access
+  }
+};
+template<typename Lhs, typename Rhs> /* Dense product evaluated coefficient by coefficient.
+ * Each entry point assigns lhs.lazyProduct(rhs) to dst through
+ * call_assignment_no_alias with the matching assignment functor.
+ * No scaleAndAddTo is provided (it is commented out below).
+ */
+struct generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,CoeffBasedProductMode>
+{
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void evalTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  {
+    // Same as: dst.noalias() = lhs.lazyProduct(rhs);
+    // but easier on the compiler side
+    call_assignment_no_alias(dst, lhs.lazyProduct(rhs), internal::assign_op<typename Dst::Scalar,Scalar>());
+  }
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void addTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  {
+    // dst.noalias() += lhs.lazyProduct(rhs);
+    call_assignment_no_alias(dst, lhs.lazyProduct(rhs), internal::add_assign_op<typename Dst::Scalar,Scalar>());
+  }
+  template<typename Dst>
+  static EIGEN_STRONG_INLINE void subTo(Dst& dst, const Lhs& lhs, const Rhs& rhs)
+  {
+    // dst.noalias() -= lhs.lazyProduct(rhs);
+    call_assignment_no_alias(dst, lhs.lazyProduct(rhs), internal::sub_assign_op<typename Dst::Scalar,Scalar>());
+  }
+//   template<typename Dst>
+//   static inline void scaleAndAddTo(Dst& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha)
+//   { dst.noalias() += alpha * lhs.lazyProduct(rhs); }
+};
+// This specialization enforces the use of a coefficient-based evaluation strategy
+template<typename Lhs, typename Rhs>
+struct generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,LazyCoeffBasedProductMode>
+  : generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,CoeffBasedProductMode> {}; // no members of its own: everything is inherited from the CoeffBasedProductMode implementation
+// Case 2: Evaluate coeff by coeff
+//
+// This is mostly taken from CoeffBasedProduct.h
+// The main difference is that we add an extra argument to the etor_product_*_impl::run() function
+// for the inner dimension of the product, because evaluator objects do not know their size.
+template<int Traversal, int UnrollingIndex, typename Lhs, typename Rhs, typename RetScalar>
+struct etor_product_coeff_impl; // declaration only
+template<int StorageOrder, int UnrollingIndex, typename Lhs, typename Rhs, typename Packet, int LoadMode>
+struct etor_product_packet_impl; // declaration only; specialized on storage order and unrolling index
+template<typename Lhs, typename Rhs, int ProductTag> /* Evaluator of a lazy dense * dense product.
+ * No temporary holding the result is created: coeff() computes one coefficient
+ * per call from the nested operands, and packet() computes one packet per call
+ * through etor_product_packet_impl. The enums below derive the cost estimate,
+ * the flags and the alignment advertised for the product.
+ */
+struct product_evaluator<Product<Lhs, Rhs, LazyProduct>, ProductTag, DenseShape, DenseShape>
+    : evaluator_base<Product<Lhs, Rhs, LazyProduct> >
+{
+  typedef Product<Lhs, Rhs, LazyProduct> XprType;
+  typedef typename XprType::Scalar Scalar;
+  typedef typename XprType::CoeffReturnType CoeffReturnType;
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
+  explicit product_evaluator(const XprType& xpr)
+    : m_lhs(xpr.lhs()),
+      m_rhs(xpr.rhs()),
+      m_lhsImpl(m_lhs),     // FIXME the creation of the evaluator objects should result in a no-op, but check that!
+      m_rhsImpl(m_rhs),     //       Moreover, they are only useful for the packet path, so we could completely disable them when not needed,
+                            //       or perhaps declare them on the fly on the packet method... We have to experiment to check what's best.
+      m_innerDim(xpr.lhs().cols()) // run-time inner dimension, taken from the column count of the lhs
+  {
+    EIGEN_INTERNAL_CHECK_COST_VALUE(NumTraits<Scalar>::MulCost);
+    EIGEN_INTERNAL_CHECK_COST_VALUE(NumTraits<Scalar>::AddCost);
+    EIGEN_INTERNAL_CHECK_COST_VALUE(CoeffReadCost);
+#if 0
+    std::cerr << "LhsOuterStrideBytes=  " << LhsOuterStrideBytes << "\n";
+    std::cerr << "RhsOuterStrideBytes=  " << RhsOuterStrideBytes << "\n";
+    std::cerr << "LhsAlignment=         " << LhsAlignment << "\n";
+    std::cerr << "RhsAlignment=         " << RhsAlignment << "\n";
+    std::cerr << "CanVectorizeLhs=      " << CanVectorizeLhs << "\n";
+    std::cerr << "CanVectorizeRhs=      " << CanVectorizeRhs << "\n";
+    std::cerr << "CanVectorizeInner=    " << CanVectorizeInner << "\n";
+    std::cerr << "EvalToRowMajor=       " << EvalToRowMajor << "\n";
+    std::cerr << "Alignment=            " << Alignment << "\n";
+    std::cerr << "Flags=                " << Flags << "\n";
+#endif
+  }
+  // Everything below here is taken from CoeffBasedProduct.h
+  typedef typename internal::nested_eval<Lhs,Rhs::ColsAtCompileTime>::type LhsNested;
+  typedef typename internal::nested_eval<Rhs,Lhs::RowsAtCompileTime>::type RhsNested;
+  typedef typename internal::remove_all<LhsNested>::type LhsNestedCleaned;
+  typedef typename internal::remove_all<RhsNested>::type RhsNestedCleaned;
+  typedef evaluator<LhsNestedCleaned> LhsEtorType;
+  typedef evaluator<RhsNestedCleaned> RhsEtorType;
+  enum {
+    RowsAtCompileTime = LhsNestedCleaned::RowsAtCompileTime,
+    ColsAtCompileTime = RhsNestedCleaned::ColsAtCompileTime,
+    InnerSize = EIGEN_SIZE_MIN_PREFER_FIXED(LhsNestedCleaned::ColsAtCompileTime, RhsNestedCleaned::RowsAtCompileTime),
+    MaxRowsAtCompileTime = LhsNestedCleaned::MaxRowsAtCompileTime,
+    MaxColsAtCompileTime = RhsNestedCleaned::MaxColsAtCompileTime
+  };
+  typedef typename find_best_packet<Scalar,RowsAtCompileTime>::type LhsVecPacketType;
+  typedef typename find_best_packet<Scalar,ColsAtCompileTime>::type RhsVecPacketType;
+  enum {
+    LhsCoeffReadCost = LhsEtorType::CoeffReadCost,
+    RhsCoeffReadCost = RhsEtorType::CoeffReadCost,
+    CoeffReadCost = InnerSize==0 ? NumTraits<Scalar>::ReadCost
+                  : InnerSize == Dynamic ? HugeCost
+                  : InnerSize * (NumTraits<Scalar>::MulCost + LhsCoeffReadCost + RhsCoeffReadCost)
+                    + (InnerSize - 1) * NumTraits<Scalar>::AddCost, // InnerSize multiplications with their two reads, plus InnerSize-1 additions
+    Unroll = CoeffReadCost <= EIGEN_UNROLLING_LIMIT, // consumed by packet() to pick the unrolled or the run-time loop implementation
+    LhsFlags = LhsEtorType::Flags,
+    RhsFlags = RhsEtorType::Flags,
+    LhsRowMajor = LhsFlags & RowMajorBit,
+    RhsRowMajor = RhsFlags & RowMajorBit,
+    LhsVecPacketSize = unpacket_traits<LhsVecPacketType>::size,
+    RhsVecPacketSize = unpacket_traits<RhsVecPacketType>::size,
+    // Here, we don't care about alignment larger than the usable packet size.
+    LhsAlignment = EIGEN_PLAIN_ENUM_MIN(LhsEtorType::Alignment,LhsVecPacketSize*int(sizeof(typename LhsNestedCleaned::Scalar))),
+    RhsAlignment = EIGEN_PLAIN_ENUM_MIN(RhsEtorType::Alignment,RhsVecPacketSize*int(sizeof(typename RhsNestedCleaned::Scalar))),
+    SameType = is_same<typename LhsNestedCleaned::Scalar,typename RhsNestedCleaned::Scalar>::value,
+    CanVectorizeRhs = bool(RhsRowMajor) && (RhsFlags & PacketAccessBit) && (ColsAtCompileTime!=1),
+    CanVectorizeLhs = (!LhsRowMajor) && (LhsFlags & PacketAccessBit) && (RowsAtCompileTime!=1),
+    EvalToRowMajor = (MaxRowsAtCompileTime==1&&MaxColsAtCompileTime!=1) ? 1
+                    : (MaxColsAtCompileTime==1&&MaxRowsAtCompileTime!=1) ? 0
+                    : (bool(RhsRowMajor) && !CanVectorizeLhs), // row vector -> row-major, column vector -> column-major, otherwise decided by the operands
+    Flags = ((unsigned int)(LhsFlags | RhsFlags) & HereditaryBits & ~RowMajorBit)
+          | (EvalToRowMajor ? RowMajorBit : 0)
+          // TODO enable vectorization for mixed types
+          | (SameType && (CanVectorizeLhs || CanVectorizeRhs) ? PacketAccessBit : 0)
+          | (XprType::IsVectorAtCompileTime ? LinearAccessBit : 0),
+    LhsOuterStrideBytes = int(LhsNestedCleaned::OuterStrideAtCompileTime) * int(sizeof(typename LhsNestedCleaned::Scalar)),
+    RhsOuterStrideBytes = int(RhsNestedCleaned::OuterStrideAtCompileTime) * int(sizeof(typename RhsNestedCleaned::Scalar)),
+    Alignment = bool(CanVectorizeLhs) ? (LhsOuterStrideBytes<=0 || (int(LhsOuterStrideBytes) % EIGEN_PLAIN_ENUM_MAX(1,LhsAlignment))!=0 ? 0 : LhsAlignment)
+              : bool(CanVectorizeRhs) ? (RhsOuterStrideBytes<=0 || (int(RhsOuterStrideBytes) % EIGEN_PLAIN_ENUM_MAX(1,RhsAlignment))!=0 ? 0 : RhsAlignment)
+              : 0, // 0 unless the outer stride in bytes is positive and a multiple of the operand alignment
+    /* CanVectorizeInner deserves special explanation. It does not affect the product flags. It is not used outside
+     * of Product. If the Product itself is not a packet-access expression, there is still a chance that the inner
+     * loop of the product might be vectorized. This is the meaning of CanVectorizeInner. Since it doesn't affect
+     * the Flags, it is safe to make this value depend on ActualPacketAccessBit, that doesn't affect the ABI.
+     */
+    CanVectorizeInner =    SameType
+                        && LhsRowMajor
+                        && (!RhsRowMajor)
+                        && (LhsFlags & RhsFlags & ActualPacketAccessBit)
+                        && (InnerSize % packet_traits<Scalar>::size == 0)
+  };
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const CoeffReturnType coeff(Index row, Index col) const // one coefficient: sum of the coefficient-wise product of lhs row 'row' (transposed) and rhs column 'col'
+  {
+    return (m_lhs.row(row).transpose().cwiseProduct( m_rhs.col(col) )).sum(); // reads the nested operands directly, not m_lhsImpl / m_rhsImpl
+  }
+  /* Allow index-based non-packet access. It is impossible though to allow index-based packed access,
+   * which is why we don't set the LinearAccessBit.
+   * TODO: this seems possible when the result is a vector
+   * NOTE(review): the Flags enum above does set LinearAccessBit when XprType::IsVectorAtCompileTime,
+   * and an index-based packet(Index) overload exists below, so this remark looks stale -- confirm.
+   */
+  EIGEN_DEVICE_FUNC const CoeffReturnType coeff(Index index) const
+  {
+    const Index row = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? 0 : index; // row vector result: the index runs along the columns
+    const Index col = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? index : 0; // otherwise the index runs along the rows
+    return (m_lhs.row(row).transpose().cwiseProduct( m_rhs.col(col) )).sum();
+  }
+  template<int LoadMode, typename PacketType>
+  const PacketType packet(Index row, Index col) const // one packet of the result starting at (row,col)
+  {
+    PacketType res;
+    typedef etor_product_packet_impl<bool(int(Flags)&RowMajorBit) ? RowMajor : ColMajor,
+                                     Unroll ? int(InnerSize) : Dynamic,
+                                     LhsEtorType, RhsEtorType, PacketType, LoadMode> PacketImpl; // compile-time unrolled when Unroll holds, run-time loop otherwise
+    PacketImpl::run(row, col, m_lhsImpl, m_rhsImpl, m_innerDim, res);
+    return res;
+  }
+  template<int LoadMode, typename PacketType>
+  const PacketType packet(Index index) const // linear-index variant, mapped to (row,col) the same way as coeff(Index)
+  {
+    const Index row = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? 0 : index;
+    const Index col = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? index : 0;
+    return packet<LoadMode,PacketType>(row,col);
+  }
+protected:
+  typename internal::add_const_on_value_type<LhsNested>::type m_lhs; // nested operands, read by coeff()
+  typename internal::add_const_on_value_type<RhsNested>::type m_rhs;
+  LhsEtorType m_lhsImpl; // evaluators built on the nested operands, read by packet()
+  RhsEtorType m_rhsImpl;
+  // TODO: Get rid of m_innerDim if known at compile time
+  Index m_innerDim;
+};
+template<typename Lhs, typename Rhs> /* Evaluator of a default product tagged LazyCoeffBasedProductMode.
+ * It reuses the lazy-product evaluator by rebuilding the expression as a
+ * LazyProduct of the same operands, and adds EvalBeforeNestingBit to the flags.
+ */
+struct product_evaluator<Product<Lhs, Rhs, DefaultProduct>, LazyCoeffBasedProductMode, DenseShape, DenseShape>
+  : product_evaluator<Product<Lhs, Rhs, LazyProduct>, CoeffBasedProductMode, DenseShape, DenseShape>
+{
+  typedef Product<Lhs, Rhs, DefaultProduct> XprType;
+  typedef Product<Lhs, Rhs, LazyProduct> BaseProduct;
+  typedef product_evaluator<BaseProduct, CoeffBasedProductMode, DenseShape, DenseShape> Base;
+  enum {
+    Flags = Base::Flags | EvalBeforeNestingBit
+  };
+  EIGEN_DEVICE_FUNC explicit product_evaluator(const XprType& xpr)
+    : Base(BaseProduct(xpr.lhs(),xpr.rhs())) // the base is constructed from a temporary LazyProduct over the same operands
+  {}
+};
+/****************************************
+*** Coeff based product, Packet path  ***
+****************************************/
+template<int UnrollingIndex, typename Lhs, typename Rhs, typename Packet, int LoadMode> /* Row-major result, compile-time unrolled.
+ * Recurses on UnrollingIndex-1 first, then folds inner term number UnrollingIndex-1
+ * into res with pmadd: the lhs coefficient is broadcast with pset1 and combined with
+ * a packet read from rhs. The recursion stops at the specialization for index 1.
+ */
+struct etor_product_packet_impl<RowMajor, UnrollingIndex, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index row, Index col, const Lhs& lhs, const Rhs& rhs, Index innerDim, Packet &res)
+  {
+    etor_product_packet_impl<RowMajor, UnrollingIndex-1, Lhs, Rhs, Packet, LoadMode>::run(row, col, lhs, rhs, innerDim, res);
+    res =  pmadd(pset1<Packet>(lhs.coeff(row, Index(UnrollingIndex-1))), rhs.template packet<LoadMode,Packet>(Index(UnrollingIndex-1), col), res);
+  }
+};
+template<int UnrollingIndex, typename Lhs, typename Rhs, typename Packet, int LoadMode> /* Column-major result, compile-time unrolled.
+ * Same recursion as the row-major version, with the roles swapped: the packet is
+ * read from lhs and the rhs coefficient is broadcast with pset1.
+ */
+struct etor_product_packet_impl<ColMajor, UnrollingIndex, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index row, Index col, const Lhs& lhs, const Rhs& rhs, Index innerDim, Packet &res)
+  {
+    etor_product_packet_impl<ColMajor, UnrollingIndex-1, Lhs, Rhs, Packet, LoadMode>::run(row, col, lhs, rhs, innerDim, res);
+    res =  pmadd(lhs.template packet<LoadMode,Packet>(row, Index(UnrollingIndex-1)), pset1<Packet>(rhs.coeff(Index(UnrollingIndex-1), col)), res);
+  }
+};
+template<typename Lhs, typename Rhs, typename Packet, int LoadMode> // Row-major result, unrolling index 1: end of the recursion, res is overwritten with the first inner term (pmul, no accumulation)
+struct etor_product_packet_impl<RowMajor, 1, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index row, Index col, const Lhs& lhs, const Rhs& rhs, Index /*innerDim*/, Packet &res)
+  {
+    res = pmul(pset1<Packet>(lhs.coeff(row, Index(0))),rhs.template packet<LoadMode,Packet>(Index(0), col));
+  }
+};
+template<typename Lhs, typename Rhs, typename Packet, int LoadMode> // Column-major result, unrolling index 1: end of the recursion, res is overwritten with the first inner term (pmul, no accumulation)
+struct etor_product_packet_impl<ColMajor, 1, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index row, Index col, const Lhs& lhs, const Rhs& rhs, Index /*innerDim*/, Packet &res)
+  {
+    res = pmul(lhs.template packet<LoadMode,Packet>(row, Index(0)), pset1<Packet>(rhs.coeff(Index(0), col)));
+  }
+};
+template<typename Lhs, typename Rhs, typename Packet, int LoadMode> // Row-major result, unrolling index 0: no inner term, so res is a packet filled with zeros and no operand is read
+struct etor_product_packet_impl<RowMajor, 0, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index /*row*/, Index /*col*/, const Lhs& /*lhs*/, const Rhs& /*rhs*/, Index /*innerDim*/, Packet &res)
+  {
+    res = pset1<Packet>(typename unpacket_traits<Packet>::type(0));
+  }
+};
+template<typename Lhs, typename Rhs, typename Packet, int LoadMode> // Column-major result, unrolling index 0: no inner term, so res is a packet filled with zeros and no operand is read
+struct etor_product_packet_impl<ColMajor, 0, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index /*row*/, Index /*col*/, const Lhs& /*lhs*/, const Rhs& /*rhs*/, Index /*innerDim*/, Packet &res)
+  {
+    res = pset1<Packet>(typename unpacket_traits<Packet>::type(0));
+  }
+};
+// Row-major result, inner dimension only known at run time: start from a zero
+// packet and fold in one term per inner index, in increasing index order.
+template<typename Lhs, typename Rhs, typename Packet, int LoadMode>
+struct etor_product_packet_impl<RowMajor, Dynamic, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index row, Index col, const Lhs& lhs, const Rhs& rhs, Index innerDim, Packet& res)
+  {
+    typedef typename unpacket_traits<Packet>::type PacketScalar;
+    res = pset1<Packet>(PacketScalar(0));
+    Index k = 0;
+    while(k < innerDim)
+    {
+      res = pmadd(pset1<Packet>(lhs.coeff(row, k)), rhs.template packet<LoadMode,Packet>(k, col), res);
+      ++k;
+    }
+  }
+};
+/** \internal
+  * Specialization for ColMajor with a Dynamic second template argument.
+  * Starting from a zero packet, accumulates with pmadd, for every i in [0, innerDim),
+  * the lhs packet loaded at (row, i) times the broadcast rhs coefficient (i, col).
+  */
+template<typename Lhs, typename Rhs, typename Packet, int LoadMode>
+struct etor_product_packet_impl<ColMajor, Dynamic, Lhs, Rhs, Packet, LoadMode>
+{
+  static EIGEN_STRONG_INLINE void run(Index row, Index col, const Lhs& lhs, const Rhs& rhs, Index innerDim, Packet& res)
+  {
+    typedef typename unpacket_traits<Packet>::type PacketScalar;
+    Packet acc = pset1<Packet>(PacketScalar(0));
+    for(Index k = 0; k < innerDim; ++k)
+    {
+      const Packet lhsPacket = lhs.template packet<LoadMode,Packet>(row, k);
+      const Packet rhsBroadcast = pset1<Packet>(rhs.coeff(k, col));
+      acc = pmadd(lhsPacket, rhsBroadcast, acc);
+    }
+    res = acc;
+  }
+};
+/***************************************************************************
+* Triangular products
+***************************************************************************/
+// Forward declaration only: the triangular product kernel is defined elsewhere.
+// It is used below through its static run(dst, lhs, rhs, alpha) entry point.
+template<int Mode, bool LhsIsTriangular,
+         typename Lhs, bool LhsIsVector,
+         typename Rhs, bool RhsIsVector>
+struct triangular_product_impl;
+/** \internal
+  * Product dispatcher for a TriangularShape lhs and a DenseShape rhs.
+  * scaleAndAddTo() forwards \a dst, the expression nested in \a lhs, \a rhs and \a alpha
+  * to triangular_product_impl, flagging the lhs as the triangular operand.
+  */
+template<typename Lhs, typename Rhs, int ProductTag>
+struct generic_product_impl<Lhs,Rhs,TriangularShape,DenseShape,ProductTag>
+  : generic_product_impl_base<Lhs,Rhs,generic_product_impl<Lhs,Rhs,TriangularShape,DenseShape,ProductTag> >
+{
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  template<typename Dest>
+  static void scaleAndAddTo(Dest& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha)
+  {
+    // The rhs is treated as a vector when it has exactly one column at compile time.
+    typedef triangular_product_impl<Lhs::Mode, true,
+                                    typename Lhs::MatrixType, false,
+                                    Rhs, Rhs::ColsAtCompileTime==1> Kernel;
+    Kernel::run(dst, lhs.nestedExpression(), rhs, alpha);
+  }
+};
+/** \internal
+  * Product dispatcher for a DenseShape lhs and a TriangularShape rhs.
+  * scaleAndAddTo() forwards \a dst, \a lhs, the expression nested in \a rhs and \a alpha
+  * to triangular_product_impl, flagging the rhs as the triangular operand.
+  */
+template<typename Lhs, typename Rhs, int ProductTag>
+struct generic_product_impl<Lhs,Rhs,DenseShape,TriangularShape,ProductTag>
+: generic_product_impl_base<Lhs,Rhs,generic_product_impl<Lhs,Rhs,DenseShape,TriangularShape,ProductTag> >
+{
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  template<typename Dest>
+  static void scaleAndAddTo(Dest& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha)
+  {
+    // The lhs is treated as a vector when it has exactly one row at compile time.
+    typedef triangular_product_impl<Rhs::Mode, false,
+                                    Lhs, Lhs::RowsAtCompileTime==1,
+                                    typename Rhs::MatrixType, false> Kernel;
+    Kernel::run(dst, lhs, rhs.nestedExpression(), alpha);
+  }
+};
+/***************************************************************************
+* SelfAdjoint products
+***************************************************************************/
+// Forward declaration only: the self-adjoint product kernel is defined elsewhere.
+// It is used below through its static run(dst, lhs, rhs, alpha) entry point.
+template <typename Lhs, int LhsMode, bool LhsIsVector,
+          typename Rhs, int RhsMode, bool RhsIsVector>
+struct selfadjoint_product_impl;
+/** \internal
+  * Product dispatcher for a SelfAdjointShape lhs and a DenseShape rhs.
+  * scaleAndAddTo() forwards \a dst, the expression nested in \a lhs, \a rhs and \a alpha
+  * to selfadjoint_product_impl, passing Lhs::Mode for the lhs and mode 0 for the rhs.
+  */
+template<typename Lhs, typename Rhs, int ProductTag>
+struct generic_product_impl<Lhs,Rhs,SelfAdjointShape,DenseShape,ProductTag>
+  : generic_product_impl_base<Lhs,Rhs,generic_product_impl<Lhs,Rhs,SelfAdjointShape,DenseShape,ProductTag> >
+{
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  template<typename Dest>
+  static void scaleAndAddTo(Dest& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha)
+  {
+    typedef selfadjoint_product_impl<typename Lhs::MatrixType, Lhs::Mode, false,
+                                     Rhs, 0, Rhs::IsVectorAtCompileTime> Kernel;
+    Kernel::run(dst, lhs.nestedExpression(), rhs, alpha);
+  }
+};
+/** \internal
+  * Product dispatcher for a DenseShape lhs and a SelfAdjointShape rhs.
+  * scaleAndAddTo() forwards \a dst, \a lhs, the expression nested in \a rhs and \a alpha
+  * to selfadjoint_product_impl, passing mode 0 for the lhs and Rhs::Mode for the rhs.
+  */
+template<typename Lhs, typename Rhs, int ProductTag>
+struct generic_product_impl<Lhs,Rhs,DenseShape,SelfAdjointShape,ProductTag>
+: generic_product_impl_base<Lhs,Rhs,generic_product_impl<Lhs,Rhs,DenseShape,SelfAdjointShape,ProductTag> >
+{
+  typedef typename Product<Lhs,Rhs>::Scalar Scalar;
+  template<typename Dest>
+  static void scaleAndAddTo(Dest& dst, const Lhs& lhs, const Rhs& rhs, const Scalar& alpha)
+  {
+    typedef selfadjoint_product_impl<Lhs, 0, Lhs::IsVectorAtCompileTime,
+                                     typename Rhs::MatrixType, Rhs::Mode, false> Kernel;
+    Kernel::run(dst, lhs, rhs.nestedExpression(), alpha);
+  }
+};
+/***************************************************************************
+* Diagonal products
+***************************************************************************/
+/** \internal
+  * Common base of the evaluators for "diagonal * dense" and "dense * diagonal" products.
+  * It owns one evaluator for the dense operand (m_matImpl) and one for the diagonal
+  * coefficients (m_diagImpl), and provides the linear coeff(Index) accessor plus the two
+  * packet_impl() helpers the derived evaluators dispatch to.
+  *
+  * \tparam MatrixType   type of the dense operand
+  * \tparam DiagonalType type of the vector holding the diagonal coefficients
+  * \tparam Derived      type forwarded to evaluator_base
+  * \tparam ProductOrder compared against OnTheLeft / OnTheRight below
+  */
+template<typename MatrixType, typename DiagonalType, typename Derived, int ProductOrder>
+struct diagonal_product_evaluator_base
+  : evaluator_base<Derived>
+{
+   typedef typename ScalarBinaryOpTraits<typename MatrixType::Scalar, typename DiagonalType::Scalar>::ReturnType Scalar;
+public:
+  enum {
+    // One multiplication plus one read from each operand.
+    CoeffReadCost = NumTraits<Scalar>::MulCost + evaluator<MatrixType>::CoeffReadCost + evaluator<DiagonalType>::CoeffReadCost,
+    MatrixFlags = evaluator<MatrixType>::Flags,
+    DiagFlags = evaluator<DiagonalType>::Flags,
+    _StorageOrder = MatrixFlags & RowMajorBit ? RowMajor : ColMajor,
+    // False exactly for (ColMajor, OnTheLeft) and (RowMajor, OnTheRight); true otherwise.
+    _ScalarAccessOnDiag =  !((int(_StorageOrder) == ColMajor && int(ProductOrder) == OnTheLeft)
+                           ||(int(_StorageOrder) == RowMajor && int(ProductOrder) == OnTheRight)),
+    _SameTypes = is_same<typename MatrixType::Scalar, typename DiagonalType::Scalar>::value,
+    // FIXME currently we need same types, but in the future the next rule should be the one
+    //_Vectorizable = bool(int(MatrixFlags)&PacketAccessBit) && ((!_PacketOnDiag) || (_SameTypes && bool(int(DiagFlags)&PacketAccessBit))),
+    _Vectorizable = bool(int(MatrixFlags)&PacketAccessBit) && _SameTypes && (_ScalarAccessOnDiag || (bool(int(DiagFlags)&PacketAccessBit))),
+    // Linear access is only kept when the dense operand is a compile-time vector.
+    _LinearAccessMask = (MatrixType::RowsAtCompileTime==1 || MatrixType::ColsAtCompileTime==1) ? LinearAccessBit : 0,
+    Flags = ((HereditaryBits|_LinearAccessMask) & (unsigned int)(MatrixFlags)) | (_Vectorizable ? PacketAccessBit : 0),
+    Alignment = evaluator<MatrixType>::Alignment,
+    // When set, coeff(Index) multiplies every coefficient by the single diagonal entry 0.
+    AsScalarProduct =     (DiagonalType::SizeAtCompileTime==1)
+                      ||  (DiagonalType::SizeAtCompileTime==Dynamic && MatrixType::RowsAtCompileTime==1 && ProductOrder==OnTheLeft)
+                      ||  (DiagonalType::SizeAtCompileTime==Dynamic && MatrixType::ColsAtCompileTime==1 && ProductOrder==OnTheRight)
+  };
+  /** Builds the two nested evaluators from the dense operand \a mat and the diagonal vector \a diag.
+    * Marked EIGEN_DEVICE_FUNC because the derived product_evaluator constructors, which
+    * call this one, are themselves EIGEN_DEVICE_FUNC.
+    */
+  EIGEN_DEVICE_FUNC diagonal_product_evaluator_base(const MatrixType &mat, const DiagonalType &diag)
+    : m_diagImpl(diag), m_matImpl(mat)
+  {
+    EIGEN_INTERNAL_CHECK_COST_VALUE(NumTraits<Scalar>::MulCost);
+    EIGEN_INTERNAL_CHECK_COST_VALUE(CoeffReadCost);
+  }
+  /** \returns the product coefficient at linear index \a idx. */
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Scalar coeff(Index idx) const
+  {
+    if(AsScalarProduct)
+      return m_diagImpl.coeff(0) * m_matImpl.coeff(idx);
+    else
+      return m_diagImpl.coeff(idx) * m_matImpl.coeff(idx);
+  }
+protected:
+  /** true_type overload: multiplies the dense packet at (row, col) by the diagonal
+    * coefficient \a id broadcast to a full packet. */
+  template<int LoadMode,typename PacketType>
+  EIGEN_STRONG_INLINE PacketType packet_impl(Index row, Index col, Index id, internal::true_type) const
+  {
+    return internal::pmul(m_matImpl.template packet<LoadMode,PacketType>(row, col),
+                          internal::pset1<PacketType>(m_diagImpl.coeff(id)));
+  }
+  /** false_type overload: multiplies the dense packet at (row, col) by a packet loaded
+    * from the diagonal starting at \a id. */
+  template<int LoadMode,typename PacketType>
+  EIGEN_STRONG_INLINE PacketType packet_impl(Index row, Index col, Index id, internal::false_type) const
+  {
+    enum {
+      InnerSize = (MatrixType::Flags & RowMajorBit) ? MatrixType::ColsAtCompileTime : MatrixType::RowsAtCompileTime,
+      // Load mode for the diagonal: never stronger than LoadMode.
+      DiagonalPacketLoadMode = EIGEN_PLAIN_ENUM_MIN(LoadMode,((InnerSize%16) == 0) ? int(Aligned16) : int(evaluator<DiagonalType>::Alignment)) // FIXME hardcoded 16!!
+    };
+    return internal::pmul(m_matImpl.template packet<LoadMode,PacketType>(row, col),
+                          m_diagImpl.template packet<DiagonalPacketLoadMode,PacketType>(id));
+  }
+  evaluator<DiagonalType> m_diagImpl;
+  evaluator<MatrixType>   m_matImpl;
+};
+// diagonal * dense
+/** \internal
+  * Evaluator of a product whose lhs has DiagonalShape and whose rhs has DenseShape.
+  * Coefficient (row, col) is the diagonal entry \a row times the rhs coefficient (row, col).
+  */
+template<typename Lhs, typename Rhs, int ProductKind, int ProductTag>
+struct product_evaluator<Product<Lhs, Rhs, ProductKind>, ProductTag, DiagonalShape, DenseShape>
+  : diagonal_product_evaluator_base<Rhs, typename Lhs::DiagonalVectorType, Product<Lhs, Rhs, LazyProduct>, OnTheLeft>
+{
+  typedef diagonal_product_evaluator_base<Rhs, typename Lhs::DiagonalVectorType, Product<Lhs, Rhs, LazyProduct>, OnTheLeft> Base;
+  typedef typename Base::Scalar Scalar;
+  typedef Product<Lhs, Rhs, ProductKind> XprType;
+  typedef typename XprType::PlainObject PlainObject;
+  using Base::coeff;
+  using Base::m_matImpl;
+  using Base::m_diagImpl;
+  enum {
+    StorageOrder = int(Rhs::Flags) & RowMajorBit ? RowMajor : ColMajor
+  };
+  // The base takes the dense operand first, then the vector of diagonal coefficients.
+  EIGEN_DEVICE_FUNC explicit product_evaluator(const XprType& xpr)
+    : Base(xpr.rhs(), xpr.lhs().diagonal())
+  {}
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Scalar coeff(Index row, Index col) const
+  {
+    return m_diagImpl.coeff(row) * m_matImpl.coeff(row, col);
+  }
+#ifndef __CUDACC__
+  template<int LoadMode,typename PacketType>
+  EIGEN_STRONG_INLINE PacketType packet(Index row, Index col) const
+  {
+    // FIXME: NVCC used to complain about the template keyword, but we have to check whether this is still the case.
+    // See also similar calls below.
+    // Row-major rhs: select the packet_impl overload that broadcasts one diagonal entry.
+    typedef typename internal::conditional<int(StorageOrder)==RowMajor,
+                                           internal::true_type,
+                                           internal::false_type>::type BroadcastDiagTag;
+    return this->template packet_impl<LoadMode,PacketType>(row, col, row, BroadcastDiagTag());
+  }
+  template<int LoadMode,typename PacketType>
+  EIGEN_STRONG_INLINE PacketType packet(Index idx) const
+  {
+    // Map the linear index onto (idx, 0) for column-major storage, (0, idx) otherwise.
+    const bool isColMajor = (int(StorageOrder)==ColMajor);
+    const Index row = isColMajor ? idx : Index(0);
+    const Index col = isColMajor ? Index(0) : idx;
+    return packet<LoadMode,PacketType>(row, col);
+  }
+#endif
+};
+// dense * diagonal
+/** \internal
+  * Evaluator of a product whose lhs has DenseShape and whose rhs has DiagonalShape.
+  * Coefficient (row, col) is the lhs coefficient (row, col) times the diagonal entry \a col.
+  */
+template<typename Lhs, typename Rhs, int ProductKind, int ProductTag>
+struct product_evaluator<Product<Lhs, Rhs, ProductKind>, ProductTag, DenseShape, DiagonalShape>
+  : diagonal_product_evaluator_base<Lhs, typename Rhs::DiagonalVectorType, Product<Lhs, Rhs, LazyProduct>, OnTheRight>
+{
+  typedef diagonal_product_evaluator_base<Lhs, typename Rhs::DiagonalVectorType, Product<Lhs, Rhs, LazyProduct>, OnTheRight> Base;
+  typedef typename Base::Scalar Scalar;
+  typedef Product<Lhs, Rhs, ProductKind> XprType;
+  typedef typename XprType::PlainObject PlainObject;
+  using Base::coeff;
+  using Base::m_matImpl;
+  using Base::m_diagImpl;
+  enum {
+    StorageOrder = int(Lhs::Flags) & RowMajorBit ? RowMajor : ColMajor
+  };
+  // The base takes the dense operand first, then the vector of diagonal coefficients.
+  EIGEN_DEVICE_FUNC explicit product_evaluator(const XprType& xpr)
+    : Base(xpr.lhs(), xpr.rhs().diagonal())
+  {}
+  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Scalar coeff(Index row, Index col) const
+  {
+    return m_matImpl.coeff(row, col) * m_diagImpl.coeff(col);
+  }
+#ifndef __CUDACC__
+  template<int LoadMode,typename PacketType>
+  EIGEN_STRONG_INLINE PacketType packet(Index row, Index col) const
+  {
+    // Column-major lhs: select the packet_impl overload that broadcasts one diagonal entry.
+    typedef typename internal::conditional<int(StorageOrder)==ColMajor,
+                                           internal::true_type,
+                                           internal::false_type>::type BroadcastDiagTag;
+    return this->template packet_impl<LoadMode,PacketType>(row, col, col, BroadcastDiagTag());
+  }
+  template<int LoadMode,typename PacketType>
+  EIGEN_STRONG_INLINE PacketType packet(Index idx) const
+  {
+    // Map the linear index onto (idx, 0) for column-major storage, (0, idx) otherwise.
+    const bool isColMajor = (int(StorageOrder)==ColMajor);
+    const Index row = isColMajor ? idx : Index(0);
+    const Index col = isColMajor ? Index(0) : idx;
+    return packet<LoadMode,PacketType>(row, col);
+  }
+#endif
+};
+/***************************************************************************
+* Products with permutation matrices
+***************************************************************************/
+/** \internal
+  * \class permutation_matrix_product
+  * Internal helper class implementing the product between a permutation matrix and a matrix.
+  * This class is specialized for DenseShape below and for SparseShape in SparseCore/SparsePermutation.h
+  *
+  * The primary template is only declared here, so it is usable solely through
+  * its specializations.
+  */
+template<typename ExpressionType, int Side, bool Transposed, typename ExpressionShape>
+struct permutation_matrix_product;
+/** \internal
+  * DenseShape specialization. run() writes into \a dst the expression \a xpr with its
+  * rows (Side==OnTheLeft) or columns (Side==OnTheRight) rearranged according to the
+  * indices of \a perm; \c Transposed flips which side of the copy is indexed through
+  * the permutation. When \a dst and the evaluated expression are the same dense object
+  * (as reported by is_same_dense), the rearrangement is done in place with swaps.
+  */
+template<typename ExpressionType, int Side, bool Transposed>
+struct permutation_matrix_product<ExpressionType, Side, Transposed, DenseShape>
+{
+    typedef typename nested_eval<ExpressionType, 1>::type MatrixType;
+    typedef typename remove_all<MatrixType>::type MatrixTypeCleaned;
+    template<typename Dest, typename PermutationType>
+    static inline void run(Dest& dst, const PermutationType& perm, const ExpressionType& xpr)
+    {
+      MatrixType mat(xpr);
+      // Number of rows/columns to move; only used by the out-of-place branch below.
+      const Index n = Side==OnTheLeft ? mat.rows() : mat.cols();
+      // FIXME we need an is_same for expression that is not sensitive to constness. For instance
+      // is_same_xpr<Block<const Matrix>, Block<Matrix> >::value should be true.
+      //if(is_same<MatrixTypeCleaned,Dest>::value && extract_data(dst) == extract_data(mat))
+      if(is_same_dense(dst, mat))
+      {
+        // apply the permutation inplace
+        // mask[i] records whether index i has already been handled as part of a cycle.
+        Matrix<bool,PermutationType::RowsAtCompileTime,1,0,PermutationType::MaxRowsAtCompileTime> mask(perm.size());
+        mask.fill(false);
+        Index r = 0;
+        while(r < perm.size())
+        {
+          // search for the next seed
+          while(r<perm.size() && mask[r]) r++;
+          if(r>=perm.size())
+            break;
+          // we got one, let's follow it until we are back to the seed
+          Index k0 = r++;
+          Index kPrev = k0;
+          mask.coeffRef(k0) = true;
+          for(Index k=perm.indices().coeff(k0); k!=k0; k=perm.indices().coeff(k))
+          {
+            // Swap row/column k with either the seed k0 or the previously visited index,
+            // depending on (Side==OnTheLeft) ^ Transposed.
+                  Block<Dest, Side==OnTheLeft ? 1 : Dest::RowsAtCompileTime, Side==OnTheRight ? 1 : Dest::ColsAtCompileTime>(dst, k)
+            .swap(Block<Dest, Side==OnTheLeft ? 1 : Dest::RowsAtCompileTime, Side==OnTheRight ? 1 : Dest::ColsAtCompileTime>
+                       (dst,((Side==OnTheLeft) ^ Transposed) ? k0 : kPrev));
+            mask.coeffRef(k) = true;
+            kPrev = k;
+          }
+        }
+      }
+      else
+      {
+        // Out-of-place: copy one row/column per iteration. Exactly one of the two
+        // conditions below holds, so exactly one of the destination and source
+        // positions is looked up through perm.indices(); the other is plain i.
+        for(Index i = 0; i < n; ++i)
+        {
+          Block<Dest, Side==OnTheLeft ? 1 : Dest::RowsAtCompileTime, Side==OnTheRight ? 1 : Dest::ColsAtCompileTime>
+               (dst, ((Side==OnTheLeft) ^ Transposed) ? perm.indices().coeff(i) : i)
+          =
+          Block<const MatrixTypeCleaned,Side==OnTheLeft ? 1 : MatrixTypeCleaned::RowsAtCompileTime,Side==OnTheRight ? 1 : MatrixTypeCleaned::ColsAtCompileTime>
+               (mat, ((Side==OnTheRight) ^ Transposed) ? perm.indices().coeff(i) : i);
+        }
+      }
+    }
+};
+/** \internal
+  * Product dispatcher for a PermutationShape lhs: evalTo() hands \a dst, the permutation
+  * \a lhs and the matrix \a rhs to permutation_matrix_product with Side=OnTheLeft,
+  * Transposed=false.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Lhs, Rhs, PermutationShape, MatrixShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Lhs& lhs, const Rhs& rhs)
+  {
+    typedef permutation_matrix_product<Rhs, OnTheLeft, false, MatrixShape> Applier;
+    Applier::run(dst, lhs, rhs);
+  }
+};
+/** \internal
+  * Product dispatcher for a PermutationShape rhs: evalTo() hands \a dst, the permutation
+  * \a rhs and the matrix \a lhs to permutation_matrix_product with Side=OnTheRight,
+  * Transposed=false.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Lhs, Rhs, MatrixShape, PermutationShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Lhs& lhs, const Rhs& rhs)
+  {
+    typedef permutation_matrix_product<Lhs, OnTheRight, false, MatrixShape> Applier;
+    Applier::run(dst, rhs, lhs);
+  }
+};
+/** \internal
+  * Product dispatcher for an Inverse<> of a PermutationShape lhs: evalTo() unwraps the
+  * inverse and calls permutation_matrix_product with Side=OnTheLeft, Transposed=true.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Inverse<Lhs>, Rhs, PermutationShape, MatrixShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Inverse<Lhs>& lhs, const Rhs& rhs)
+  {
+    typedef permutation_matrix_product<Rhs, OnTheLeft, true, MatrixShape> Applier;
+    Applier::run(dst, lhs.nestedExpression(), rhs);
+  }
+};
+/** \internal
+  * Product dispatcher for an Inverse<> of a PermutationShape rhs: evalTo() unwraps the
+  * inverse and calls permutation_matrix_product with Side=OnTheRight, Transposed=true.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Lhs, Inverse<Rhs>, MatrixShape, PermutationShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Lhs& lhs, const Inverse<Rhs>& rhs)
+  {
+    typedef permutation_matrix_product<Lhs, OnTheRight, true, MatrixShape> Applier;
+    Applier::run(dst, rhs.nestedExpression(), lhs);
+  }
+};
+/***************************************************************************
+* Products with transpositions matrices
+***************************************************************************/
+// FIXME could we unify Transpositions and Permutation into a single "shape"??
+/** \internal
+  * \class transposition_matrix_product
+  * Internal helper class implementing the product between a sequence of transpositions and a matrix.
+  *
+  * run() first copies the evaluated expression into \a dst (unless both already are the
+  * same dense object), then, for each k with tr.coeff(k) != k, swaps rows (Side==OnTheLeft)
+  * or columns (Side==OnTheRight) k and tr.coeff(k) of \a dst. The entries are visited from
+  * first to last, or from last to first when \c Transposed is true.
+  */
+template<typename ExpressionType, int Side, bool Transposed, typename ExpressionShape>
+struct transposition_matrix_product
+{
+  typedef typename nested_eval<ExpressionType, 1>::type MatrixType;
+  typedef typename remove_all<MatrixType>::type MatrixTypeCleaned;
+  template<typename Dest, typename TranspositionType>
+  static inline void run(Dest& dst, const TranspositionType& tr, const ExpressionType& xpr)
+  {
+    typedef typename TranspositionType::StorageIndex StorageIndex;
+    MatrixType mat(xpr);
+    const Index size = tr.size();
+    if(!is_same_dense(dst,mat))
+      dst = mat;
+    // Walk the transpositions forward, or backward when Transposed.
+    const Index first = Transposed ? size-1 : 0;
+    const Index step  = Transposed ? -1 : 1;
+    Index k = first;
+    for(Index visited = 0; visited < size; ++visited, k += step)
+    {
+      const StorageIndex j = tr.coeff(k);
+      if(Index(j) == k)
+        continue; // identity transposition: nothing to swap
+      if(Side==OnTheLeft)        dst.row(k).swap(dst.row(j));
+      else if(Side==OnTheRight)  dst.col(k).swap(dst.col(j));
+    }
+  }
+};
+/** \internal
+  * Product dispatcher for a TranspositionsShape lhs: evalTo() hands \a dst, the
+  * transpositions \a lhs and the matrix \a rhs to transposition_matrix_product with
+  * Side=OnTheLeft, Transposed=false.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Lhs, Rhs, TranspositionsShape, MatrixShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Lhs& lhs, const Rhs& rhs)
+  {
+    typedef transposition_matrix_product<Rhs, OnTheLeft, false, MatrixShape> Applier;
+    Applier::run(dst, lhs, rhs);
+  }
+};
+/** \internal
+  * Product dispatcher for a TranspositionsShape rhs: evalTo() hands \a dst, the
+  * transpositions \a rhs and the matrix \a lhs to transposition_matrix_product with
+  * Side=OnTheRight, Transposed=false.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Lhs, Rhs, MatrixShape, TranspositionsShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Lhs& lhs, const Rhs& rhs)
+  {
+    typedef transposition_matrix_product<Lhs, OnTheRight, false, MatrixShape> Applier;
+    Applier::run(dst, rhs, lhs);
+  }
+};
+/** \internal
+  * Product dispatcher for a Transpose<> of a TranspositionsShape lhs: evalTo() unwraps
+  * the transpose and calls transposition_matrix_product with Side=OnTheLeft,
+  * Transposed=true.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Transpose<Lhs>, Rhs, TranspositionsShape, MatrixShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Transpose<Lhs>& lhs, const Rhs& rhs)
+  {
+    typedef transposition_matrix_product<Rhs, OnTheLeft, true, MatrixShape> Applier;
+    Applier::run(dst, lhs.nestedExpression(), rhs);
+  }
+};
+/** \internal
+  * Product dispatcher for a Transpose<> of a TranspositionsShape rhs: evalTo() unwraps
+  * the transpose and calls transposition_matrix_product with Side=OnTheRight,
+  * Transposed=true.
+  */
+template<typename Lhs, typename Rhs, int ProductTag, typename MatrixShape>
+struct generic_product_impl<Lhs, Transpose<Rhs>, MatrixShape, TranspositionsShape, ProductTag>
+{
+  template<typename Dest>
+  static void evalTo(Dest& dst, const Lhs& lhs, const Transpose<Rhs>& rhs)
+  {
+    typedef transposition_matrix_product<Lhs, OnTheRight, true, MatrixShape> Applier;
+    Applier::run(dst, rhs.nestedExpression(), lhs);
+  }
+};
+} // end namespace internal
+} // end namespace Eigen
+#endif // EIGEN_PRODUCT_EVALUATORS_H