RubyGems - umappp - Versions diffs - 0.1.2 - Mend

umappp 0.1.2

Files changed (395) hide show

checksums.yaml +7 -0
data/LICENSE.txt +25 -0
data/README.md +110 -0
data/ext/umappp/extconf.rb +25 -0
data/ext/umappp/numo.hpp +867 -0
data/ext/umappp/umappp.cpp +225 -0
data/lib/umappp/version.rb +5 -0
data/lib/umappp.rb +41 -0
data/vendor/Eigen/Cholesky +45 -0
data/vendor/Eigen/CholmodSupport +48 -0
data/vendor/Eigen/Core +384 -0
data/vendor/Eigen/Dense +7 -0
data/vendor/Eigen/Eigen +2 -0
data/vendor/Eigen/Eigenvalues +60 -0
data/vendor/Eigen/Geometry +59 -0
data/vendor/Eigen/Householder +29 -0
data/vendor/Eigen/IterativeLinearSolvers +48 -0
data/vendor/Eigen/Jacobi +32 -0
data/vendor/Eigen/KLUSupport +41 -0
data/vendor/Eigen/LU +47 -0
data/vendor/Eigen/MetisSupport +35 -0
data/vendor/Eigen/OrderingMethods +70 -0
data/vendor/Eigen/PaStiXSupport +49 -0
data/vendor/Eigen/PardisoSupport +35 -0
data/vendor/Eigen/QR +50 -0
data/vendor/Eigen/QtAlignedMalloc +39 -0
data/vendor/Eigen/SPQRSupport +34 -0
data/vendor/Eigen/SVD +50 -0
data/vendor/Eigen/Sparse +34 -0
data/vendor/Eigen/SparseCholesky +37 -0
data/vendor/Eigen/SparseCore +69 -0
data/vendor/Eigen/SparseLU +50 -0
data/vendor/Eigen/SparseQR +36 -0
data/vendor/Eigen/StdDeque +27 -0
data/vendor/Eigen/StdList +26 -0
data/vendor/Eigen/StdVector +27 -0
data/vendor/Eigen/SuperLUSupport +64 -0
data/vendor/Eigen/UmfPackSupport +40 -0
data/vendor/Eigen/src/Cholesky/LDLT.h +688 -0
data/vendor/Eigen/src/Cholesky/LLT.h +558 -0
data/vendor/Eigen/src/Cholesky/LLT_LAPACKE.h +99 -0
data/vendor/Eigen/src/CholmodSupport/CholmodSupport.h +682 -0
data/vendor/Eigen/src/Core/ArithmeticSequence.h +413 -0
data/vendor/Eigen/src/Core/Array.h +417 -0
data/vendor/Eigen/src/Core/ArrayBase.h +226 -0
data/vendor/Eigen/src/Core/ArrayWrapper.h +209 -0
data/vendor/Eigen/src/Core/Assign.h +90 -0
data/vendor/Eigen/src/Core/AssignEvaluator.h +1010 -0
data/vendor/Eigen/src/Core/Assign_MKL.h +178 -0
data/vendor/Eigen/src/Core/BandMatrix.h +353 -0
data/vendor/Eigen/src/Core/Block.h +448 -0
data/vendor/Eigen/src/Core/BooleanRedux.h +162 -0
data/vendor/Eigen/src/Core/CommaInitializer.h +164 -0
data/vendor/Eigen/src/Core/ConditionEstimator.h +175 -0
data/vendor/Eigen/src/Core/CoreEvaluators.h +1741 -0
data/vendor/Eigen/src/Core/CoreIterators.h +132 -0
data/vendor/Eigen/src/Core/CwiseBinaryOp.h +183 -0
data/vendor/Eigen/src/Core/CwiseNullaryOp.h +1001 -0
data/vendor/Eigen/src/Core/CwiseTernaryOp.h +197 -0
data/vendor/Eigen/src/Core/CwiseUnaryOp.h +103 -0
data/vendor/Eigen/src/Core/CwiseUnaryView.h +132 -0
data/vendor/Eigen/src/Core/DenseBase.h +701 -0
data/vendor/Eigen/src/Core/DenseCoeffsBase.h +685 -0
data/vendor/Eigen/src/Core/DenseStorage.h +652 -0
data/vendor/Eigen/src/Core/Diagonal.h +258 -0
data/vendor/Eigen/src/Core/DiagonalMatrix.h +391 -0
data/vendor/Eigen/src/Core/DiagonalProduct.h +28 -0
data/vendor/Eigen/src/Core/Dot.h +318 -0
data/vendor/Eigen/src/Core/EigenBase.h +160 -0
data/vendor/Eigen/src/Core/ForceAlignedAccess.h +150 -0
data/vendor/Eigen/src/Core/Fuzzy.h +155 -0
data/vendor/Eigen/src/Core/GeneralProduct.h +465 -0
data/vendor/Eigen/src/Core/GenericPacketMath.h +1040 -0
data/vendor/Eigen/src/Core/GlobalFunctions.h +194 -0
data/vendor/Eigen/src/Core/IO.h +258 -0
data/vendor/Eigen/src/Core/IndexedView.h +237 -0
data/vendor/Eigen/src/Core/Inverse.h +117 -0
data/vendor/Eigen/src/Core/Map.h +171 -0
data/vendor/Eigen/src/Core/MapBase.h +310 -0
data/vendor/Eigen/src/Core/MathFunctions.h +2057 -0
data/vendor/Eigen/src/Core/MathFunctionsImpl.h +200 -0
data/vendor/Eigen/src/Core/Matrix.h +565 -0
data/vendor/Eigen/src/Core/MatrixBase.h +547 -0
data/vendor/Eigen/src/Core/NestByValue.h +85 -0
data/vendor/Eigen/src/Core/NoAlias.h +109 -0
data/vendor/Eigen/src/Core/NumTraits.h +335 -0
data/vendor/Eigen/src/Core/PartialReduxEvaluator.h +232 -0
data/vendor/Eigen/src/Core/PermutationMatrix.h +605 -0
data/vendor/Eigen/src/Core/PlainObjectBase.h +1128 -0
data/vendor/Eigen/src/Core/Product.h +191 -0
data/vendor/Eigen/src/Core/ProductEvaluators.h +1179 -0
data/vendor/Eigen/src/Core/Random.h +218 -0
data/vendor/Eigen/src/Core/Redux.h +515 -0
data/vendor/Eigen/src/Core/Ref.h +381 -0
data/vendor/Eigen/src/Core/Replicate.h +142 -0
data/vendor/Eigen/src/Core/Reshaped.h +454 -0
data/vendor/Eigen/src/Core/ReturnByValue.h +119 -0
data/vendor/Eigen/src/Core/Reverse.h +217 -0
data/vendor/Eigen/src/Core/Select.h +164 -0
data/vendor/Eigen/src/Core/SelfAdjointView.h +365 -0
data/vendor/Eigen/src/Core/SelfCwiseBinaryOp.h +47 -0
data/vendor/Eigen/src/Core/Solve.h +188 -0
data/vendor/Eigen/src/Core/SolveTriangular.h +235 -0
data/vendor/Eigen/src/Core/SolverBase.h +168 -0
data/vendor/Eigen/src/Core/StableNorm.h +251 -0
data/vendor/Eigen/src/Core/StlIterators.h +463 -0
data/vendor/Eigen/src/Core/Stride.h +116 -0
data/vendor/Eigen/src/Core/Swap.h +68 -0
data/vendor/Eigen/src/Core/Transpose.h +464 -0
data/vendor/Eigen/src/Core/Transpositions.h +386 -0
data/vendor/Eigen/src/Core/TriangularMatrix.h +1001 -0
data/vendor/Eigen/src/Core/VectorBlock.h +96 -0
data/vendor/Eigen/src/Core/VectorwiseOp.h +784 -0
data/vendor/Eigen/src/Core/Visitor.h +381 -0
data/vendor/Eigen/src/Core/arch/AVX/Complex.h +372 -0
data/vendor/Eigen/src/Core/arch/AVX/MathFunctions.h +228 -0
data/vendor/Eigen/src/Core/arch/AVX/PacketMath.h +1574 -0
data/vendor/Eigen/src/Core/arch/AVX/TypeCasting.h +115 -0
data/vendor/Eigen/src/Core/arch/AVX512/Complex.h +422 -0
data/vendor/Eigen/src/Core/arch/AVX512/MathFunctions.h +362 -0
data/vendor/Eigen/src/Core/arch/AVX512/PacketMath.h +2303 -0
data/vendor/Eigen/src/Core/arch/AVX512/TypeCasting.h +89 -0
data/vendor/Eigen/src/Core/arch/AltiVec/Complex.h +417 -0
data/vendor/Eigen/src/Core/arch/AltiVec/MathFunctions.h +90 -0
data/vendor/Eigen/src/Core/arch/AltiVec/MatrixProduct.h +2937 -0
data/vendor/Eigen/src/Core/arch/AltiVec/MatrixProductCommon.h +221 -0
data/vendor/Eigen/src/Core/arch/AltiVec/MatrixProductMMA.h +629 -0
data/vendor/Eigen/src/Core/arch/AltiVec/PacketMath.h +2711 -0
data/vendor/Eigen/src/Core/arch/CUDA/Complex.h +258 -0
data/vendor/Eigen/src/Core/arch/Default/BFloat16.h +700 -0
data/vendor/Eigen/src/Core/arch/Default/ConjHelper.h +117 -0
data/vendor/Eigen/src/Core/arch/Default/GenericPacketMathFunctions.h +1649 -0
data/vendor/Eigen/src/Core/arch/Default/GenericPacketMathFunctionsFwd.h +110 -0
data/vendor/Eigen/src/Core/arch/Default/Half.h +942 -0
data/vendor/Eigen/src/Core/arch/Default/Settings.h +49 -0
data/vendor/Eigen/src/Core/arch/Default/TypeCasting.h +120 -0
data/vendor/Eigen/src/Core/arch/GPU/MathFunctions.h +103 -0
data/vendor/Eigen/src/Core/arch/GPU/PacketMath.h +1685 -0
data/vendor/Eigen/src/Core/arch/GPU/TypeCasting.h +80 -0
data/vendor/Eigen/src/Core/arch/HIP/hcc/math_constants.h +23 -0
data/vendor/Eigen/src/Core/arch/MSA/Complex.h +648 -0
data/vendor/Eigen/src/Core/arch/MSA/MathFunctions.h +387 -0
data/vendor/Eigen/src/Core/arch/MSA/PacketMath.h +1233 -0
data/vendor/Eigen/src/Core/arch/NEON/Complex.h +584 -0
data/vendor/Eigen/src/Core/arch/NEON/GeneralBlockPanelKernel.h +183 -0
data/vendor/Eigen/src/Core/arch/NEON/MathFunctions.h +75 -0
data/vendor/Eigen/src/Core/arch/NEON/PacketMath.h +4587 -0
data/vendor/Eigen/src/Core/arch/NEON/TypeCasting.h +1419 -0
data/vendor/Eigen/src/Core/arch/SSE/Complex.h +351 -0
data/vendor/Eigen/src/Core/arch/SSE/MathFunctions.h +199 -0
data/vendor/Eigen/src/Core/arch/SSE/PacketMath.h +1505 -0
data/vendor/Eigen/src/Core/arch/SSE/TypeCasting.h +142 -0
data/vendor/Eigen/src/Core/arch/SVE/MathFunctions.h +44 -0
data/vendor/Eigen/src/Core/arch/SVE/PacketMath.h +752 -0
data/vendor/Eigen/src/Core/arch/SVE/TypeCasting.h +49 -0
data/vendor/Eigen/src/Core/arch/SYCL/InteropHeaders.h +232 -0
data/vendor/Eigen/src/Core/arch/SYCL/MathFunctions.h +301 -0
data/vendor/Eigen/src/Core/arch/SYCL/PacketMath.h +670 -0
data/vendor/Eigen/src/Core/arch/SYCL/SyclMemoryModel.h +694 -0
data/vendor/Eigen/src/Core/arch/SYCL/TypeCasting.h +85 -0
data/vendor/Eigen/src/Core/arch/ZVector/Complex.h +426 -0
data/vendor/Eigen/src/Core/arch/ZVector/MathFunctions.h +233 -0
data/vendor/Eigen/src/Core/arch/ZVector/PacketMath.h +1060 -0
data/vendor/Eigen/src/Core/functors/AssignmentFunctors.h +177 -0
data/vendor/Eigen/src/Core/functors/BinaryFunctors.h +541 -0
data/vendor/Eigen/src/Core/functors/NullaryFunctors.h +189 -0
data/vendor/Eigen/src/Core/functors/StlFunctors.h +166 -0
data/vendor/Eigen/src/Core/functors/TernaryFunctors.h +25 -0
data/vendor/Eigen/src/Core/functors/UnaryFunctors.h +1131 -0
data/vendor/Eigen/src/Core/products/GeneralBlockPanelKernel.h +2645 -0
data/vendor/Eigen/src/Core/products/GeneralMatrixMatrix.h +517 -0
data/vendor/Eigen/src/Core/products/GeneralMatrixMatrixTriangular.h +317 -0
data/vendor/Eigen/src/Core/products/GeneralMatrixMatrixTriangular_BLAS.h +145 -0
data/vendor/Eigen/src/Core/products/GeneralMatrixMatrix_BLAS.h +124 -0
data/vendor/Eigen/src/Core/products/GeneralMatrixVector.h +518 -0
data/vendor/Eigen/src/Core/products/GeneralMatrixVector_BLAS.h +136 -0
data/vendor/Eigen/src/Core/products/Parallelizer.h +180 -0
data/vendor/Eigen/src/Core/products/SelfadjointMatrixMatrix.h +544 -0
data/vendor/Eigen/src/Core/products/SelfadjointMatrixMatrix_BLAS.h +295 -0
data/vendor/Eigen/src/Core/products/SelfadjointMatrixVector.h +262 -0
data/vendor/Eigen/src/Core/products/SelfadjointMatrixVector_BLAS.h +118 -0
data/vendor/Eigen/src/Core/products/SelfadjointProduct.h +133 -0
data/vendor/Eigen/src/Core/products/SelfadjointRank2Update.h +94 -0
data/vendor/Eigen/src/Core/products/TriangularMatrixMatrix.h +472 -0
data/vendor/Eigen/src/Core/products/TriangularMatrixMatrix_BLAS.h +317 -0
data/vendor/Eigen/src/Core/products/TriangularMatrixVector.h +350 -0
data/vendor/Eigen/src/Core/products/TriangularMatrixVector_BLAS.h +255 -0
data/vendor/Eigen/src/Core/products/TriangularSolverMatrix.h +337 -0
data/vendor/Eigen/src/Core/products/TriangularSolverMatrix_BLAS.h +167 -0
data/vendor/Eigen/src/Core/products/TriangularSolverVector.h +148 -0
data/vendor/Eigen/src/Core/util/BlasUtil.h +583 -0
data/vendor/Eigen/src/Core/util/ConfigureVectorization.h +512 -0
data/vendor/Eigen/src/Core/util/Constants.h +563 -0
data/vendor/Eigen/src/Core/util/DisableStupidWarnings.h +106 -0
data/vendor/Eigen/src/Core/util/ForwardDeclarations.h +322 -0
data/vendor/Eigen/src/Core/util/IndexedViewHelper.h +186 -0
data/vendor/Eigen/src/Core/util/IntegralConstant.h +272 -0
data/vendor/Eigen/src/Core/util/MKL_support.h +137 -0
data/vendor/Eigen/src/Core/util/Macros.h +1464 -0
data/vendor/Eigen/src/Core/util/Memory.h +1163 -0
data/vendor/Eigen/src/Core/util/Meta.h +812 -0
data/vendor/Eigen/src/Core/util/NonMPL2.h +3 -0
data/vendor/Eigen/src/Core/util/ReenableStupidWarnings.h +31 -0
data/vendor/Eigen/src/Core/util/ReshapedHelper.h +51 -0
data/vendor/Eigen/src/Core/util/StaticAssert.h +221 -0
data/vendor/Eigen/src/Core/util/SymbolicIndex.h +293 -0
data/vendor/Eigen/src/Core/util/XprHelper.h +856 -0
data/vendor/Eigen/src/Eigenvalues/ComplexEigenSolver.h +346 -0
data/vendor/Eigen/src/Eigenvalues/ComplexSchur.h +462 -0
data/vendor/Eigen/src/Eigenvalues/ComplexSchur_LAPACKE.h +91 -0
data/vendor/Eigen/src/Eigenvalues/EigenSolver.h +622 -0
data/vendor/Eigen/src/Eigenvalues/GeneralizedEigenSolver.h +418 -0
data/vendor/Eigen/src/Eigenvalues/GeneralizedSelfAdjointEigenSolver.h +226 -0
data/vendor/Eigen/src/Eigenvalues/HessenbergDecomposition.h +374 -0
data/vendor/Eigen/src/Eigenvalues/MatrixBaseEigenvalues.h +158 -0
data/vendor/Eigen/src/Eigenvalues/RealQZ.h +657 -0
data/vendor/Eigen/src/Eigenvalues/RealSchur.h +558 -0
data/vendor/Eigen/src/Eigenvalues/RealSchur_LAPACKE.h +77 -0
data/vendor/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h +904 -0
data/vendor/Eigen/src/Eigenvalues/SelfAdjointEigenSolver_LAPACKE.h +87 -0
data/vendor/Eigen/src/Eigenvalues/Tridiagonalization.h +561 -0
data/vendor/Eigen/src/Geometry/AlignedBox.h +486 -0
data/vendor/Eigen/src/Geometry/AngleAxis.h +247 -0
data/vendor/Eigen/src/Geometry/EulerAngles.h +114 -0
data/vendor/Eigen/src/Geometry/Homogeneous.h +501 -0
data/vendor/Eigen/src/Geometry/Hyperplane.h +282 -0
data/vendor/Eigen/src/Geometry/OrthoMethods.h +235 -0
data/vendor/Eigen/src/Geometry/ParametrizedLine.h +232 -0
data/vendor/Eigen/src/Geometry/Quaternion.h +870 -0
data/vendor/Eigen/src/Geometry/Rotation2D.h +199 -0
data/vendor/Eigen/src/Geometry/RotationBase.h +206 -0
data/vendor/Eigen/src/Geometry/Scaling.h +188 -0
data/vendor/Eigen/src/Geometry/Transform.h +1563 -0
data/vendor/Eigen/src/Geometry/Translation.h +202 -0
data/vendor/Eigen/src/Geometry/Umeyama.h +166 -0
data/vendor/Eigen/src/Geometry/arch/Geometry_SIMD.h +168 -0
data/vendor/Eigen/src/Householder/BlockHouseholder.h +110 -0
data/vendor/Eigen/src/Householder/Householder.h +176 -0
data/vendor/Eigen/src/Householder/HouseholderSequence.h +545 -0
data/vendor/Eigen/src/IterativeLinearSolvers/BasicPreconditioners.h +226 -0
data/vendor/Eigen/src/IterativeLinearSolvers/BiCGSTAB.h +212 -0
data/vendor/Eigen/src/IterativeLinearSolvers/ConjugateGradient.h +229 -0
data/vendor/Eigen/src/IterativeLinearSolvers/IncompleteCholesky.h +394 -0
data/vendor/Eigen/src/IterativeLinearSolvers/IncompleteLUT.h +453 -0
data/vendor/Eigen/src/IterativeLinearSolvers/IterativeSolverBase.h +444 -0
data/vendor/Eigen/src/IterativeLinearSolvers/LeastSquareConjugateGradient.h +198 -0
data/vendor/Eigen/src/IterativeLinearSolvers/SolveWithGuess.h +117 -0
data/vendor/Eigen/src/Jacobi/Jacobi.h +483 -0
data/vendor/Eigen/src/KLUSupport/KLUSupport.h +358 -0
data/vendor/Eigen/src/LU/Determinant.h +117 -0
data/vendor/Eigen/src/LU/FullPivLU.h +877 -0
data/vendor/Eigen/src/LU/InverseImpl.h +432 -0
data/vendor/Eigen/src/LU/PartialPivLU.h +624 -0
data/vendor/Eigen/src/LU/PartialPivLU_LAPACKE.h +83 -0
data/vendor/Eigen/src/LU/arch/InverseSize4.h +351 -0
data/vendor/Eigen/src/MetisSupport/MetisSupport.h +137 -0
data/vendor/Eigen/src/OrderingMethods/Amd.h +435 -0
data/vendor/Eigen/src/OrderingMethods/Eigen_Colamd.h +1863 -0
data/vendor/Eigen/src/OrderingMethods/Ordering.h +153 -0
data/vendor/Eigen/src/PaStiXSupport/PaStiXSupport.h +678 -0
data/vendor/Eigen/src/PardisoSupport/PardisoSupport.h +545 -0
data/vendor/Eigen/src/QR/ColPivHouseholderQR.h +674 -0
data/vendor/Eigen/src/QR/ColPivHouseholderQR_LAPACKE.h +97 -0
data/vendor/Eigen/src/QR/CompleteOrthogonalDecomposition.h +635 -0
data/vendor/Eigen/src/QR/FullPivHouseholderQR.h +713 -0
data/vendor/Eigen/src/QR/HouseholderQR.h +434 -0
data/vendor/Eigen/src/QR/HouseholderQR_LAPACKE.h +68 -0
data/vendor/Eigen/src/SPQRSupport/SuiteSparseQRSupport.h +335 -0
data/vendor/Eigen/src/SVD/BDCSVD.h +1366 -0
data/vendor/Eigen/src/SVD/JacobiSVD.h +812 -0
data/vendor/Eigen/src/SVD/JacobiSVD_LAPACKE.h +91 -0
data/vendor/Eigen/src/SVD/SVDBase.h +376 -0
data/vendor/Eigen/src/SVD/UpperBidiagonalization.h +414 -0
data/vendor/Eigen/src/SparseCholesky/SimplicialCholesky.h +697 -0
data/vendor/Eigen/src/SparseCholesky/SimplicialCholesky_impl.h +174 -0
data/vendor/Eigen/src/SparseCore/AmbiVector.h +378 -0
data/vendor/Eigen/src/SparseCore/CompressedStorage.h +274 -0
data/vendor/Eigen/src/SparseCore/ConservativeSparseSparseProduct.h +352 -0
data/vendor/Eigen/src/SparseCore/MappedSparseMatrix.h +67 -0
data/vendor/Eigen/src/SparseCore/SparseAssign.h +270 -0
data/vendor/Eigen/src/SparseCore/SparseBlock.h +571 -0
data/vendor/Eigen/src/SparseCore/SparseColEtree.h +206 -0
data/vendor/Eigen/src/SparseCore/SparseCompressedBase.h +370 -0
data/vendor/Eigen/src/SparseCore/SparseCwiseBinaryOp.h +722 -0
data/vendor/Eigen/src/SparseCore/SparseCwiseUnaryOp.h +150 -0
data/vendor/Eigen/src/SparseCore/SparseDenseProduct.h +342 -0
data/vendor/Eigen/src/SparseCore/SparseDiagonalProduct.h +138 -0
data/vendor/Eigen/src/SparseCore/SparseDot.h +98 -0
data/vendor/Eigen/src/SparseCore/SparseFuzzy.h +29 -0
data/vendor/Eigen/src/SparseCore/SparseMap.h +305 -0
data/vendor/Eigen/src/SparseCore/SparseMatrix.h +1518 -0
data/vendor/Eigen/src/SparseCore/SparseMatrixBase.h +398 -0
data/vendor/Eigen/src/SparseCore/SparsePermutation.h +178 -0
data/vendor/Eigen/src/SparseCore/SparseProduct.h +181 -0
data/vendor/Eigen/src/SparseCore/SparseRedux.h +49 -0
data/vendor/Eigen/src/SparseCore/SparseRef.h +397 -0
data/vendor/Eigen/src/SparseCore/SparseSelfAdjointView.h +659 -0
data/vendor/Eigen/src/SparseCore/SparseSolverBase.h +124 -0
data/vendor/Eigen/src/SparseCore/SparseSparseProductWithPruning.h +198 -0
data/vendor/Eigen/src/SparseCore/SparseTranspose.h +92 -0
data/vendor/Eigen/src/SparseCore/SparseTriangularView.h +189 -0
data/vendor/Eigen/src/SparseCore/SparseUtil.h +186 -0
data/vendor/Eigen/src/SparseCore/SparseVector.h +478 -0
data/vendor/Eigen/src/SparseCore/SparseView.h +254 -0
data/vendor/Eigen/src/SparseCore/TriangularSolver.h +315 -0
data/vendor/Eigen/src/SparseLU/SparseLU.h +923 -0
data/vendor/Eigen/src/SparseLU/SparseLUImpl.h +66 -0
data/vendor/Eigen/src/SparseLU/SparseLU_Memory.h +226 -0
data/vendor/Eigen/src/SparseLU/SparseLU_Structs.h +110 -0
data/vendor/Eigen/src/SparseLU/SparseLU_SupernodalMatrix.h +375 -0
data/vendor/Eigen/src/SparseLU/SparseLU_Utils.h +80 -0
data/vendor/Eigen/src/SparseLU/SparseLU_column_bmod.h +181 -0
data/vendor/Eigen/src/SparseLU/SparseLU_column_dfs.h +179 -0
data/vendor/Eigen/src/SparseLU/SparseLU_copy_to_ucol.h +107 -0
data/vendor/Eigen/src/SparseLU/SparseLU_gemm_kernel.h +280 -0
data/vendor/Eigen/src/SparseLU/SparseLU_heap_relax_snode.h +126 -0
data/vendor/Eigen/src/SparseLU/SparseLU_kernel_bmod.h +130 -0
data/vendor/Eigen/src/SparseLU/SparseLU_panel_bmod.h +223 -0
data/vendor/Eigen/src/SparseLU/SparseLU_panel_dfs.h +258 -0
data/vendor/Eigen/src/SparseLU/SparseLU_pivotL.h +137 -0
data/vendor/Eigen/src/SparseLU/SparseLU_pruneL.h +136 -0
data/vendor/Eigen/src/SparseLU/SparseLU_relax_snode.h +83 -0
data/vendor/Eigen/src/SparseQR/SparseQR.h +758 -0
data/vendor/Eigen/src/StlSupport/StdDeque.h +116 -0
data/vendor/Eigen/src/StlSupport/StdList.h +106 -0
data/vendor/Eigen/src/StlSupport/StdVector.h +131 -0
data/vendor/Eigen/src/StlSupport/details.h +84 -0
data/vendor/Eigen/src/SuperLUSupport/SuperLUSupport.h +1025 -0
data/vendor/Eigen/src/UmfPackSupport/UmfPackSupport.h +642 -0
data/vendor/Eigen/src/misc/Image.h +82 -0
data/vendor/Eigen/src/misc/Kernel.h +79 -0
data/vendor/Eigen/src/misc/RealSvd2x2.h +55 -0
data/vendor/Eigen/src/misc/blas.h +440 -0
data/vendor/Eigen/src/misc/lapack.h +152 -0
data/vendor/Eigen/src/misc/lapacke.h +16292 -0
data/vendor/Eigen/src/misc/lapacke_mangling.h +17 -0
data/vendor/Eigen/src/plugins/ArrayCwiseBinaryOps.h +358 -0
data/vendor/Eigen/src/plugins/ArrayCwiseUnaryOps.h +696 -0
data/vendor/Eigen/src/plugins/BlockMethods.h +1442 -0
data/vendor/Eigen/src/plugins/CommonCwiseBinaryOps.h +115 -0
data/vendor/Eigen/src/plugins/CommonCwiseUnaryOps.h +177 -0
data/vendor/Eigen/src/plugins/IndexedViewMethods.h +262 -0
data/vendor/Eigen/src/plugins/MatrixCwiseBinaryOps.h +152 -0
data/vendor/Eigen/src/plugins/MatrixCwiseUnaryOps.h +95 -0
data/vendor/Eigen/src/plugins/ReshapedMethods.h +149 -0
data/vendor/aarand/aarand.hpp +114 -0
data/vendor/annoy/annoylib.h +1495 -0
data/vendor/annoy/kissrandom.h +120 -0
data/vendor/annoy/mman.h +242 -0
data/vendor/hnswlib/bruteforce.h +152 -0
data/vendor/hnswlib/hnswalg.h +1192 -0
data/vendor/hnswlib/hnswlib.h +108 -0
data/vendor/hnswlib/space_ip.h +282 -0
data/vendor/hnswlib/space_l2.h +281 -0
data/vendor/hnswlib/visited_list_pool.h +79 -0
data/vendor/irlba/irlba.hpp +575 -0
data/vendor/irlba/lanczos.hpp +212 -0
data/vendor/irlba/parallel.hpp +474 -0
data/vendor/irlba/utils.hpp +224 -0
data/vendor/irlba/wrappers.hpp +228 -0
data/vendor/kmeans/Base.hpp +75 -0
data/vendor/kmeans/Details.hpp +79 -0
data/vendor/kmeans/HartiganWong.hpp +492 -0
data/vendor/kmeans/InitializeKmeansPP.hpp +144 -0
data/vendor/kmeans/InitializeNone.hpp +44 -0
data/vendor/kmeans/InitializePCAPartition.hpp +309 -0
data/vendor/kmeans/InitializeRandom.hpp +91 -0
data/vendor/kmeans/Kmeans.hpp +161 -0
data/vendor/kmeans/Lloyd.hpp +134 -0
data/vendor/kmeans/MiniBatch.hpp +269 -0
data/vendor/kmeans/QuickSearch.hpp +179 -0
data/vendor/kmeans/compute_centroids.hpp +32 -0
data/vendor/kmeans/compute_wcss.hpp +27 -0
data/vendor/kmeans/is_edge_case.hpp +42 -0
data/vendor/kmeans/random.hpp +55 -0
data/vendor/knncolle/Annoy/Annoy.hpp +193 -0
data/vendor/knncolle/BruteForce/BruteForce.hpp +120 -0
data/vendor/knncolle/Hnsw/Hnsw.hpp +225 -0
data/vendor/knncolle/Kmknn/Kmknn.hpp +286 -0
data/vendor/knncolle/VpTree/VpTree.hpp +256 -0
data/vendor/knncolle/knncolle.hpp +34 -0
data/vendor/knncolle/utils/Base.hpp +100 -0
data/vendor/knncolle/utils/NeighborQueue.hpp +94 -0
data/vendor/knncolle/utils/distances.hpp +98 -0
data/vendor/knncolle/utils/find_nearest_neighbors.hpp +112 -0
data/vendor/powerit/PowerIterations.hpp +157 -0
data/vendor/umappp/NeighborList.hpp +37 -0
data/vendor/umappp/Umap.hpp +662 -0
data/vendor/umappp/combine_neighbor_sets.hpp +95 -0
data/vendor/umappp/find_ab.hpp +157 -0
data/vendor/umappp/neighbor_similarities.hpp +136 -0
data/vendor/umappp/optimize_layout.hpp +285 -0
data/vendor/umappp/spectral_init.hpp +181 -0
data/vendor/umappp/umappp.hpp +13 -0
metadata +465 -0

data/vendor/knncolle/Kmknn/Kmknn.hpp ADDED Viewed

@@ -0,0 +1,286 @@
+#ifndef KNNCOLLE_KMKNN_HPP
+#define KNNCOLLE_KMKNN_HPP
+#include "../utils/distances.hpp"
+#include "../utils/NeighborQueue.hpp"
+#include "../utils/Base.hpp"
+#include "kmeans/Kmeans.hpp"
+#include <algorithm>
+#include <vector>
+#include <random>
+#include <limits>
+#include <cmath>
+#ifdef DEBUG
+#include <iostream>
+#endif
+/**
+ * @file Kmknn.hpp
+ *
+ * @brief Implements the k-means with k-nearest neighbors (KMKNN) algorithm.
+ */
+namespace knncolle {
+/**
+ * @brief Perform a nearest neighbor search based on k-means clustering.
+ *
+ * In the k-means with k-nearest neighbors (KMKNN) algorithm (Wang, 2012), k-means clustering is first applied to the data points,
+ * with the number of cluster centers defined as the square root of the number of points.
+ * The cluster assignment and distance to the assigned cluster center for each point represent the KMKNN indexing information,
+ * allowing us to speed up the nearest neighbor search by exploiting the triangle inequality between cluster centers, the query point and each point in the cluster to narrow the search space.
+ * The advantage of the KMKNN approach is its simplicity and minimal overhead,
+ * resulting in performance improvements over conventional tree-based methods for high-dimensional data where most points need to be searched anyway.
+ *
+ * @tparam DISTANCE Class to compute the distance between vectors, see `distances::Euclidean` for an example.
+ * It must provide the static methods `raw_distance()` and `normalize()` that are used throughout this class.
+ * @tparam INDEX_t Integer type for the indices.
+ * @tparam DISTANCE_t Floating point type for the distances.
+ * @tparam QUERY_t Floating point type for the query data.
+ * @tparam INTERNAL_t Floating point type for the data.
+ *
+ * @see
+ * Wang X (2012).
+ * A fast exact k-nearest neighbors algorithm for high dimensional search using k-means clustering and triangle inequality.
+ * _Proc Int Jt Conf Neural Netw_, 43, 6:2351-2358.
+ */
+template<class DISTANCE, typename INDEX_t = int, typename DISTANCE_t = double, typename QUERY_t = DISTANCE_t, typename INTERNAL_t = DISTANCE_t>
+class Kmknn : public Base<INDEX_t, DISTANCE_t, QUERY_t> {
+private:
+    INDEX_t num_dim;
+    INDEX_t num_obs;
+public:
+    /** @return Number of observations supplied to the constructor. */
+    INDEX_t nobs() const { return num_obs; }
+    /** @return Number of dimensions supplied to the constructor. */
+    INDEX_t ndim() const { return num_dim; }
+private:
+    // Observations, reordered so that each cluster is contiguous and sorted by distance to its center.
+    std::vector<INTERNAL_t> data;
+    // Number of observations in each cluster.
+    std::vector<INDEX_t> sizes;
+    // Position (in reordered observations) at which each cluster starts.
+    std::vector<INDEX_t> offsets;
+    // Coordinates of the cluster centers, 'num_dim' values per center.
+    std::vector<INTERNAL_t> centers;
+    // 'observation_id' maps a reordered position to the original index; 'new_location' is the inverse mapping.
+    std::vector<INDEX_t> observation_id, new_location;
+    // Normalized distance from each reordered observation to its assigned center.
+    std::vector<DISTANCE_t> dist_to_centroid;
+public:
+    /**
+     * @param ndim Number of dimensions.
+     * @param nobs Number of observations.
+     * @param vals Pointer to an array of length `ndim * nobs`, corresponding to a dimension-by-observation matrix in column-major format,
+     * i.e., contiguous elements belong to the same observation.
+     * @param power Power of `nobs` to define the number of cluster centers.
+     * By default, a square root is performed.
+     *
+     * @tparam INPUT_t Floating-point type of the input data.
+     */
+    template<typename INPUT_t>
+    Kmknn(INDEX_t ndim, INDEX_t nobs, const INPUT_t* vals, double power = 0.5) :
+            num_dim(ndim),
+            num_obs(nobs),
+            // Computed in size_t so that the product cannot overflow a narrow INDEX_t.
+            data(static_cast<size_t>(ndim) * static_cast<size_t>(nobs)),
+            sizes(std::ceil(std::pow(num_obs, power))),
+            offsets(sizes.size()),
+            centers(sizes.size() * ndim),
+            observation_id(nobs),
+            new_location(nobs),
+            dist_to_centroid(nobs)
+    {
+        std::vector<int> clusters(num_obs);
+        auto ncenters = sizes.size();
+        // Try to avoid a copy if we're dealing with the same type;
+        // otherwise, we just dump it into 'data', given that we
+        // won't be rewriting it for a while anyway.
+        const INTERNAL_t* host;
+        if constexpr(std::is_same<INPUT_t, INTERNAL_t>::value) {
+            host = vals;
+        } else {
+            std::copy(vals, vals + data.size(), data.data());
+            host = data.data();
+        }
+        auto output = kmeans::Kmeans<INTERNAL_t, int>().run(ndim, nobs, host, ncenters, centers.data(), clusters.data());
+        std::swap(sizes, output.sizes);
+        // In case there were some duplicate points, we just resize this a bit.
+        if (ncenters != sizes.size()) {
+            ncenters = sizes.size();
+            offsets.resize(ncenters);
+            centers.resize(ncenters * ndim);
+        }
+        // Cumulative sum of the cluster sizes gives the start of each cluster.
+        for (size_t i = 1; i < ncenters; ++i) {
+            offsets[i] = offsets[i - 1] + sizes[i - 1];
+        }
+        // Organize points correctly; firstly, sorting by distance from the assigned center.
+        std::vector<std::pair<INTERNAL_t, INDEX_t> > by_distance(nobs);
+        {
+            // 'sofar' tracks the next free slot within each cluster's stretch of 'by_distance'.
+            auto sofar = offsets;
+            for (INDEX_t o = 0; o < nobs; ++o) {
+                const auto& clustid = clusters[o];
+                auto& counter = sofar[clustid];
+                auto& current = by_distance[counter];
+                const INTERNAL_t* obs_ptr = host + static_cast<size_t>(o) * num_dim;
+                const INTERNAL_t* center_ptr = centers.data() + static_cast<size_t>(clustid) * num_dim;
+                current.first = DISTANCE::normalize(DISTANCE::template raw_distance<INTERNAL_t>(obs_ptr, center_ptr, num_dim));
+                current.second = o;
+                ++counter;
+            }
+            for (size_t c = 0; c < ncenters; ++c) {
+                auto begin = by_distance.begin() + offsets[c];
+                std::sort(begin, begin + sizes[c]);
+            }
+        }
+        // Now, copying this over.
+        {
+            auto store = data.data();
+            for (INDEX_t o = 0; o < nobs; ++o, store += num_dim) {
+                const auto& current = by_distance[o];
+                auto source = vals + static_cast<size_t>(ndim) * current.second; // must use 'vals' here, as 'host' might alias 'data'!
+                std::copy(source, source + ndim, store);
+                observation_id[o] = current.second;
+                new_location[current.second] = o;
+                dist_to_centroid[o] = current.first;
+            }
+        }
+    }
+    /**
+     * Find the nearest neighbors of an observation that is already in the index.
+     *
+     * @param index Index of the observation, as ordered in the input to the constructor.
+     * @param k Number of neighbors requested from the queue.
+     *
+     * @return Vector of (original index, normalized distance) pairs, as produced by `report()`.
+     * The reordered position of `index` is passed to the `NeighborQueue`, presumably so that the observation is not reported as its own neighbor.
+     */
+    std::vector<std::pair<INDEX_t, DISTANCE_t> > find_nearest_neighbors(INDEX_t index, int k) const {
+        const auto self = new_location[index];
+        NeighborQueue<INDEX_t, INTERNAL_t> nearest(k, self);
+        search_nn(data.data() + static_cast<size_t>(self) * num_dim, nearest);
+        return report(nearest);
+    }
+    /**
+     * Find the nearest neighbors of an arbitrary query point.
+     *
+     * @param query Pointer to the coordinates of the query; `ndim()` values are read.
+     * @param k Number of neighbors requested from the queue.
+     *
+     * @return Vector of (original index, normalized distance) pairs, as produced by `report()`.
+     */
+    std::vector<std::pair<INDEX_t, DISTANCE_t> > find_nearest_neighbors(const QUERY_t* query, int k) const {
+        NeighborQueue<INDEX_t, INTERNAL_t> nearest(k);
+        search_nn(query, nearest);
+        return report(nearest);
+    }
+    /**
+     * Retrieve the coordinates of an observation in the index.
+     *
+     * @param index Index of the observation, as ordered in the input to the constructor.
+     * @param buffer Pointer to an array with space for `ndim()` values.
+     * Only written to when `QUERY_t` and `INTERNAL_t` differ.
+     *
+     * @return Pointer to the coordinates of the observation.
+     * This points into the internal storage if `QUERY_t` and `INTERNAL_t` are the same type, and is `buffer` otherwise.
+     */
+    const QUERY_t* observation(INDEX_t index, QUERY_t* buffer) const {
+        auto candidate = data.data() + static_cast<size_t>(num_dim) * new_location[index];
+        if constexpr(std::is_same<QUERY_t, INTERNAL_t>::value) {
+            return candidate;
+        } else {
+            std::copy(candidate, candidate + num_dim, buffer);
+            return buffer;
+        }
+    }
+    using Base<INDEX_t, DISTANCE_t, QUERY_t>::observation;
+private:
+    /**
+     * Search all clusters for the neighbors of `target`, adding candidates to `nearest`.
+     * Positions added to the queue refer to the reordered observations, not the original indices.
+     */
+    template<typename INPUT_t>
+    void search_nn(INPUT_t* target, NeighborQueue<INDEX_t, INTERNAL_t>& nearest) const {
+        /* Computing distances to all centers and sorting them. The aim is to
+         * go through the nearest centers first, to get the shortest
+         * 'threshold' possible through the rest of the search.
+         */
+        std::vector<std::pair<INTERNAL_t, INDEX_t> > center_order(sizes.size());
+        auto clust_ptr = centers.data();
+        for (size_t c = 0; c < sizes.size(); ++c, clust_ptr += num_dim) {
+            center_order[c].first = DISTANCE::template raw_distance<INTERNAL_t>(target, clust_ptr, num_dim);
+            center_order[c].second = c;
+        }
+        std::sort(center_order.begin(), center_order.end());
+        // A negative value indicates that no threshold is available yet, i.e., the queue has not been filled.
+        INTERNAL_t threshold_raw = -1;
+        // Computing the distance to each center, and deciding whether to proceed for each cluster.
+        for (const auto& curcent : center_order) {
+            const INDEX_t center = curcent.second;
+            const INTERNAL_t dist2center = DISTANCE::normalize(curcent.first);
+            const auto cur_nobs = sizes[center];
+            // An empty cluster has nothing to search, and looking up its
+            // last element below would read outside of 'dist_to_centroid'.
+            if (cur_nobs == 0) {
+                continue;
+            }
+            const DISTANCE_t* dIt = dist_to_centroid.data() + offsets[center];
+            // Distances within a cluster are sorted, so the last one is the largest.
+            const DISTANCE_t maxdist = *(dIt + cur_nobs - 1);
+            INDEX_t firstcell=0;
+#if USE_UPPER
+            INTERNAL_t upper_bd = std::numeric_limits<INTERNAL_t>::max();
+#endif
+            if (threshold_raw >= 0) {
+                const INTERNAL_t threshold = DISTANCE::normalize(threshold_raw);
+                /* The conditional expression below exploits the triangle inequality; it is equivalent to asking whether:
+                 *     threshold + maxdist < dist2center
+                 * All points (if any) within this cluster with distances above 'lower_bd' are potentially countable.
+                 */
+                const DISTANCE_t lower_bd = dist2center - threshold;
+                if (maxdist < lower_bd) {
+                    continue;
+                }
+                firstcell=std::lower_bound(dIt, dIt + cur_nobs, lower_bd) - dIt;
+#if USE_UPPER
+                /* This exploits the reverse triangle inequality, to ignore points where:
+                 *     threshold + dist2center < point-to-center distance
+                 */
+                upper_bd = threshold + dist2center;
+#endif
+            }
+            const auto cur_start = offsets[center];
+            const INTERNAL_t * other_cell = data.data() + static_cast<size_t>(num_dim) * (cur_start + firstcell);
+            for (auto celldex = firstcell; celldex < cur_nobs; ++celldex, other_cell += num_dim) {
+#if USE_UPPER
+                if (*(dIt + celldex) > upper_bd) {
+                    break;
+                }
+#endif
+                const auto dist2cell_raw = DISTANCE::template raw_distance<INTERNAL_t>(target, other_cell, num_dim);
+                nearest.add(cur_start + celldex, dist2cell_raw);
+                if (nearest.is_full()) {
+                    threshold_raw = nearest.limit(); // Shrinking the threshold, if an earlier NN has been found.
+#if USE_UPPER
+                    upper_bd = DISTANCE::normalize(threshold_raw) + dist2center;
+#endif
+                }
+            }
+        }
+    }
+    /**
+     * Extract the results from the queue, converting reordered positions
+     * back to the original indices and normalizing the raw distances.
+     */
+    template<class QUEUE>
+    auto report(QUEUE& nearest) const {
+        auto output = nearest.template report<DISTANCE_t>();
+        for (auto& s : output) {
+            s.first = observation_id[s.first];
+            s.second = DISTANCE::normalize(s.second);
+        }
+        return output;
+    }
+#ifdef DEBUG
+    /** Print `msg` followed by the space-separated contents of `input` to standard output. */
+    template<class V>
+    void print_vector(const V& input, const char* msg) const {
+        std::cout << msg << ": ";
+        for (auto v : input) {
+            std::cout << v << " ";
+        }
+        std::cout << std::endl;
+    }
+#endif
+};
+/**
+ * Perform a KMKNN search with Euclidean distances.
+ *
+ * This is an alias for `Kmknn` with `distances::Euclidean` as the distance class;
+ * all other template parameters are forwarded unchanged.
+ *
+ * @tparam INDEX_t Integer type for the indices.
+ * @tparam DISTANCE_t Floating point type for the distances.
+ * @tparam QUERY_t Floating point type for the query data.
+ * @tparam INTERNAL_t Floating point type for the data.
+ */
+template<typename INDEX_t = int, typename DISTANCE_t = double, typename QUERY_t = DISTANCE_t, typename INTERNAL_t = DISTANCE_t>
+using KmknnEuclidean = Kmknn<distances::Euclidean, INDEX_t, DISTANCE_t, QUERY_t, INTERNAL_t>;
+/**
+ * Perform a KMKNN search with Manhattan distances.
+ * Note that k-means clustering may not provide a particularly good indexing structure for Manhattan distances, so your mileage may vary.
+ *
+ * This is an alias for `Kmknn` with `distances::Manhattan` as the distance class;
+ * all other template parameters are forwarded unchanged.
+ *
+ * @tparam INDEX_t Integer type for the indices.
+ * @tparam DISTANCE_t Floating point type for the distances.
+ * @tparam QUERY_t Floating point type for the query data.
+ * @tparam INTERNAL_t Floating point type for the data.
+ */
+template<typename INDEX_t = int, typename DISTANCE_t = double, typename QUERY_t = DISTANCE_t, typename INTERNAL_t = DISTANCE_t>
+using KmknnManhattan = Kmknn<distances::Manhattan, INDEX_t, DISTANCE_t, QUERY_t, INTERNAL_t>;
+};
+#endif

data/vendor/knncolle/VpTree/VpTree.hpp ADDED Viewed

@@ -0,0 +1,256 @@
+#ifndef KNNCOLLE_VPTREE_HPP
+#define KNNCOLLE_VPTREE_HPP
+#include "../utils/distances.hpp"
+#include "../utils/NeighborQueue.hpp"
+#include "../utils/Base.hpp"
+#include <algorithm>
+#include <limits>
+#include <random>
+#include <tuple>
+#include <type_traits>
+#include <utility>
+#include <vector>
+/**
+ * @file VpTree.hpp
+ *
+ * @brief Implements a vantage point (VP) tree to search for nearest neighbors.
+ */
+namespace knncolle {
+/**
+ * @brief Perform a nearest neighbor search based on a vantage point (VP) tree.
+ *
+ * In a vantage point tree (Yianilos, 1993), each node contains a subset of points that is split into two further partitions.
+ * The split is determined by picking an arbitrary point inside that subset as the node center,
+ * computing the distance to all other points from the center, and using the median distance as the "radius" of a hypersphere.
+ * The left child of this node contains all points within that hypersphere while the right child contains the remaining points.
+ * This procedure is applied recursively until all points resolve to individual nodes, thus yielding a VP tree.
+ * Upon searching, the algorithm traverses the tree and exploits the triangle inequality between query points and node centers to narrow the search space.
+ *
+ * The major advantage of VP trees over more conventional KD-trees or ball trees is that the former do not need to construct intermediate nodes, instead using the data points themselves at the nodes.
+ * This reduces the memory usage of the tree and total number of distance calculations for any search.
+ * It can also be very useful when the concept of an intermediate is not well-defined (e.g., for non-numeric data), though this is not particularly relevant for **knncolle**.
+ *
+ * @tparam DISTANCE Class to compute the distance between vectors, see `distances::Euclidean` for an example.
+ * @tparam INDEX_t Integer type for the indices.
+ * @tparam DISTANCE_t Floating point type for the distances.
+ * @tparam QUERY_t Floating point type for the query data.
+ * @tparam INTERNAL_t Floating point type for the internal data store.
+ *
+ * @see
+ * Yianilos PN (1993).
+ * Data structures and algorithms for nearest neighbor search in general metric spaces.
+ * _Proceedings of the Fourth Annual ACM-SIAM Symposium on Discrete Algorithms_, 311-321.
+ *
+ * @see
+ * Hanov S (2011).
+ * VP trees: A data structure for finding stuff fast.
+ * http://stevehanov.ca/blog/index.php?id=130
+ */
+template<class DISTANCE, typename INDEX_t = int, typename DISTANCE_t = double, typename QUERY_t = DISTANCE_t, typename INTERNAL_t = DISTANCE_t>
+class VpTree : public Base<INDEX_t, DISTANCE_t, QUERY_t> {
+    /* Adapted from http://stevehanov.ca/blog/index.php?id=130 */
+private:
+    INDEX_t num_dim;
+    INDEX_t num_obs;
+public:
+    /** @return Number of observations supplied to the constructor. */
+    INDEX_t nobs() const override { return num_obs; }
+    /** @return Number of dimensions supplied to the constructor. */
+    INDEX_t ndim() const override { return num_dim; }
+private:
+    typedef int NodeIndex_t;
+    static const NodeIndex_t LEAF_MARKER=-1;
+    // Single node of a VP tree (has a point and radius; left children are closer to point than the radius)
+    struct Node {
+        INTERNAL_t threshold;  // radius, stored as a normalized distance; stays at 0 for nodes without children
+        INDEX_t index; // original index of current vantage point
+        NodeIndex_t left;  // node index of the next vantage point for all children closer than 'threshold' from the current vantage point
+        NodeIndex_t right; // node index of the next vantage point for all children further than 'threshold' from the current vantage point
+        Node(INDEX_t i=0) : threshold(0), index(i), left(LEAF_MARKER), right(LEAF_MARKER) {}
+    };
+    std::vector<Node> nodes;
+    typedef std::tuple<INDEX_t, const INTERNAL_t*, INTERNAL_t> DataPoint; // internal distances computed using "INTERNAL_t" type, even if output is returned with DISTANCE_t.
+    /**
+     * Recursively build the subtree for the items in `[lower, upper)`.
+     * Nodes are appended to `nodes` in pre-order (vantage point, then left subtree, then right subtree).
+     *
+     * @param lower First position in `items` belonging to this subtree.
+     * @param upper One-past-the-last position in `items` belonging to this subtree.
+     * @param items Working array of data points; reordered in place.
+     * @param rng Random number generator used to choose the vantage point.
+     *
+     * @return Position of the subtree's root in `nodes`, or `LEAF_MARKER` if the interval is empty.
+     */
+    template<class SAMPLER>
+    NodeIndex_t buildFromPoints(NodeIndex_t lower, NodeIndex_t upper, std::vector<DataPoint>& items, SAMPLER& rng) {
+        if (upper == lower) {     // indicates that we're done here!
+            return LEAF_MARKER;
+        }
+        // The new node is always addressed as nodes[pos] rather than through a
+        // held reference, because the recursive calls below grow 'nodes' and a
+        // reference would dangle if the vector ever had to reallocate.
+        const NodeIndex_t pos = static_cast<NodeIndex_t>(nodes.size());
+        nodes.resize(pos + 1);
+        const NodeIndex_t gap = upper - lower;
+        if (gap > 1) {      // if we did not arrive at leaf yet
+            /* Choose an arbitrary point and move it to the start of the [lower, upper)
+             * interval in 'items'; this is our new vantage point.
+             *
+             * Yes, I know that the modulo method does not provide strictly
+             * uniform values but statistical correctness doesn't really matter
+             * here... but reproducibility across platforms does matter, and
+             * std::uniform_int_distribution is implementation-dependent!
+             */
+            const NodeIndex_t chosen = static_cast<NodeIndex_t>(rng() % gap + lower);
+            std::swap(items[lower], items[chosen]);
+            const auto& vantage = items[lower];
+            // Compute distances to the new vantage point.
+            const INTERNAL_t* ref = std::get<1>(vantage);
+            for (NodeIndex_t j = lower + 1; j < upper; ++j) {
+                const INTERNAL_t* loc = std::get<1>(items[j]);
+                std::get<2>(items[j]) = DISTANCE::template raw_distance<INTERNAL_t>(ref, loc, num_dim);
+            }
+            // Partition around the median distance from the vantage point.
+            // Only [lower + 1, upper) is touched, so 'vantage' stays valid.
+            const NodeIndex_t median = lower + gap/2;
+            std::nth_element(items.begin() + lower + 1, items.begin() + median, items.begin() + upper,
+                [](const DataPoint& left, const DataPoint& right) -> bool {
+                    return std::get<2>(left) < std::get<2>(right);
+                }
+            );
+            // Threshold of the new node will be the distance to the median
+            nodes[pos].threshold = DISTANCE::normalize(std::get<2>(items[median]));
+            nodes[pos].index = std::get<0>(vantage);
+            // Recursively build tree; left is completed before right so that the
+            // node order (and the sequence of rng draws) is deterministic.
+            const NodeIndex_t left_child = buildFromPoints(lower + 1, median, items, rng);
+            nodes[pos].left = left_child;
+            const NodeIndex_t right_child = buildFromPoints(median, upper, items, rng);
+            nodes[pos].right = right_child;
+        } else {
+            nodes[pos].index = std::get<0>(items[lower]);
+        }
+        return pos;
+    }
+private:
+    std::vector<INDEX_t> new_location; // new_location[original index] = position of that observation in 'nodes' and 'store'
+    std::vector<INTERNAL_t> store;     // coordinates, one observation after another, in the same order as 'nodes'
+public:
+    /**
+     * @param ndim Number of dimensions.
+     * @param nobs Number of observations.
+     * @param vals Pointer to an array of length `ndim * nobs`, corresponding to a dimension-by-observation matrix in column-major format,
+     * i.e., contiguous elements belong to the same observation.
+     *
+     * @tparam INPUT_t Floating-point type of the input data.
+     * If this differs from `INTERNAL_t`, the input is converted into a temporary `INTERNAL_t` array for the duration of the build.
+     */
+    template<typename INPUT_t>
+    VpTree(INDEX_t ndim, INDEX_t nobs, const INPUT_t* vals) : num_dim(ndim), num_obs(nobs), new_location(nobs), store(static_cast<size_t>(ndim) * static_cast<size_t>(nobs)) {
+        const size_t dim_len = static_cast<size_t>(num_dim);
+        // DataPoint holds 'const INTERNAL_t*', so input of any other type has
+        // to be converted before pointers into it can be stored.
+        std::vector<INTERNAL_t> converted;
+        const INTERNAL_t* source = nullptr;
+        if constexpr(std::is_same<INPUT_t, INTERNAL_t>::value) {
+            source = vals;
+        } else {
+            converted.assign(vals, vals + store.size());
+            source = converted.data();
+        }
+        std::vector<DataPoint> items;
+        items.reserve(num_obs);
+        for (INDEX_t i = 0; i < num_obs; ++i) {
+            items.push_back(DataPoint(i, source + static_cast<size_t>(i) * dim_len, 0));
+        }
+        nodes.reserve(num_obs);
+        std::mt19937_64 rand(1234567890); // seed doesn't really matter, we don't need statistical correctness here.
+        buildFromPoints(0, static_cast<NodeIndex_t>(num_obs), items, rand);
+        // Actually populating the store based on the traversal order of the nodes.
+        // This should be more cache efficient than an arbitrary input order.
+        auto sIt = store.begin();
+        for (size_t i = 0; i < nodes.size(); ++i, sIt += num_dim) {
+            const auto& curnode = nodes[i];
+            new_location[curnode.index] = static_cast<INDEX_t>(i);
+            auto start = source + dim_len * static_cast<size_t>(curnode.index);
+            std::copy(start, start + num_dim, sIt);
+        }
+    }
+    /**
+     * Find the nearest neighbors of the `index`-th observation in the dataset.
+     *
+     * @param index Index of the observation of interest, as supplied to the constructor.
+     * @param k Number of neighbors to identify.
+     *
+     * @return The (index, distance) pairs reported by the neighbor queue.
+     * Nothing is searched if the tree contains no observations.
+     */
+    std::vector<std::pair<INDEX_t, DISTANCE_t> > find_nearest_neighbors(INDEX_t index, int k) const override {
+        NeighborQueue<INDEX_t, INTERNAL_t> nearest(k, index);
+        if (!nodes.empty()) { // nodes[0] does not exist for an empty dataset
+            INTERNAL_t tau = std::numeric_limits<INTERNAL_t>::max();
+            search_nn(0, store.data() + static_cast<size_t>(new_location[index]) * static_cast<size_t>(num_dim), tau, nearest);
+        }
+        return nearest.template report<DISTANCE_t>();
+    }
+    /**
+     * Find the nearest neighbors of a new observation.
+     *
+     * @param query Pointer to an array of length `ndim()` containing the coordinates of the query point.
+     * @param k Number of neighbors to identify.
+     *
+     * @return The (index, distance) pairs reported by the neighbor queue.
+     * Nothing is searched if the tree contains no observations.
+     */
+    std::vector<std::pair<INDEX_t, DISTANCE_t> > find_nearest_neighbors(const QUERY_t* query, int k) const override {
+        NeighborQueue<INDEX_t, INTERNAL_t> nearest(k);
+        if (!nodes.empty()) { // nodes[0] does not exist for an empty dataset
+            INTERNAL_t tau = std::numeric_limits<INTERNAL_t>::max();
+            search_nn(0, query, tau, nearest);
+        }
+        return nearest.template report<DISTANCE_t>();
+    }
+    /**
+     * Get the coordinates of an observation.
+     *
+     * @param index Index of the observation, as supplied to the constructor.
+     * @param buffer Buffer of length `ndim()`; only filled when `QUERY_t` differs from `INTERNAL_t`.
+     *
+     * @return Pointer into the internal store if `QUERY_t` and `INTERNAL_t` are the same type, otherwise `buffer`.
+     */
+    const QUERY_t* observation(INDEX_t index, QUERY_t* buffer) const override {
+        auto candidate = store.data() + static_cast<size_t>(num_dim) * static_cast<size_t>(new_location[index]);
+        if constexpr(std::is_same<QUERY_t, INTERNAL_t>::value) {
+            return candidate;
+        } else {
+            std::copy(candidate, candidate + num_dim, buffer);
+            return buffer;
+        }
+    }
+    using Base<INDEX_t, DISTANCE_t, QUERY_t>::observation;
+private:
+    /**
+     * Recursively search the subtree rooted at `curnode_index`.
+     *
+     * @param curnode_index Position of the subtree root in `nodes`, or `LEAF_MARKER` for an empty subtree.
+     * @param target Coordinates of the point being searched for.
+     * @param tau Current search radius (normalized distance); tightened in place once `nearest` is full.
+     * @param nearest Queue collecting the candidates found so far.
+     */
+    template<typename INPUT_t>
+    void search_nn(NodeIndex_t curnode_index, const INPUT_t* target, INTERNAL_t& tau, NeighborQueue<INDEX_t, INTERNAL_t>& nearest) const {
+        if (curnode_index == LEAF_MARKER) { // indicates that we're done here
+            return;
+        }
+        // Compute distance between target and current node;
+        // the node's coordinates sit at the same position in 'store' as the node does in 'nodes'.
+        const auto& curnode=nodes[curnode_index];
+        const INTERNAL_t* node_coords = store.data() + static_cast<size_t>(curnode_index) * static_cast<size_t>(num_dim);
+        INTERNAL_t dist = DISTANCE::normalize(DISTANCE::template raw_distance<INTERNAL_t>(node_coords, target, num_dim));
+        // If current node within radius tau
+        if (dist < tau) {
+            nearest.add(curnode.index, dist);
+            if (nearest.is_full()) {
+                tau = nearest.limit(); // update value of tau (farthest point in result list)
+            }
+        }
+        // Return if we arrived at a leaf
+        if (curnode.left == LEAF_MARKER && curnode.right == LEAF_MARKER) {
+            return;
+        }
+        // If the target lies within the radius of ball
+        if (dist < curnode.threshold) {
+            if (dist - tau <= curnode.threshold) {         // if there can still be neighbors inside the ball, recursively search left child first
+                search_nn(curnode.left, target, tau, nearest);
+            }
+            if (dist + tau >= curnode.threshold) {         // if there can still be neighbors outside the ball, recursively search right child
+                search_nn(curnode.right, target, tau, nearest);
+            }
+        // If the target lies outside the radius of the ball
+        } else {
+            if (dist + tau >= curnode.threshold) {         // if there can still be neighbors outside the ball, recursively search right child first
+                search_nn(curnode.right, target, tau, nearest);
+            }
+            if (dist - tau <= curnode.threshold) {         // if there can still be neighbors inside the ball, recursively search left child
+                search_nn(curnode.left, target, tau, nearest);
+            }
+        }
+    }
+};
+/**
+ * Perform a VP tree search with Euclidean distances.
+ *
+ * This is an alias for `VpTree` with `distances::Euclidean` as the distance class;
+ * the remaining template arguments are passed through to `VpTree` in the same order.
+ * Note that `INTERNAL_t` defaults to `double` in this alias, whereas `VpTree` itself defaults it to `DISTANCE_t`.
+ */
+template<typename INDEX_t = int, typename DISTANCE_t = double, typename QUERY_t = DISTANCE_t, typename INTERNAL_t = double>
+using VpTreeEuclidean = VpTree<distances::Euclidean, INDEX_t, DISTANCE_t, QUERY_t, INTERNAL_t>;
+/**
+ * Perform a VP tree search with Manhattan distances.
+ *
+ * This is an alias for `VpTree` with `distances::Manhattan` as the distance class;
+ * the remaining template arguments are passed through to `VpTree` in the same order.
+ * Note that `INTERNAL_t` defaults to `double` in this alias, whereas `VpTree` itself defaults it to `DISTANCE_t`.
+ */
+template<typename INDEX_t = int, typename DISTANCE_t = double, typename QUERY_t = DISTANCE_t, typename INTERNAL_t = double>
+using VpTreeManhattan = VpTree<distances::Manhattan, INDEX_t, DISTANCE_t, QUERY_t, INTERNAL_t>;
+};
+#endif

data/vendor/knncolle/knncolle.hpp ADDED Viewed

@@ -0,0 +1,34 @@
+#ifndef KNNCOLLE_HPP
+#define KNNCOLLE_HPP
+#include "BruteForce/BruteForce.hpp"
+#include "VpTree/VpTree.hpp"
+#ifndef KNNCOLLE_NO_KMKNN
+#include "Kmknn/Kmknn.hpp"
+#endif
+#ifndef KNNCOLLE_NO_ANNOY
+#include "Annoy/Annoy.hpp"
+#endif
+#ifndef KNNCOLLE_NO_HNSW
+#include "Hnsw/Hnsw.hpp"
+#endif
+#include "utils/find_nearest_neighbors.hpp"
+/**
+ * @file knncolle.hpp
+ *
+ * @brief Umbrella header to include all algorithms.
+ *
+ * Developers can avoid the inclusion of unnecessary dependencies by setting:
+ *
+ * - `KNNCOLLE_NO_KMKNN`, to avoid including the `Kmknn.hpp` header (which requires the **kmeans** library).
+ * - `KNNCOLLE_NO_ANNOY`, to avoid including the `Annoy.hpp` header (which requires the **Annoy** library).
+ * - `KNNCOLLE_NO_HNSW`, to avoid including the `Hnsw.hpp` header (which requires the **Hnsw** library).
+ */
+#endif

data/vendor/knncolle/utils/Base.hpp ADDED Viewed

@@ -0,0 +1,100 @@
+#ifndef KNNCOLLE_BASE_HPP
+#define KNNCOLLE_BASE_HPP
+#include <vector>
+/**
+ * @file Base.hpp
+ *
+ * @brief Defines the virtual base class for all **knncolle** methods.
+ */
+namespace knncolle {
+/**
+ * @brief Virtual base class defining the **knncolle** interface.
+ *
+ * Defines the minimum set of methods, to be implemented by all concrete subclasses.
+ * All methods except the single-argument `observation()` overload are pure virtual.
+ *
+ * @tparam INDEX_t Integer type for the indices.
+ * @tparam DISTANCE_t Floating point type for the distances.
+ * @tparam QUERY_t Floating point type for the query data.
+ */
+template<typename INDEX_t = int, typename DISTANCE_t = double, typename QUERY_t = DISTANCE_t>
+class Base {
+public:
+    /**
+     * Get the number of observations in the dataset to be searched.
+     *
+     * @return Number of observations.
+     */
+    virtual INDEX_t nobs() const = 0;
+    /**
+     * Get the number of dimensions.
+     *
+     * @return Number of dimensions.
+     */
+    virtual INDEX_t ndim() const = 0;
+    virtual ~Base() {}
+public:
+    /**
+     * Get the vector of coordinates for a given observation in the dataset.
+     * Type conversions may be performed if `QUERY_t` differs from the type of the internal data store.
+     *
+     * `buffer` may not be filled if a pointer to the internal data store can be returned directly.
+     * This can be assumed to be the case if the return address is not the same as `buffer`.
+     *
+     * @param index Index of the observation.
+     * This should be non-negative and less than the number of observations returned by `nobs()`.
+     * @param buffer Buffer to store the coordinates.
+     * This should have space for at least `ndim()` values.
+     *
+     * @return A pointer to an array containing the coordinate vector.
+     *
+     */
+    virtual const QUERY_t* observation(INDEX_t index, QUERY_t* buffer) const = 0;
+    /**
+     * Get the vector of coordinates for a given observation in the dataset.
+     * Type conversions may be performed if `QUERY_t` differs from the type of the internal data store.
+     *
+     * The default implementation allocates a vector of length `ndim()` and passes its storage as the buffer to the two-argument overload.
+     * If that overload returns a different address, the coordinates are copied from the returned pointer into the vector.
+     *
+     * @param index Index of the observation.
+     * This should be non-negative and less than the number of observations returned by `nobs()`.
+     *
+     * @return A vector of coordinates, of length `ndim()`.
+     *
+     */
+    virtual std::vector<QUERY_t> observation(INDEX_t index) const {
+        std::vector<QUERY_t> output(ndim());
+        auto ptr = observation(index, output.data());
+        if (ptr != output.data()) {
+            std::copy(ptr, ptr + output.size(), output.data());
+        }
+        return output;
+    }
+public:
+    /**
+     * Find the nearest neighbors of the `index`-th observation in the dataset.
+     *
+     * @param index The index of the observation of interest.
+     * This should be non-negative and less than the number of observations returned by `nobs()`.
+     * @param k The number of neighbors to identify.
+     *
+     * @return A vector of (index, distance) pairs containing the identities of the nearest neighbors in order of increasing distance.
+     * Length is at most `k` but may be shorter if the total number of observations is less than `k + 1`.
+     */
+    virtual std::vector<std::pair<INDEX_t, DISTANCE_t> > find_nearest_neighbors(INDEX_t index, int k) const = 0;
+    /**
+     * Find the nearest neighbors of a new observation.
+     *
+     * @param query Pointer to an array of length equal to `ndim()`, containing the coordinates of the query point.
+     * @param k The number of neighbors to identify.
+     *
+     * @return A vector of (index, distance) pairs containing the identities of the nearest neighbors in order of increasing distance.
+     * Length is at most `k` but may be shorter if the total number of observations is less than `k`.
+     */
+    virtual std::vector<std::pair<INDEX_t, DISTANCE_t> > find_nearest_neighbors(const QUERY_t* query, int k) const = 0;
+};
+}
+#endif