RubyGems - faiss - Versions diffs - 0.3.2 → 0.3.4 - Mend

faiss 0.3.2 → 0.3.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (295) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +8 -0
data/LICENSE.txt +1 -1
data/ext/faiss/extconf.rb +1 -1
data/ext/faiss/index.cpp +10 -14
data/ext/faiss/numo.hpp +957 -833
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +2 -2
data/vendor/faiss/faiss/AutoTune.h +2 -2
data/vendor/faiss/faiss/Clustering.cpp +2 -2
data/vendor/faiss/faiss/Clustering.h +2 -2
data/vendor/faiss/faiss/IVFlib.cpp +2 -2
data/vendor/faiss/faiss/IVFlib.h +2 -2
data/vendor/faiss/faiss/Index.cpp +6 -2
data/vendor/faiss/faiss/Index.h +10 -3
data/vendor/faiss/faiss/Index2Layer.cpp +2 -2
data/vendor/faiss/faiss/Index2Layer.h +2 -2
data/vendor/faiss/faiss/IndexAdditiveQuantizer.cpp +7 -7
data/vendor/faiss/faiss/IndexAdditiveQuantizer.h +2 -2
data/vendor/faiss/faiss/IndexAdditiveQuantizerFastScan.cpp +14 -16
data/vendor/faiss/faiss/IndexAdditiveQuantizerFastScan.h +2 -2
data/vendor/faiss/faiss/IndexBinary.cpp +13 -2
data/vendor/faiss/faiss/IndexBinary.h +8 -2
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +2 -3
data/vendor/faiss/faiss/IndexBinaryFlat.h +2 -2
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +2 -2
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +2 -2
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +2 -7
data/vendor/faiss/faiss/IndexBinaryHNSW.h +2 -2
data/vendor/faiss/faiss/IndexBinaryHash.cpp +2 -3
data/vendor/faiss/faiss/IndexBinaryHash.h +2 -2
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +2 -2
data/vendor/faiss/faiss/IndexBinaryIVF.h +2 -2
data/vendor/faiss/faiss/IndexFastScan.cpp +10 -14
data/vendor/faiss/faiss/IndexFastScan.h +11 -2
data/vendor/faiss/faiss/IndexFlat.cpp +2 -3
data/vendor/faiss/faiss/IndexFlat.h +2 -2
data/vendor/faiss/faiss/IndexFlatCodes.cpp +11 -2
data/vendor/faiss/faiss/IndexFlatCodes.h +5 -2
data/vendor/faiss/faiss/IndexHNSW.cpp +13 -6
data/vendor/faiss/faiss/IndexHNSW.h +2 -2
data/vendor/faiss/faiss/IndexIDMap.cpp +19 -3
data/vendor/faiss/faiss/IndexIDMap.h +5 -2
data/vendor/faiss/faiss/IndexIVF.cpp +2 -3
data/vendor/faiss/faiss/IndexIVF.h +5 -4
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +6 -7
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.h +2 -2
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizerFastScan.cpp +3 -14
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizerFastScan.h +2 -4
data/vendor/faiss/faiss/IndexIVFFastScan.cpp +71 -34
data/vendor/faiss/faiss/IndexIVFFastScan.h +19 -2
data/vendor/faiss/faiss/IndexIVFFlat.cpp +2 -2
data/vendor/faiss/faiss/IndexIVFFlat.h +2 -2
data/vendor/faiss/faiss/IndexIVFIndependentQuantizer.cpp +2 -2
data/vendor/faiss/faiss/IndexIVFIndependentQuantizer.h +2 -2
data/vendor/faiss/faiss/IndexIVFPQ.cpp +2 -3
data/vendor/faiss/faiss/IndexIVFPQ.h +2 -2
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +7 -33
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +2 -4
data/vendor/faiss/faiss/IndexIVFPQR.cpp +2 -2
data/vendor/faiss/faiss/IndexIVFPQR.h +2 -2
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +2 -3
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +2 -2
data/vendor/faiss/faiss/IndexLSH.cpp +2 -3
data/vendor/faiss/faiss/IndexLSH.h +2 -2
data/vendor/faiss/faiss/IndexLattice.cpp +2 -2
data/vendor/faiss/faiss/IndexLattice.h +2 -2
data/vendor/faiss/faiss/IndexNNDescent.cpp +2 -2
data/vendor/faiss/faiss/IndexNNDescent.h +2 -2
data/vendor/faiss/faiss/IndexNSG.cpp +2 -5
data/vendor/faiss/faiss/IndexNSG.h +2 -2
data/vendor/faiss/faiss/IndexNeuralNetCodec.cpp +2 -2
data/vendor/faiss/faiss/IndexNeuralNetCodec.h +2 -2
data/vendor/faiss/faiss/IndexPQ.cpp +26 -26
data/vendor/faiss/faiss/IndexPQ.h +2 -2
data/vendor/faiss/faiss/IndexPQFastScan.cpp +2 -5
data/vendor/faiss/faiss/IndexPQFastScan.h +2 -11
data/vendor/faiss/faiss/IndexPreTransform.cpp +2 -2
data/vendor/faiss/faiss/IndexPreTransform.h +2 -2
data/vendor/faiss/faiss/IndexRefine.cpp +41 -4
data/vendor/faiss/faiss/IndexRefine.h +9 -2
data/vendor/faiss/faiss/IndexReplicas.cpp +2 -2
data/vendor/faiss/faiss/IndexReplicas.h +2 -2
data/vendor/faiss/faiss/IndexRowwiseMinMax.cpp +2 -2
data/vendor/faiss/faiss/IndexRowwiseMinMax.h +2 -2
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +2 -3
data/vendor/faiss/faiss/IndexScalarQuantizer.h +2 -2
data/vendor/faiss/faiss/IndexShards.cpp +2 -2
data/vendor/faiss/faiss/IndexShards.h +2 -2
data/vendor/faiss/faiss/IndexShardsIVF.cpp +2 -2
data/vendor/faiss/faiss/IndexShardsIVF.h +2 -2
data/vendor/faiss/faiss/MatrixStats.cpp +2 -2
data/vendor/faiss/faiss/MatrixStats.h +2 -2
data/vendor/faiss/faiss/MetaIndexes.cpp +2 -3
data/vendor/faiss/faiss/MetaIndexes.h +2 -2
data/vendor/faiss/faiss/MetricType.h +2 -2
data/vendor/faiss/faiss/VectorTransform.cpp +2 -2
data/vendor/faiss/faiss/VectorTransform.h +2 -2
data/vendor/faiss/faiss/clone_index.cpp +2 -2
data/vendor/faiss/faiss/clone_index.h +2 -2
data/vendor/faiss/faiss/cppcontrib/SaDecodeKernels.h +2 -2
data/vendor/faiss/faiss/cppcontrib/detail/CoarseBitType.h +2 -2
data/vendor/faiss/faiss/cppcontrib/detail/UintReader.h +2 -2
data/vendor/faiss/faiss/cppcontrib/factory_tools.cpp +44 -4
data/vendor/faiss/faiss/cppcontrib/factory_tools.h +7 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/Level2-avx2-inl.h +2 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/Level2-inl.h +2 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/Level2-neon-inl.h +2 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/MinMax-inl.h +2 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/MinMaxFP16-inl.h +2 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/PQ-avx2-inl.h +2 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/PQ-inl.h +2 -2
data/vendor/faiss/faiss/cppcontrib/sa_decode/PQ-neon-inl.h +2 -2
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +2 -5
data/vendor/faiss/faiss/gpu/GpuAutoTune.h +2 -2
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +13 -13
data/vendor/faiss/faiss/gpu/GpuCloner.h +2 -2
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +6 -6
data/vendor/faiss/faiss/gpu/GpuDistance.h +11 -7
data/vendor/faiss/faiss/gpu/GpuFaissAssert.h +2 -2
data/vendor/faiss/faiss/gpu/GpuIcmEncoder.h +2 -2
data/vendor/faiss/faiss/gpu/GpuIndex.h +8 -7
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +2 -2
data/vendor/faiss/faiss/gpu/GpuIndexCagra.h +6 -3
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +2 -2
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +2 -2
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +2 -2
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +3 -3
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +2 -2
data/vendor/faiss/faiss/gpu/GpuIndicesOptions.h +2 -2
data/vendor/faiss/faiss/gpu/GpuResources.cpp +7 -2
data/vendor/faiss/faiss/gpu/GpuResources.h +11 -4
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +51 -21
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +15 -5
data/vendor/faiss/faiss/gpu/impl/IndexUtils.h +2 -2
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.cpp +2 -2
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.h +2 -2
data/vendor/faiss/faiss/gpu/impl/RemapIndices.cpp +2 -2
data/vendor/faiss/faiss/gpu/impl/RemapIndices.h +2 -2
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +2 -2
data/vendor/faiss/faiss/gpu/perf/IndexWrapper.h +2 -2
data/vendor/faiss/faiss/gpu/perf/PerfClustering.cpp +2 -2
data/vendor/faiss/faiss/gpu/perf/PerfIVFPQAdd.cpp +2 -3
data/vendor/faiss/faiss/gpu/perf/WriteIndex.cpp +2 -2
data/vendor/faiss/faiss/gpu/test/TestCodePacking.cpp +2 -2
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +2 -2
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +54 -54
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +80 -78
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFPQ.cpp +51 -51
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFScalarQuantizer.cpp +2 -2
data/vendor/faiss/faiss/gpu/test/TestGpuMemoryException.cpp +3 -3
data/vendor/faiss/faiss/gpu/test/TestGpuResidualQuantizer.cpp +70 -0
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +74 -4
data/vendor/faiss/faiss/gpu/test/TestUtils.h +2 -2
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +2 -2
data/vendor/faiss/faiss/gpu/utils/{RaftUtils.h → CuvsUtils.h} +12 -11
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +2 -2
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.cpp +2 -2
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.h +2 -2
data/vendor/faiss/faiss/gpu/utils/StaticUtils.h +2 -2
data/vendor/faiss/faiss/gpu/utils/Timer.cpp +2 -2
data/vendor/faiss/faiss/gpu/utils/Timer.h +2 -2
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +79 -11
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +17 -5
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +2 -2
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +2 -2
data/vendor/faiss/faiss/impl/CodePacker.cpp +2 -2
data/vendor/faiss/faiss/impl/CodePacker.h +2 -2
data/vendor/faiss/faiss/impl/DistanceComputer.h +2 -2
data/vendor/faiss/faiss/impl/FaissAssert.h +2 -2
data/vendor/faiss/faiss/impl/FaissException.cpp +2 -2
data/vendor/faiss/faiss/impl/FaissException.h +2 -3
data/vendor/faiss/faiss/impl/HNSW.cpp +24 -19
data/vendor/faiss/faiss/impl/HNSW.h +12 -2
data/vendor/faiss/faiss/impl/IDSelector.cpp +2 -2
data/vendor/faiss/faiss/impl/IDSelector.h +2 -2
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +2 -2
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +2 -2
data/vendor/faiss/faiss/impl/LookupTableScaler.h +2 -2
data/vendor/faiss/faiss/impl/NNDescent.cpp +2 -2
data/vendor/faiss/faiss/impl/NNDescent.h +2 -2
data/vendor/faiss/faiss/impl/NSG.cpp +27 -21
data/vendor/faiss/faiss/impl/NSG.h +20 -8
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +2 -2
data/vendor/faiss/faiss/impl/PolysemousTraining.h +2 -2
data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.cpp +2 -4
data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.h +2 -2
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +2 -2
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +2 -2
data/vendor/faiss/faiss/impl/ProductQuantizer.h +2 -2
data/vendor/faiss/faiss/impl/Quantizer.h +2 -2
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +2 -36
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +3 -13
data/vendor/faiss/faiss/impl/ResultHandler.h +2 -2
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +2 -2
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +2 -2
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +2 -2
data/vendor/faiss/faiss/impl/ThreadedIndex.h +2 -2
data/vendor/faiss/faiss/impl/code_distance/code_distance-avx2.h +2 -2
data/vendor/faiss/faiss/impl/code_distance/code_distance-avx512.h +2 -2
data/vendor/faiss/faiss/impl/code_distance/code_distance-generic.h +2 -2
data/vendor/faiss/faiss/impl/code_distance/code_distance-sve.h +440 -0
data/vendor/faiss/faiss/impl/code_distance/code_distance.h +55 -2
data/vendor/faiss/faiss/impl/index_read.cpp +2 -5
data/vendor/faiss/faiss/impl/index_read_utils.h +2 -2
data/vendor/faiss/faiss/impl/index_write.cpp +2 -6
data/vendor/faiss/faiss/impl/io.cpp +2 -2
data/vendor/faiss/faiss/impl/io.h +2 -2
data/vendor/faiss/faiss/impl/io_macros.h +2 -9
data/vendor/faiss/faiss/impl/kmeans1d.cpp +2 -3
data/vendor/faiss/faiss/impl/kmeans1d.h +2 -2
data/vendor/faiss/faiss/impl/lattice_Zn.cpp +2 -3
data/vendor/faiss/faiss/impl/lattice_Zn.h +2 -2
data/vendor/faiss/faiss/impl/platform_macros.h +12 -2
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +2 -2
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +20 -2
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +2 -2
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +2 -2
data/vendor/faiss/faiss/impl/residual_quantizer_encode_steps.cpp +3 -3
data/vendor/faiss/faiss/impl/residual_quantizer_encode_steps.h +2 -2
data/vendor/faiss/faiss/impl/simd_result_handlers.h +18 -18
data/vendor/faiss/faiss/index_factory.cpp +20 -21
data/vendor/faiss/faiss/index_factory.h +2 -2
data/vendor/faiss/faiss/index_io.h +2 -2
data/vendor/faiss/faiss/invlists/BlockInvertedLists.cpp +2 -2
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +2 -2
data/vendor/faiss/faiss/invlists/DirectMap.cpp +2 -2
data/vendor/faiss/faiss/invlists/DirectMap.h +2 -2
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +2 -2
data/vendor/faiss/faiss/invlists/InvertedLists.h +2 -2
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +2 -2
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.h +2 -2
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +2 -3
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +2 -2
data/vendor/faiss/faiss/python/python_callbacks.cpp +2 -2
data/vendor/faiss/faiss/python/python_callbacks.h +2 -2
data/vendor/faiss/faiss/utils/AlignedTable.h +5 -3
data/vendor/faiss/faiss/utils/Heap.cpp +2 -2
data/vendor/faiss/faiss/utils/Heap.h +2 -2
data/vendor/faiss/faiss/utils/NeuralNet.cpp +11 -7
data/vendor/faiss/faiss/utils/NeuralNet.h +2 -2
data/vendor/faiss/faiss/utils/WorkerThread.cpp +2 -2
data/vendor/faiss/faiss/utils/WorkerThread.h +2 -2
data/vendor/faiss/faiss/utils/approx_topk/approx_topk.h +2 -2
data/vendor/faiss/faiss/utils/approx_topk/avx2-inl.h +2 -2
data/vendor/faiss/faiss/utils/approx_topk/generic.h +2 -2
data/vendor/faiss/faiss/utils/approx_topk/mode.h +2 -2
data/vendor/faiss/faiss/utils/approx_topk_hamming/approx_topk_hamming.h +2 -2
data/vendor/faiss/faiss/utils/bf16.h +2 -2
data/vendor/faiss/faiss/utils/distances.cpp +191 -2
data/vendor/faiss/faiss/utils/distances.h +3 -3
data/vendor/faiss/faiss/utils/distances_fused/avx512.cpp +2 -2
data/vendor/faiss/faiss/utils/distances_fused/avx512.h +2 -2
data/vendor/faiss/faiss/utils/distances_fused/distances_fused.cpp +2 -2
data/vendor/faiss/faiss/utils/distances_fused/distances_fused.h +2 -2
data/vendor/faiss/faiss/utils/distances_fused/simdlib_based.cpp +2 -2
data/vendor/faiss/faiss/utils/distances_fused/simdlib_based.h +2 -2
data/vendor/faiss/faiss/utils/distances_simd.cpp +502 -3
data/vendor/faiss/faiss/utils/extra_distances-inl.h +2 -2
data/vendor/faiss/faiss/utils/extra_distances.cpp +2 -3
data/vendor/faiss/faiss/utils/extra_distances.h +2 -2
data/vendor/faiss/faiss/utils/fp16-arm.h +2 -2
data/vendor/faiss/faiss/utils/fp16-fp16c.h +2 -2
data/vendor/faiss/faiss/utils/fp16-inl.h +2 -2
data/vendor/faiss/faiss/utils/fp16.h +2 -2
data/vendor/faiss/faiss/utils/hamming-inl.h +2 -2
data/vendor/faiss/faiss/utils/hamming.cpp +2 -3
data/vendor/faiss/faiss/utils/hamming.h +2 -2
data/vendor/faiss/faiss/utils/hamming_distance/avx2-inl.h +2 -2
data/vendor/faiss/faiss/utils/hamming_distance/avx512-inl.h +490 -0
data/vendor/faiss/faiss/utils/hamming_distance/common.h +2 -2
data/vendor/faiss/faiss/utils/hamming_distance/generic-inl.h +2 -2
data/vendor/faiss/faiss/utils/hamming_distance/hamdis-inl.h +5 -2
data/vendor/faiss/faiss/utils/hamming_distance/neon-inl.h +5 -5
data/vendor/faiss/faiss/utils/ordered_key_value.h +2 -2
data/vendor/faiss/faiss/utils/partitioning.cpp +2 -2
data/vendor/faiss/faiss/utils/partitioning.h +2 -2
data/vendor/faiss/faiss/utils/prefetch.h +2 -2
data/vendor/faiss/faiss/utils/quantize_lut.cpp +2 -2
data/vendor/faiss/faiss/utils/quantize_lut.h +2 -2
data/vendor/faiss/faiss/utils/random.cpp +2 -2
data/vendor/faiss/faiss/utils/random.h +2 -2
data/vendor/faiss/faiss/utils/simdlib.h +2 -2
data/vendor/faiss/faiss/utils/simdlib_avx2.h +2 -2
data/vendor/faiss/faiss/utils/simdlib_avx512.h +2 -2
data/vendor/faiss/faiss/utils/simdlib_emulated.h +2 -2
data/vendor/faiss/faiss/utils/simdlib_neon.h +2 -2
data/vendor/faiss/faiss/utils/simdlib_ppc64.h +2 -2
data/vendor/faiss/faiss/utils/sorting.cpp +2 -2
data/vendor/faiss/faiss/utils/sorting.h +2 -2
data/vendor/faiss/faiss/utils/transpose/transpose-avx2-inl.h +2 -2
data/vendor/faiss/faiss/utils/transpose/transpose-avx512-inl.h +2 -2
data/vendor/faiss/faiss/utils/utils.cpp +7 -7
data/vendor/faiss/faiss/utils/utils.h +4 -3
metadata +9 -10

data/vendor/faiss/faiss/impl/PolysemousTraining.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.cpp CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.
@@ -11,7 +11,6 @@
 #include <cstdio>
 #include <cstring>
 #include <memory>
-#include <random>
 #include <algorithm>
@@ -20,7 +19,6 @@
 #include <faiss/impl/FaissAssert.h>
 #include <faiss/utils/distances.h>
 #include <faiss/utils/hamming.h>
-#include <faiss/utils/utils.h>
 extern "C" {

data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ProductQuantizer.cpp CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ProductQuantizer.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/Quantizer.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.
@@ -492,40 +492,6 @@ void ResidualQuantizer::refine_beam(
  * Functions using the dot products between codebook entries
  *******************************************************************/
-void ResidualQuantizer::compute_codebook_tables() {
-    cent_norms.resize(total_codebook_size);
-    fvec_norms_L2sqr(
-            cent_norms.data(), codebooks.data(), d, total_codebook_size);
-    size_t cross_table_size = 0;
-    for (int m = 0; m < M; m++) {
-        size_t K = (size_t)1 << nbits[m];
-        cross_table_size += K * codebook_offsets[m];
-    }
-    codebook_cross_products.resize(cross_table_size);
-    size_t ofs = 0;
-    for (int m = 1; m < M; m++) {
-        FINTEGER ki = (size_t)1 << nbits[m];
-        FINTEGER kk = codebook_offsets[m];
-        FINTEGER di = d;
-        float zero = 0, one = 1;
-        assert(ofs + ki * kk <= cross_table_size);
-        sgemm_("Transposed",
-               "Not transposed",
-               &ki,
-               &kk,
-               &di,
-               &one,
-               codebooks.data() + d * kk,
-               &di,
-               codebooks.data(),
-               &di,
-               &zero,
-               codebook_cross_products.data() + ofs,
-               &ki);
-        ofs += ki * kk;
-    }
-}
 void ResidualQuantizer::refine_beam_LUT(
         size_t n,
         const float* query_norms, // size n

data/vendor/faiss/faiss/impl/ResidualQuantizer.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.
@@ -112,7 +112,7 @@ struct ResidualQuantizer : AdditiveQuantizer {
     /** lower-level encode function
      *
-     * @param n              number of vectors to hanlde
+     * @param n              number of vectors to handle
      * @param residuals      vectors to encode, size (n, beam_size, d)
      * @param beam_size      input beam size
      * @param new_beam_size  output beam size (should be <= K * beam_size)
@@ -143,16 +143,6 @@ struct ResidualQuantizer : AdditiveQuantizer {
      * @param beam_size  if != -1, override the beam size
      */
     size_t memory_per_point(int beam_size = -1) const;
-    /** Cross products used in codebook tables used for beam_LUT = 1
-     */
-    void compute_codebook_tables();
-    /// dot products of all codebook entries with the previous codebooks
-    /// size sum(codebook_offsets[m] * 2^nbits[m], m=0..M-1)
-    std::vector<float> codebook_cross_products;
-    /// norms of all codebook entries (size total_codebook_size)
-    std::vector<float> cent_norms;
 };
 } // namespace faiss

data/vendor/faiss/faiss/impl/ResultHandler.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ScalarQuantizer.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/ThreadedIndex.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/code_distance/code_distance-avx2.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/code_distance/code_distance-avx512.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/code_distance/code_distance-generic.h CHANGED Viewed

@@ -1,5 +1,5 @@
-/**
- * Copyright (c) Facebook, Inc. and its affiliates.
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
  *
  * This source code is licensed under the MIT license found in the
  * LICENSE file in the root directory of this source tree.

data/vendor/faiss/faiss/impl/code_distance/code_distance-sve.h ADDED Viewed

@@ -0,0 +1,440 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ *
+ * This source code is licensed under the MIT license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+#pragma once
+#ifdef __ARM_FEATURE_SVE
+#include <arm_sve.h>
+#include <tuple>
+#include <type_traits>
+#include <faiss/impl/code_distance/code_distance-generic.h>
+namespace faiss {
+template <typename PQDecoderT>
+std::enable_if_t<!std::is_same_v<PQDecoderT, PQDecoder8>, float> inline distance_single_code_sve(
+        // the product quantizer
+        const size_t M,
+        // number of bits per quantization index
+        const size_t nbits,
+        // precomputed distances, layout (M, ksub)
+        const float* sim_table,
+        const uint8_t* code) {
+    // default implementation
+    return distance_single_code_generic<PQDecoderT>(M, nbits, sim_table, code);
+}
+static inline void distance_codes_kernel(
+        svbool_t pg,
+        svuint32_t idx1,
+        svuint32_t offsets_0,
+        const float* tab,
+        svfloat32_t& partialSum) {
+    // add offset
+    const auto indices_to_read_from = svadd_u32_x(pg, idx1, offsets_0);
+    // gather values, similar to some operations of tab[index]
+    const auto collected =
+            svld1_gather_u32index_f32(pg, tab, indices_to_read_from);
+    // collect partial sum
+    partialSum = svadd_f32_m(pg, partialSum, collected);
+}
+static float distance_single_code_sve_for_small_m(
+        // the product quantizer
+        const size_t M,
+        // precomputed distances, layout (M, ksub)
+        const float* sim_table,
+        // codes
+        const uint8_t* __restrict code) {
+    constexpr size_t nbits = 8u;
+    const size_t ksub = 1 << nbits;
+    const auto offsets_0 = svindex_u32(0, static_cast<uint32_t>(ksub));
+    // loop
+    const auto pg = svwhilelt_b32_u64(0, M);
+    auto mm1 = svld1ub_u32(pg, code);
+    mm1 = svadd_u32_x(pg, mm1, offsets_0);
+    const auto collected0 = svld1_gather_u32index_f32(pg, sim_table, mm1);
+    return svaddv_f32(pg, collected0);
+}
+template <typename PQDecoderT>
+std::enable_if_t<std::is_same_v<PQDecoderT, PQDecoder8>, float> inline distance_single_code_sve(
+        // the product quantizer
+        const size_t M,
+        // number of bits per quantization index
+        const size_t nbits,
+        // precomputed distances, layout (M, ksub)
+        const float* sim_table,
+        const uint8_t* code) {
+    if (M <= svcntw())
+        return distance_single_code_sve_for_small_m(M, sim_table, code);
+    const float* tab = sim_table;
+    const size_t ksub = 1 << nbits;
+    const auto offsets_0 = svindex_u32(0, static_cast<uint32_t>(ksub));
+    // accumulators of partial sums
+    auto partialSum = svdup_n_f32(0.f);
+    const auto lanes = svcntb();
+    const auto quad_lanes = lanes / 4;
+    // loop
+    for (std::size_t m = 0; m < M;) {
+        const auto pg = svwhilelt_b8_u64(m, M);
+        const auto mm1 = svld1_u8(pg, code + m);
+        {
+            const auto mm1lo = svunpklo_u16(mm1);
+            const auto pglo = svunpklo_b(pg);
+            {
+                // convert uint8 values to uint32 values
+                const auto idx1 = svunpklo_u32(mm1lo);
+                const auto pglolo = svunpklo_b(pglo);
+                distance_codes_kernel(pglolo, idx1, offsets_0, tab, partialSum);
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+            if (m >= M)
+                break;
+            {
+                // convert uint8 values to uint32 values
+                const auto idx1 = svunpkhi_u32(mm1lo);
+                const auto pglohi = svunpkhi_b(pglo);
+                distance_codes_kernel(pglohi, idx1, offsets_0, tab, partialSum);
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+            if (m >= M)
+                break;
+        }
+        {
+            const auto mm1hi = svunpkhi_u16(mm1);
+            const auto pghi = svunpkhi_b(pg);
+            {
+                // convert uint8 values to uint32 values
+                const auto idx1 = svunpklo_u32(mm1hi);
+                const auto pghilo = svunpklo_b(pghi);
+                distance_codes_kernel(pghilo, idx1, offsets_0, tab, partialSum);
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+            if (m >= M)
+                break;
+            {
+                // convert uint8 values to uint32 values
+                const auto idx1 = svunpkhi_u32(mm1hi);
+                const auto pghihi = svunpkhi_b(pghi);
+                distance_codes_kernel(pghihi, idx1, offsets_0, tab, partialSum);
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+        }
+    }
+    return svaddv_f32(svptrue_b32(), partialSum);
+}
+template <typename PQDecoderT>
+std::enable_if_t<!std::is_same_v<PQDecoderT, PQDecoder8>, void>
+distance_four_codes_sve(
+        // the product quantizer
+        const size_t M,
+        // number of bits per quantization index
+        const size_t nbits,
+        // precomputed distances, layout (M, ksub)
+        const float* sim_table,
+        // codes
+        const uint8_t* __restrict code0,
+        const uint8_t* __restrict code1,
+        const uint8_t* __restrict code2,
+        const uint8_t* __restrict code3,
+        // computed distances
+        float& result0,
+        float& result1,
+        float& result2,
+        float& result3) {
+    distance_four_codes_generic<PQDecoderT>(
+            M,
+            nbits,
+            sim_table,
+            code0,
+            code1,
+            code2,
+            code3,
+            result0,
+            result1,
+            result2,
+            result3);
+}
+static void distance_four_codes_sve_for_small_m(
+        // the product quantizer
+        const size_t M,
+        // precomputed distances, layout (M, ksub)
+        const float* sim_table,
+        // codes
+        const uint8_t* __restrict code0,
+        const uint8_t* __restrict code1,
+        const uint8_t* __restrict code2,
+        const uint8_t* __restrict code3,
+        // computed distances
+        float& result0,
+        float& result1,
+        float& result2,
+        float& result3) {
+    constexpr size_t nbits = 8u;
+    const size_t ksub = 1 << nbits;
+    const auto offsets_0 = svindex_u32(0, static_cast<uint32_t>(ksub));
+    const auto quad_lanes = svcntw();
+    // loop
+    const auto pg = svwhilelt_b32_u64(0, M);
+    auto mm10 = svld1ub_u32(pg, code0);
+    auto mm11 = svld1ub_u32(pg, code1);
+    auto mm12 = svld1ub_u32(pg, code2);
+    auto mm13 = svld1ub_u32(pg, code3);
+    mm10 = svadd_u32_x(pg, mm10, offsets_0);
+    mm11 = svadd_u32_x(pg, mm11, offsets_0);
+    mm12 = svadd_u32_x(pg, mm12, offsets_0);
+    mm13 = svadd_u32_x(pg, mm13, offsets_0);
+    const auto collected0 = svld1_gather_u32index_f32(pg, sim_table, mm10);
+    const auto collected1 = svld1_gather_u32index_f32(pg, sim_table, mm11);
+    const auto collected2 = svld1_gather_u32index_f32(pg, sim_table, mm12);
+    const auto collected3 = svld1_gather_u32index_f32(pg, sim_table, mm13);
+    result0 = svaddv_f32(pg, collected0);
+    result1 = svaddv_f32(pg, collected1);
+    result2 = svaddv_f32(pg, collected2);
+    result3 = svaddv_f32(pg, collected3);
+}
+// Combines 4 operations of distance_single_code()
+template <typename PQDecoderT>
+std::enable_if_t<std::is_same_v<PQDecoderT, PQDecoder8>, void>
+distance_four_codes_sve(
+        // the product quantizer
+        const size_t M,
+        // number of bits per quantization index
+        const size_t nbits,
+        // precomputed distances, layout (M, ksub)
+        const float* sim_table,
+        // codes
+        const uint8_t* __restrict code0,
+        const uint8_t* __restrict code1,
+        const uint8_t* __restrict code2,
+        const uint8_t* __restrict code3,
+        // computed distances
+        float& result0,
+        float& result1,
+        float& result2,
+        float& result3) {
+    if (M <= svcntw()) {
+        distance_four_codes_sve_for_small_m(
+                M,
+                sim_table,
+                code0,
+                code1,
+                code2,
+                code3,
+                result0,
+                result1,
+                result2,
+                result3);
+        return;
+    }
+    const float* tab = sim_table;
+    const size_t ksub = 1 << nbits;
+    const auto offsets_0 = svindex_u32(0, static_cast<uint32_t>(ksub));
+    // accumulators of partial sums
+    auto partialSum0 = svdup_n_f32(0.f);
+    auto partialSum1 = svdup_n_f32(0.f);
+    auto partialSum2 = svdup_n_f32(0.f);
+    auto partialSum3 = svdup_n_f32(0.f);
+    const auto lanes = svcntb();
+    const auto quad_lanes = lanes / 4;
+    // loop
+    for (std::size_t m = 0; m < M;) {
+        const auto pg = svwhilelt_b8_u64(m, M);
+        const auto mm10 = svld1_u8(pg, code0 + m);
+        const auto mm11 = svld1_u8(pg, code1 + m);
+        const auto mm12 = svld1_u8(pg, code2 + m);
+        const auto mm13 = svld1_u8(pg, code3 + m);
+        {
+            const auto mm10lo = svunpklo_u16(mm10);
+            const auto mm11lo = svunpklo_u16(mm11);
+            const auto mm12lo = svunpklo_u16(mm12);
+            const auto mm13lo = svunpklo_u16(mm13);
+            const auto pglo = svunpklo_b(pg);
+            {
+                const auto pglolo = svunpklo_b(pglo);
+                {
+                    const auto idx1 = svunpklo_u32(mm10lo);
+                    distance_codes_kernel(
+                            pglolo, idx1, offsets_0, tab, partialSum0);
+                }
+                {
+                    const auto idx1 = svunpklo_u32(mm11lo);
+                    distance_codes_kernel(
+                            pglolo, idx1, offsets_0, tab, partialSum1);
+                }
+                {
+                    const auto idx1 = svunpklo_u32(mm12lo);
+                    distance_codes_kernel(
+                            pglolo, idx1, offsets_0, tab, partialSum2);
+                }
+                {
+                    const auto idx1 = svunpklo_u32(mm13lo);
+                    distance_codes_kernel(
+                            pglolo, idx1, offsets_0, tab, partialSum3);
+                }
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+            if (m >= M)
+                break;
+            {
+                const auto pglohi = svunpkhi_b(pglo);
+                {
+                    const auto idx1 = svunpkhi_u32(mm10lo);
+                    distance_codes_kernel(
+                            pglohi, idx1, offsets_0, tab, partialSum0);
+                }
+                {
+                    const auto idx1 = svunpkhi_u32(mm11lo);
+                    distance_codes_kernel(
+                            pglohi, idx1, offsets_0, tab, partialSum1);
+                }
+                {
+                    const auto idx1 = svunpkhi_u32(mm12lo);
+                    distance_codes_kernel(
+                            pglohi, idx1, offsets_0, tab, partialSum2);
+                }
+                {
+                    const auto idx1 = svunpkhi_u32(mm13lo);
+                    distance_codes_kernel(
+                            pglohi, idx1, offsets_0, tab, partialSum3);
+                }
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+            if (m >= M)
+                break;
+        }
+        {
+            const auto mm10hi = svunpkhi_u16(mm10);
+            const auto mm11hi = svunpkhi_u16(mm11);
+            const auto mm12hi = svunpkhi_u16(mm12);
+            const auto mm13hi = svunpkhi_u16(mm13);
+            const auto pghi = svunpkhi_b(pg);
+            {
+                const auto pghilo = svunpklo_b(pghi);
+                {
+                    const auto idx1 = svunpklo_u32(mm10hi);
+                    distance_codes_kernel(
+                            pghilo, idx1, offsets_0, tab, partialSum0);
+                }
+                {
+                    const auto idx1 = svunpklo_u32(mm11hi);
+                    distance_codes_kernel(
+                            pghilo, idx1, offsets_0, tab, partialSum1);
+                }
+                {
+                    const auto idx1 = svunpklo_u32(mm12hi);
+                    distance_codes_kernel(
+                            pghilo, idx1, offsets_0, tab, partialSum2);
+                }
+                {
+                    const auto idx1 = svunpklo_u32(mm13hi);
+                    distance_codes_kernel(
+                            pghilo, idx1, offsets_0, tab, partialSum3);
+                }
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+            if (m >= M)
+                break;
+            {
+                const auto pghihi = svunpkhi_b(pghi);
+                {
+                    const auto idx1 = svunpkhi_u32(mm10hi);
+                    distance_codes_kernel(
+                            pghihi, idx1, offsets_0, tab, partialSum0);
+                }
+                {
+                    const auto idx1 = svunpkhi_u32(mm11hi);
+                    distance_codes_kernel(
+                            pghihi, idx1, offsets_0, tab, partialSum1);
+                }
+                {
+                    const auto idx1 = svunpkhi_u32(mm12hi);
+                    distance_codes_kernel(
+                            pghihi, idx1, offsets_0, tab, partialSum2);
+                }
+                {
+                    const auto idx1 = svunpkhi_u32(mm13hi);
+                    distance_codes_kernel(
+                            pghihi, idx1, offsets_0, tab, partialSum3);
+                }
+                tab += ksub * quad_lanes;
+            }
+            m += quad_lanes;
+        }
+    }
+    result0 = svaddv_f32(svptrue_b32(), partialSum0);
+    result1 = svaddv_f32(svptrue_b32(), partialSum1);
+    result2 = svaddv_f32(svptrue_b32(), partialSum2);
+    result3 = svaddv_f32(svptrue_b32(), partialSum3);
+}
+} // namespace faiss
+#endif