RubyGems - faiss - Versions diffs - 0.2.4 → 0.2.5 - Mend

faiss 0.2.4 → 0.2.5

Files changed (177) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +5 -0
data/README.md +23 -21
data/ext/faiss/extconf.rb +11 -0
data/ext/faiss/index.cpp +4 -4
data/ext/faiss/index_binary.cpp +6 -6
data/ext/faiss/product_quantizer.cpp +4 -4
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +13 -0
data/vendor/faiss/faiss/IVFlib.cpp +101 -2
data/vendor/faiss/faiss/IVFlib.h +26 -2
data/vendor/faiss/faiss/Index.cpp +36 -3
data/vendor/faiss/faiss/Index.h +43 -6
data/vendor/faiss/faiss/Index2Layer.cpp +6 -2
data/vendor/faiss/faiss/Index2Layer.h +6 -1
data/vendor/faiss/faiss/IndexAdditiveQuantizer.cpp +219 -16
data/vendor/faiss/faiss/IndexAdditiveQuantizer.h +63 -5
data/vendor/faiss/faiss/IndexAdditiveQuantizerFastScan.cpp +299 -0
data/vendor/faiss/faiss/IndexAdditiveQuantizerFastScan.h +199 -0
data/vendor/faiss/faiss/IndexBinary.cpp +20 -4
data/vendor/faiss/faiss/IndexBinary.h +18 -3
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +9 -2
data/vendor/faiss/faiss/IndexBinaryFlat.h +4 -2
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +4 -1
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +2 -1
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +5 -1
data/vendor/faiss/faiss/IndexBinaryHNSW.h +2 -1
data/vendor/faiss/faiss/IndexBinaryHash.cpp +17 -4
data/vendor/faiss/faiss/IndexBinaryHash.h +8 -4
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +28 -13
data/vendor/faiss/faiss/IndexBinaryIVF.h +10 -7
data/vendor/faiss/faiss/IndexFastScan.cpp +626 -0
data/vendor/faiss/faiss/IndexFastScan.h +145 -0
data/vendor/faiss/faiss/IndexFlat.cpp +34 -21
data/vendor/faiss/faiss/IndexFlat.h +7 -4
data/vendor/faiss/faiss/IndexFlatCodes.cpp +35 -1
data/vendor/faiss/faiss/IndexFlatCodes.h +12 -0
data/vendor/faiss/faiss/IndexHNSW.cpp +66 -138
data/vendor/faiss/faiss/IndexHNSW.h +4 -2
data/vendor/faiss/faiss/IndexIDMap.cpp +247 -0
data/vendor/faiss/faiss/IndexIDMap.h +107 -0
data/vendor/faiss/faiss/IndexIVF.cpp +121 -33
data/vendor/faiss/faiss/IndexIVF.h +35 -16
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +84 -7
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.h +63 -1
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizerFastScan.cpp +590 -0
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizerFastScan.h +171 -0
data/vendor/faiss/faiss/IndexIVFFastScan.cpp +1290 -0
data/vendor/faiss/faiss/IndexIVFFastScan.h +213 -0
data/vendor/faiss/faiss/IndexIVFFlat.cpp +37 -17
data/vendor/faiss/faiss/IndexIVFFlat.h +4 -2
data/vendor/faiss/faiss/IndexIVFPQ.cpp +234 -50
data/vendor/faiss/faiss/IndexIVFPQ.h +5 -1
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +23 -852
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +7 -112
data/vendor/faiss/faiss/IndexIVFPQR.cpp +3 -3
data/vendor/faiss/faiss/IndexIVFPQR.h +1 -1
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +3 -1
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +2 -1
data/vendor/faiss/faiss/IndexLSH.cpp +4 -2
data/vendor/faiss/faiss/IndexLSH.h +2 -1
data/vendor/faiss/faiss/IndexLattice.cpp +7 -1
data/vendor/faiss/faiss/IndexLattice.h +3 -1
data/vendor/faiss/faiss/IndexNNDescent.cpp +4 -3
data/vendor/faiss/faiss/IndexNNDescent.h +2 -1
data/vendor/faiss/faiss/IndexNSG.cpp +37 -3
data/vendor/faiss/faiss/IndexNSG.h +25 -1
data/vendor/faiss/faiss/IndexPQ.cpp +106 -69
data/vendor/faiss/faiss/IndexPQ.h +19 -5
data/vendor/faiss/faiss/IndexPQFastScan.cpp +15 -450
data/vendor/faiss/faiss/IndexPQFastScan.h +15 -78
data/vendor/faiss/faiss/IndexPreTransform.cpp +47 -8
data/vendor/faiss/faiss/IndexPreTransform.h +15 -3
data/vendor/faiss/faiss/IndexRefine.cpp +8 -4
data/vendor/faiss/faiss/IndexRefine.h +4 -2
data/vendor/faiss/faiss/IndexReplicas.cpp +4 -2
data/vendor/faiss/faiss/IndexReplicas.h +2 -1
data/vendor/faiss/faiss/IndexRowwiseMinMax.cpp +438 -0
data/vendor/faiss/faiss/IndexRowwiseMinMax.h +92 -0
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +26 -15
data/vendor/faiss/faiss/IndexScalarQuantizer.h +6 -7
data/vendor/faiss/faiss/IndexShards.cpp +4 -1
data/vendor/faiss/faiss/IndexShards.h +2 -1
data/vendor/faiss/faiss/MetaIndexes.cpp +5 -178
data/vendor/faiss/faiss/MetaIndexes.h +3 -81
data/vendor/faiss/faiss/VectorTransform.cpp +43 -0
data/vendor/faiss/faiss/VectorTransform.h +22 -4
data/vendor/faiss/faiss/clone_index.cpp +23 -1
data/vendor/faiss/faiss/clone_index.h +3 -0
data/vendor/faiss/faiss/cppcontrib/SaDecodeKernels.h +300 -0
data/vendor/faiss/faiss/cppcontrib/detail/CoarseBitType.h +24 -0
data/vendor/faiss/faiss/cppcontrib/detail/UintReader.h +195 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/Level2-avx2-inl.h +2058 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/Level2-inl.h +408 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/Level2-neon-inl.h +2147 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/MinMax-inl.h +460 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/MinMaxFP16-inl.h +465 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/PQ-avx2-inl.h +1618 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/PQ-inl.h +251 -0
data/vendor/faiss/faiss/cppcontrib/sa_decode/PQ-neon-inl.h +1452 -0
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +1 -0
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +0 -4
data/vendor/faiss/faiss/gpu/GpuIndex.h +28 -4
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +2 -1
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +10 -8
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +75 -14
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +19 -32
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +22 -31
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +22 -28
data/vendor/faiss/faiss/gpu/GpuResources.cpp +14 -0
data/vendor/faiss/faiss/gpu/GpuResources.h +16 -3
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +3 -3
data/vendor/faiss/faiss/gpu/impl/IndexUtils.h +32 -0
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +1 -0
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +311 -75
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +10 -0
data/vendor/faiss/faiss/gpu/test/TestUtils.h +3 -0
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +2 -2
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +5 -4
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +116 -47
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +44 -13
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +0 -54
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +0 -76
data/vendor/faiss/faiss/impl/DistanceComputer.h +64 -0
data/vendor/faiss/faiss/impl/HNSW.cpp +123 -27
data/vendor/faiss/faiss/impl/HNSW.h +19 -16
data/vendor/faiss/faiss/impl/IDSelector.cpp +125 -0
data/vendor/faiss/faiss/impl/IDSelector.h +135 -0
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +6 -28
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +6 -1
data/vendor/faiss/faiss/impl/LookupTableScaler.h +77 -0
data/vendor/faiss/faiss/impl/NNDescent.cpp +1 -0
data/vendor/faiss/faiss/impl/NSG.cpp +1 -1
data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.cpp +383 -0
data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.h +154 -0
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +225 -145
data/vendor/faiss/faiss/impl/ProductQuantizer.h +29 -10
data/vendor/faiss/faiss/impl/Quantizer.h +43 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +192 -36
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +40 -20
data/vendor/faiss/faiss/impl/ResultHandler.h +96 -0
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +97 -173
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +18 -18
data/vendor/faiss/faiss/impl/index_read.cpp +240 -9
data/vendor/faiss/faiss/impl/index_write.cpp +237 -5
data/vendor/faiss/faiss/impl/kmeans1d.cpp +6 -4
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +56 -16
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +25 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +66 -25
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +75 -27
data/vendor/faiss/faiss/index_factory.cpp +196 -7
data/vendor/faiss/faiss/index_io.h +5 -0
data/vendor/faiss/faiss/invlists/DirectMap.cpp +1 -0
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +4 -1
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +2 -1
data/vendor/faiss/faiss/python/python_callbacks.cpp +27 -0
data/vendor/faiss/faiss/python/python_callbacks.h +15 -0
data/vendor/faiss/faiss/utils/Heap.h +31 -15
data/vendor/faiss/faiss/utils/distances.cpp +380 -56
data/vendor/faiss/faiss/utils/distances.h +113 -15
data/vendor/faiss/faiss/utils/distances_simd.cpp +726 -6
data/vendor/faiss/faiss/utils/extra_distances.cpp +12 -7
data/vendor/faiss/faiss/utils/extra_distances.h +3 -1
data/vendor/faiss/faiss/utils/fp16-fp16c.h +21 -0
data/vendor/faiss/faiss/utils/fp16-inl.h +101 -0
data/vendor/faiss/faiss/utils/fp16.h +11 -0
data/vendor/faiss/faiss/utils/hamming-inl.h +54 -0
data/vendor/faiss/faiss/utils/hamming.cpp +0 -48
data/vendor/faiss/faiss/utils/ordered_key_value.h +10 -0
data/vendor/faiss/faiss/utils/quantize_lut.cpp +62 -0
data/vendor/faiss/faiss/utils/quantize_lut.h +20 -0
data/vendor/faiss/faiss/utils/random.cpp +53 -0
data/vendor/faiss/faiss/utils/random.h +5 -0
data/vendor/faiss/faiss/utils/simdlib_avx2.h +4 -0
data/vendor/faiss/faiss/utils/simdlib_emulated.h +6 -1
data/vendor/faiss/faiss/utils/simdlib_neon.h +7 -2
metadata +37 -3

data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp CHANGED Viewed

@@ -16,6 +16,7 @@
 #include <faiss/gpu/GpuIndexIVFFlat.h>
 #include <faiss/gpu/GpuIndexIVFPQ.h>
 #include <faiss/gpu/GpuIndexIVFScalarQuantizer.h>
+#include <faiss/gpu/impl/IndexUtils.h>
 #include <faiss/gpu/utils/DeviceUtils.h>
 #include <faiss/impl/FaissAssert.h>

data/vendor/faiss/faiss/gpu/GpuCloner.cpp CHANGED Viewed

@@ -121,7 +121,6 @@ Index* ToGpuCloner::clone_Index(const Index* index) {
         GpuIndexFlatConfig config;
         config.device = device;
         config.useFloat16 = useFloat16;
-        config.storeTransposed = storeTransposed;
         return new GpuIndexFlat(provider, ifl, config);
     } else if (
             dynamic_cast<const IndexScalarQuantizer*>(index) &&
@@ -147,7 +146,6 @@ Index* ToGpuCloner::clone_Index(const Index* index) {
         config.device = device;
         config.indicesOptions = indicesOptions;
         config.flatConfig.useFloat16 = useFloat16CoarseQuantizer;
-        config.flatConfig.storeTransposed = storeTransposed;
         GpuIndexIVFFlat* res = new GpuIndexIVFFlat(
                 provider, ifl->d, ifl->nlist, ifl->metric_type, config);
@@ -164,7 +162,6 @@ Index* ToGpuCloner::clone_Index(const Index* index) {
         config.device = device;
         config.indicesOptions = indicesOptions;
         config.flatConfig.useFloat16 = useFloat16CoarseQuantizer;
-        config.flatConfig.storeTransposed = storeTransposed;
         GpuIndexIVFScalarQuantizer* res = new GpuIndexIVFScalarQuantizer(
                 provider,
@@ -195,7 +192,6 @@ Index* ToGpuCloner::clone_Index(const Index* index) {
         config.device = device;
         config.indicesOptions = indicesOptions;
         config.flatConfig.useFloat16 = useFloat16CoarseQuantizer;
-        config.flatConfig.storeTransposed = storeTransposed;
         config.useFloat16LookupTables = useFloat16;
         config.usePrecomputedTables = usePrecomputed;

data/vendor/faiss/faiss/gpu/GpuIndex.h CHANGED Viewed

@@ -74,7 +74,19 @@ class GpuIndex : public faiss::Index {
             const float* x,
             Index::idx_t k,
             float* distances,
-            Index::idx_t* labels) const override;
+            Index::idx_t* labels,
+            const SearchParameters* params = nullptr) const override;
+    /// `x`, `distances`, `labels` and `recons` can be resident on the CPU or
+    /// any GPU; copies are performed as needed
+    void search_and_reconstruct(
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels,
+            float* recons,
+            const SearchParameters* params = nullptr) const override;
     /// Overridden to force GPU indices to provide their own GPU-friendly
     /// implementation
@@ -111,7 +123,8 @@ class GpuIndex : public faiss::Index {
             const float* x,
             int k,
             float* distances,
-            Index::idx_t* labels) const = 0;
+            Index::idx_t* labels,
+            const SearchParameters* params) const = 0;
    private:
     /// Handles paged adds if the add set is too large, passes to
@@ -127,7 +140,8 @@ class GpuIndex : public faiss::Index {
             const float* x,
             int k,
             float* outDistancesData,
-            Index::idx_t* outIndicesData) const;
+            Index::idx_t* outIndicesData,
+            const SearchParameters* params) const;
     /// Calls searchImpl_ for a single page of GPU-resident data,
     /// handling paging of the data and copies from the CPU
@@ -136,7 +150,8 @@ class GpuIndex : public faiss::Index {
             const float* x,
             int k,
             float* outDistancesData,
-            Index::idx_t* outIndicesData) const;
+            Index::idx_t* outIndicesData,
+            const SearchParameters* params) const;
    protected:
     /// Manages streams, cuBLAS handles and scratch memory for devices
@@ -149,5 +164,14 @@ class GpuIndex : public faiss::Index {
     size_t minPagedSize_;
 };
+/// If the given index is a GPU index, this returns the index instance
+GpuIndex* tryCastGpuIndex(faiss::Index* index);
+/// Is the given index instance a GPU index?
+bool isGpuIndex(faiss::Index* index);
+/// Does the given CPU index instance have a corresponding GPU implementation?
+bool isGpuIndexImplemented(faiss::Index* index);
 } // namespace gpu
 } // namespace faiss

data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h CHANGED Viewed

@@ -62,7 +62,8 @@ class GpuIndexBinaryFlat : public IndexBinary {
             const uint8_t* x,
             faiss::IndexBinary::idx_t k,
             int32_t* distances,
-            faiss::IndexBinary::idx_t* labels) const override;
+            faiss::IndexBinary::idx_t* labels,
+            const faiss::SearchParameters* params = nullptr) const override;
     void reconstruct(faiss::IndexBinary::idx_t key, uint8_t* recons)
             const override;

data/vendor/faiss/faiss/gpu/GpuIndexFlat.h CHANGED Viewed

@@ -24,17 +24,14 @@ namespace gpu {
 class FlatIndex;
 struct GpuIndexFlatConfig : public GpuIndexConfig {
-    inline GpuIndexFlatConfig() : useFloat16(false), storeTransposed(false) {}
+    inline GpuIndexFlatConfig() : useFloat16(false) {}
     /// Whether or not data is stored as float16
     bool useFloat16;
-    /// Whether or not data is stored (transparently) in a transposed
-    /// layout, enabling use of the NN GEMM call, which is ~10% faster.
-    /// This will improve the speed of the flat index, but will
-    /// substantially slow down any add() calls made, as all data must
-    /// be transposed, and will increase storage requirements (we store
-    /// data in both transposed and non-transposed layouts).
+    /// Deprecated: no longer used
+    /// Previously used to indicate whether internal storage of vectors is
+    /// transposed
     bool storeTransposed;
 };
@@ -98,6 +95,10 @@ class GpuIndexFlat : public GpuIndex {
     void reconstruct_n(Index::idx_t i0, Index::idx_t num, float* out)
             const override;
+    /// Batch reconstruction method
+    void reconstruct_batch(Index::idx_t n, const Index::idx_t* keys, float* out)
+            const override;
     /// Compute residual
     void compute_residual(const float* x, float* residual, Index::idx_t key)
             const override;
@@ -128,7 +129,8 @@ class GpuIndexFlat : public GpuIndex {
             const float* x,
             int k,
             float* distances,
-            Index::idx_t* labels) const override;
+            Index::idx_t* labels,
+            const SearchParameters* params) const override;
    protected:
     /// Our configuration options

data/vendor/faiss/faiss/gpu/GpuIndexIVF.h CHANGED Viewed

@@ -8,18 +8,17 @@
 #pragma once
 #include <faiss/Clustering.h>
+#include <faiss/IndexIVF.h> // for SearchParametersIVF
 #include <faiss/gpu/GpuIndex.h>
 #include <faiss/gpu/GpuIndexFlat.h>
 #include <faiss/gpu/GpuIndicesOptions.h>
-namespace faiss {
-struct IndexIVF;
-}
+#include <memory>
 namespace faiss {
 namespace gpu {
 class GpuIndexFlat;
+class IVFBase;
 struct GpuIndexIVFConfig : public GpuIndexConfig {
     inline GpuIndexIVFConfig() : indicesOptions(INDICES_64_BIT) {}
@@ -31,8 +30,13 @@ struct GpuIndexIVFConfig : public GpuIndexConfig {
     GpuIndexFlatConfig flatConfig;
 };
+/// Base class of all GPU IVF index types. This (for now) deliberately does not
+/// inherit from IndexIVF, as many of the public data members and much of the
+/// functionality in IndexIVF are not supported in the same manner on the GPU.
 class GpuIndexIVF : public GpuIndex {
    public:
+    /// Version that auto-constructs a flat coarse quantizer based on the
+    /// desired metric
     GpuIndexIVF(
             GpuResourcesProvider* provider,
             int dims,
@@ -41,6 +45,17 @@ class GpuIndexIVF : public GpuIndex {
             int nlist,
             GpuIndexIVFConfig config = GpuIndexIVFConfig());
+    /// Version that takes a coarse quantizer instance. The GpuIndexIVF does not
+    /// own the coarseQuantizer instance by default (functions like IndexIVF).
+    GpuIndexIVF(
+            GpuResourcesProvider* provider,
+            Index* coarseQuantizer,
+            int dims,
+            faiss::MetricType metric,
+            float metricArg,
+            int nlist,
+            GpuIndexIVFConfig config = GpuIndexIVFConfig());
     ~GpuIndexIVF() override;
    private:
@@ -54,11 +69,16 @@ class GpuIndexIVF : public GpuIndex {
     /// Copy what we have to the CPU equivalent
     void copyTo(faiss::IndexIVF* index) const;
+    /// Should be called if the user ever changes the state of the IVF coarse
+    /// quantizer manually (e.g., substitutes a new instance or changes vectors
+    /// in the coarse quantizer outside the scope of training)
+    virtual void updateQuantizer() = 0;
     /// Returns the number of inverted lists we're managing
     int getNumLists() const;
     /// Returns the number of vectors present in a particular inverted list
-    virtual int getListLength(int listId) const = 0;
+    int getListLength(int listId) const;
     /// Return the encoded vector data contained in a particular inverted list,
     /// for debugging purposes.
@@ -66,16 +86,12 @@ class GpuIndexIVF : public GpuIndex {
     /// GPU-side representation.
     /// Otherwise, it is converted to the CPU-compliant format, while the
     /// native GPU format may differ.
-    virtual std::vector<uint8_t> getListVectorData(
-            int listId,
-            bool gpuFormat = false) const = 0;
+    std::vector<uint8_t> getListVectorData(int listId, bool gpuFormat = false)
+            const;
     /// Return the vector indices contained in a particular inverted list, for
     /// debugging purposes.
-    virtual std::vector<Index::idx_t> getListIndices(int listId) const = 0;
-    /// Return the quantizer we're using
-    GpuIndexFlat* getQuantizer();
+    std::vector<Index::idx_t> getListIndices(int listId) const;
     /// Sets the number of list probes per query
     void setNumProbes(int nprobe);
@@ -83,10 +99,49 @@ class GpuIndexIVF : public GpuIndex {
     /// Returns our current number of list probes per query
     int getNumProbes() const;
+    /// Same interface as faiss::IndexIVF, in order to search a set of vectors
+    /// pre-quantized by the IVF quantizer. Does not include IndexIVFStats as
+    /// that can only be obtained on the host via a GPU d2h copy.
+    /// @param n      number of vectors to query
+    /// @param x      query vectors, size n * d
+    /// @param assign coarse quantization indices, size n * nprobe
+    /// @param centroid_dis
+    ///             distances to coarse centroids, size n * nprobe
+    /// @param distances
+    ///             output distances, size n * k
+    /// @param labels output labels, size n * k
+    /// @param store_pairs store inv list index + inv list offset
+    ///                   in upper/lower 32 bits of result,
+    ///                   instead of ids (used for reranking).
+    /// @param params used to override the object's search parameters
+    void search_preassigned(
+            idx_t n,
+            const float* x,
+            idx_t k,
+            const idx_t* assign,
+            const float* centroid_dis,
+            float* distances,
+            idx_t* labels,
+            bool store_pairs,
+            const SearchParametersIVF* params = nullptr) const;
    protected:
+    void verifyIVFSettings_() const;
     bool addImplRequiresIDs_() const override;
     void trainQuantizer_(Index::idx_t n, const float* x);
+    /// Called from GpuIndex for add/add_with_ids
+    void addImpl_(int n, const float* x, const Index::idx_t* ids) override;
+    /// Called from GpuIndex for search
+    void searchImpl_(
+            int n,
+            const float* x,
+            int k,
+            float* distances,
+            Index::idx_t* labels,
+            const SearchParameters* params) const override;
    public:
     /// Exposing this like the CPU version for manipulation
     ClusteringParameters cp;
@@ -97,12 +152,18 @@ class GpuIndexIVF : public GpuIndex {
     /// Exposing this like the CPU version for manipulation
     int nprobe;
-    /// Exposeing this like the CPU version for query
-    GpuIndexFlat* quantizer;
+    /// A user-pluggable coarse quantizer
+    Index* quantizer;
+    /// Whether or not we own the coarse quantizer
+    bool own_fields;
    protected:
     /// Our configuration options
     const GpuIndexIVFConfig ivfConfig_;
+    /// For a trained/initialized index, this is a reference to the base class
+    std::shared_ptr<IVFBase> baseIndex_;
 };
 } // namespace gpu

data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h CHANGED Viewed

@@ -40,12 +40,22 @@ class GpuIndexIVFFlat : public GpuIndexIVF {
             GpuIndexIVFFlatConfig config = GpuIndexIVFFlatConfig());
     /// Constructs a new instance with an empty flat quantizer; the user
-    /// provides the number of lists desired.
+    /// provides the number of IVF lists desired.
     GpuIndexIVFFlat(
             GpuResourcesProvider* provider,
             int dims,
             int nlist,
-            faiss::MetricType metric,
+            faiss::MetricType metric = faiss::METRIC_L2,
+            GpuIndexIVFFlatConfig config = GpuIndexIVFFlatConfig());
+    /// Constructs a new instance with a provided CPU or GPU coarse quantizer;
+    /// the user provides the number of IVF lists desired.
+    GpuIndexIVFFlat(
+            GpuResourcesProvider* provider,
+            Index* coarseQuantizer,
+            int dims,
+            int nlist,
+            faiss::MetricType metric = faiss::METRIC_L2,
             GpuIndexIVFFlatConfig config = GpuIndexIVFFlatConfig());
     ~GpuIndexIVFFlat() override;
@@ -69,37 +79,14 @@ class GpuIndexIVFFlat : public GpuIndexIVF {
     /// information
     void reset() override;
+    /// Should be called if the user ever changes the state of the IVF coarse
+    /// quantizer manually (e.g., substitutes a new instance or changes vectors
+    /// in the coarse quantizer outside the scope of training)
+    void updateQuantizer() override;
     /// Trains the coarse quantizer based on the given vector data
     void train(Index::idx_t n, const float* x) override;
-    /// Returns the number of vectors present in a particular inverted list
-    int getListLength(int listId) const override;
-    /// Return the encoded vector data contained in a particular inverted list,
-    /// for debugging purposes.
-    /// If gpuFormat is true, the data is returned as it is encoded in the
-    /// GPU-side representation.
-    /// Otherwise, it is converted to the CPU format.
-    /// compliant format, while the native GPU format may differ.
-    std::vector<uint8_t> getListVectorData(int listId, bool gpuFormat = false)
-            const override;
-    /// Return the vector indices contained in a particular inverted list, for
-    /// debugging purposes.
-    std::vector<Index::idx_t> getListIndices(int listId) const override;
-   protected:
-    /// Called from GpuIndex for add/add_with_ids
-    void addImpl_(int n, const float* x, const Index::idx_t* ids) override;
-    /// Called from GpuIndex for search
-    void searchImpl_(
-            int n,
-            const float* x,
-            int k,
-            float* distances,
-            Index::idx_t* labels) const override;
    protected:
     /// Our configuration options
     const GpuIndexIVFFlatConfig ivfFlatConfig_;
@@ -107,8 +94,8 @@ class GpuIndexIVFFlat : public GpuIndexIVF {
     /// Desired inverted list memory reservation
     size_t reserveMemoryVecs_;
-    /// Instance that we own; contains the inverted list
-    std::unique_ptr<IVFFlat> index_;
+    /// Instance that we own; contains the inverted lists
+    std::shared_ptr<IVFFlat> index_;
 };
 } // namespace gpu

data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h CHANGED Viewed

@@ -63,14 +63,27 @@ class GpuIndexIVFPQ : public GpuIndexIVF {
             const faiss::IndexIVFPQ* index,
             GpuIndexIVFPQConfig config = GpuIndexIVFPQConfig());
-    /// Construct an empty index
+    /// Constructs a new instance with an empty flat quantizer; the user
+    /// provides the number of IVF lists desired.
     GpuIndexIVFPQ(
             GpuResourcesProvider* provider,
             int dims,
             int nlist,
             int subQuantizers,
             int bitsPerCode,
-            faiss::MetricType metric,
+            faiss::MetricType metric = faiss::METRIC_L2,
+            GpuIndexIVFPQConfig config = GpuIndexIVFPQConfig());
+    /// Constructs a new instance with a provided CPU or GPU coarse quantizer;
+    /// the user provides the number of IVF lists desired.
+    GpuIndexIVFPQ(
+            GpuResourcesProvider* provider,
+            Index* coarseQuantizer,
+            int dims,
+            int nlist,
+            int subQuantizers,
+            int bitsPerCode,
+            faiss::MetricType metric = faiss::METRIC_L2,
             GpuIndexIVFPQConfig config = GpuIndexIVFPQConfig());
     ~GpuIndexIVFPQ() override;
@@ -112,44 +125,22 @@ class GpuIndexIVFPQ : public GpuIndexIVF {
     /// product centroid information
     void reset() override;
+    /// Should be called if the user ever changes the state of the IVF coarse
+    /// quantizer manually (e.g., substitutes a new instance or changes vectors
+    /// in the coarse quantizer outside the scope of training)
+    void updateQuantizer() override;
     /// Trains the coarse and product quantizer based on the given vector data
     void train(Index::idx_t n, const float* x) override;
-    /// Returns the number of vectors present in a particular inverted list
-    int getListLength(int listId) const override;
-    /// Return the encoded vector data contained in a particular inverted list,
-    /// for debugging purposes.
-    /// If gpuFormat is true, the data is returned as it is encoded in the
-    /// GPU-side representation.
-    /// Otherwise, it is converted to the CPU format.
-    /// compliant format, while the native GPU format may differ.
-    std::vector<uint8_t> getListVectorData(int listId, bool gpuFormat = false)
-            const override;
-    /// Return the vector indices contained in a particular inverted list, for
-    /// debugging purposes.
-    std::vector<Index::idx_t> getListIndices(int listId) const override;
    public:
     /// Like the CPU version, we expose a publicly-visible ProductQuantizer
     /// for manipulation
     ProductQuantizer pq;
    protected:
-    /// Called from GpuIndex for add/add_with_ids
-    void addImpl_(int n, const float* x, const Index::idx_t* ids) override;
-    /// Called from GpuIndex for search
-    void searchImpl_(
-            int n,
-            const float* x,
-            int k,
-            float* distances,
-            Index::idx_t* labels) const override;
     /// Throws errors if configuration settings are improper
-    void verifySettings_() const;
+    void verifyPQSettings_() const;
     /// Trains the PQ quantizer based on the given vector data
     void trainResidualQuantizer_(Index::idx_t n, const float* x);
@@ -172,7 +163,7 @@ class GpuIndexIVFPQ : public GpuIndexIVF {
     /// The product quantizer instance that we own; contains the
     /// inverted lists
-    std::unique_ptr<IVFPQ> index_;
+    std::shared_ptr<IVFPQ> index_;
 };
 } // namespace gpu

data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h CHANGED Viewed

@@ -38,7 +38,7 @@ class GpuIndexIVFScalarQuantizer : public GpuIndexIVF {
                     GpuIndexIVFScalarQuantizerConfig());
     /// Constructs a new instance with an empty flat quantizer; the user
-    /// provides the number of lists desired.
+    /// provides the number of IVF lists desired.
     GpuIndexIVFScalarQuantizer(
             GpuResourcesProvider* provider,
             int dims,
@@ -49,6 +49,19 @@ class GpuIndexIVFScalarQuantizer : public GpuIndexIVF {
             GpuIndexIVFScalarQuantizerConfig config =
                     GpuIndexIVFScalarQuantizerConfig());
+    /// Constructs a new instance with a provided CPU or GPU coarse quantizer;
+    /// the user provides the number of IVF lists desired.
+    GpuIndexIVFScalarQuantizer(
+            GpuResourcesProvider* provider,
+            Index* coarseQuantizer,
+            int dims,
+            int nlist,
+            faiss::ScalarQuantizer::QuantizerType qtype,
+            faiss::MetricType metric = MetricType::METRIC_L2,
+            bool encodeResidual = true,
+            GpuIndexIVFScalarQuantizerConfig config =
+                    GpuIndexIVFScalarQuantizerConfig());
     ~GpuIndexIVFScalarQuantizer() override;
     /// Reserve GPU memory in our inverted lists for this number of vectors
@@ -70,36 +83,17 @@ class GpuIndexIVFScalarQuantizer : public GpuIndexIVF {
     /// quantizer information
     void reset() override;
+    /// Should be called if the user ever changes the state of the IVF coarse
+    /// quantizer manually (e.g., substitutes a new instance or changes vectors
+    /// in the coarse quantizer outside the scope of training)
+    void updateQuantizer() override;
     /// Trains the coarse and scalar quantizer based on the given vector data
     void train(Index::idx_t n, const float* x) override;
-    /// Returns the number of vectors present in a particular inverted list
-    int getListLength(int listId) const override;
-    /// Return the encoded vector data contained in a particular inverted list,
-    /// for debugging purposes.
-    /// If gpuFormat is true, the data is returned as it is encoded in the
-    /// GPU-side representation.
-    /// Otherwise, it is converted to the CPU format.
-    /// compliant format, while the native GPU format may differ.
-    std::vector<uint8_t> getListVectorData(int listId, bool gpuFormat = false)
-            const override;
-    /// Return the vector indices contained in a particular inverted list, for
-    /// debugging purposes.
-    std::vector<Index::idx_t> getListIndices(int listId) const override;
    protected:
-    /// Called from GpuIndex for add/add_with_ids
-    void addImpl_(int n, const float* x, const Index::idx_t* ids) override;
-    /// Called from GpuIndex for search
-    void searchImpl_(
-            int n,
-            const float* x,
-            int k,
-            float* distances,
-            Index::idx_t* labels) const override;
+    /// Validates index SQ parameters
+    void verifySQSettings_() const;
     /// Called from train to handle SQ residual training
     void trainResiduals_(Index::idx_t n, const float* x);
@@ -119,7 +113,7 @@ class GpuIndexIVFScalarQuantizer : public GpuIndexIVF {
     size_t reserveMemoryVecs_;
     /// Instance that we own; contains the inverted list
-    std::unique_ptr<IVFFlat> index_;
+    std::shared_ptr<IVFFlat> index_;
 };
 } // namespace gpu

data/vendor/faiss/faiss/gpu/GpuResources.cpp CHANGED Viewed

@@ -184,5 +184,19 @@ size_t GpuResources::getTempMemoryAvailableCurrentDevice() const {
 GpuResourcesProvider::~GpuResourcesProvider() {}
+//
+// GpuResourcesProviderFromInstance
+//
+GpuResourcesProviderFromInstance::GpuResourcesProviderFromInstance(
+        std::shared_ptr<GpuResources> p)
+        : res_(p) {}
+GpuResourcesProviderFromInstance::~GpuResourcesProviderFromInstance() {}
+std::shared_ptr<GpuResources> GpuResourcesProviderFromInstance::getResources() {
+    return res_;
+}
 } // namespace gpu
 } // namespace faiss

data/vendor/faiss/faiss/gpu/GpuResources.h CHANGED Viewed

@@ -28,8 +28,7 @@ enum AllocType {
     FlatData = 1,
     /// Primary data storage for GpuIndexIVF* (the storage for each individual
-    /// IVF
-    /// list)
+    /// IVF list)
     IVFLists = 2,
     /// Quantizer (PQ, SQ) dictionary information
@@ -251,7 +250,8 @@ class GpuResources {
     cudaStream_t getAsyncCopyStreamCurrentDevice();
 };
-/// Interface for a provider of a shared resources object
+/// Interface for a provider of a shared resources object. This is to avoid
+/// interfacing std::shared_ptr to Python
 class GpuResourcesProvider {
    public:
     virtual ~GpuResourcesProvider();
@@ -260,5 +260,18 @@ class GpuResourcesProvider {
     virtual std::shared_ptr<GpuResources> getResources() = 0;
 };
+/// A simple wrapper for a GpuResources object to make a GpuResourcesProvider
+/// out of it again
+class GpuResourcesProviderFromInstance : public GpuResourcesProvider {
+   public:
+    explicit GpuResourcesProviderFromInstance(std::shared_ptr<GpuResources> p);
+    ~GpuResourcesProviderFromInstance() override;
+    std::shared_ptr<GpuResources> getResources() override;
+   private:
+    std::shared_ptr<GpuResources> res_;
+};
 } // namespace gpu
 } // namespace faiss

data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp CHANGED Viewed

@@ -268,6 +268,9 @@ void StandardGpuResourcesImpl::initializeForDevice(int device) {
         return;
     }
+    FAISS_ASSERT(device < getNumDevices());
+    DeviceScope scope(device);
     // If this is the first device that we're initializing, create our
     // pinned memory allocation
     if (defaultStreams_.empty() && pinnedMemSize_ > 0) {
@@ -285,9 +288,6 @@ void StandardGpuResourcesImpl::initializeForDevice(int device) {
         pinnedMemAllocSize_ = pinnedMemSize_;
     }
-    FAISS_ASSERT(device < getNumDevices());
-    DeviceScope scope(device);
     // Make sure that device properties for all devices are cached
     auto& prop = getDeviceProperties(device);