RubyGems - faiss - Versions diffs - 0.2.0 → 0.2.4 - Mend

faiss 0.2.0 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (215)

checksums.yaml +4 -4
data/CHANGELOG.md +16 -0
data/LICENSE.txt +1 -1
data/README.md +7 -7
data/ext/faiss/extconf.rb +6 -3
data/ext/faiss/numo.hpp +4 -4
data/ext/faiss/utils.cpp +1 -1
data/ext/faiss/utils.h +1 -1
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +292 -291
data/vendor/faiss/faiss/AutoTune.h +55 -56
data/vendor/faiss/faiss/Clustering.cpp +365 -194
data/vendor/faiss/faiss/Clustering.h +102 -35
data/vendor/faiss/faiss/IVFlib.cpp +171 -195
data/vendor/faiss/faiss/IVFlib.h +48 -51
data/vendor/faiss/faiss/Index.cpp +85 -103
data/vendor/faiss/faiss/Index.h +54 -48
data/vendor/faiss/faiss/Index2Layer.cpp +126 -224
data/vendor/faiss/faiss/Index2Layer.h +22 -36
data/vendor/faiss/faiss/IndexAdditiveQuantizer.cpp +407 -0
data/vendor/faiss/faiss/IndexAdditiveQuantizer.h +195 -0
data/vendor/faiss/faiss/IndexBinary.cpp +45 -37
data/vendor/faiss/faiss/IndexBinary.h +140 -132
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +73 -53
data/vendor/faiss/faiss/IndexBinaryFlat.h +29 -24
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +46 -43
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +16 -15
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +215 -232
data/vendor/faiss/faiss/IndexBinaryHNSW.h +25 -24
data/vendor/faiss/faiss/IndexBinaryHash.cpp +182 -177
data/vendor/faiss/faiss/IndexBinaryHash.h +41 -34
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +489 -461
data/vendor/faiss/faiss/IndexBinaryIVF.h +97 -68
data/vendor/faiss/faiss/IndexFlat.cpp +115 -176
data/vendor/faiss/faiss/IndexFlat.h +42 -59
data/vendor/faiss/faiss/IndexFlatCodes.cpp +67 -0
data/vendor/faiss/faiss/IndexFlatCodes.h +47 -0
data/vendor/faiss/faiss/IndexHNSW.cpp +372 -348
data/vendor/faiss/faiss/IndexHNSW.h +57 -41
data/vendor/faiss/faiss/IndexIVF.cpp +545 -453
data/vendor/faiss/faiss/IndexIVF.h +169 -118
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +316 -0
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.h +121 -0
data/vendor/faiss/faiss/IndexIVFFlat.cpp +247 -252
data/vendor/faiss/faiss/IndexIVFFlat.h +48 -51
data/vendor/faiss/faiss/IndexIVFPQ.cpp +459 -517
data/vendor/faiss/faiss/IndexIVFPQ.h +75 -67
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +406 -372
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +82 -57
data/vendor/faiss/faiss/IndexIVFPQR.cpp +104 -102
data/vendor/faiss/faiss/IndexIVFPQR.h +33 -28
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +163 -150
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +38 -25
data/vendor/faiss/faiss/IndexLSH.cpp +66 -113
data/vendor/faiss/faiss/IndexLSH.h +20 -38
data/vendor/faiss/faiss/IndexLattice.cpp +42 -56
data/vendor/faiss/faiss/IndexLattice.h +11 -16
data/vendor/faiss/faiss/IndexNNDescent.cpp +229 -0
data/vendor/faiss/faiss/IndexNNDescent.h +72 -0
data/vendor/faiss/faiss/IndexNSG.cpp +301 -0
data/vendor/faiss/faiss/IndexNSG.h +85 -0
data/vendor/faiss/faiss/IndexPQ.cpp +387 -495
data/vendor/faiss/faiss/IndexPQ.h +64 -82
data/vendor/faiss/faiss/IndexPQFastScan.cpp +143 -170
data/vendor/faiss/faiss/IndexPQFastScan.h +46 -32
data/vendor/faiss/faiss/IndexPreTransform.cpp +120 -150
data/vendor/faiss/faiss/IndexPreTransform.h +33 -36
data/vendor/faiss/faiss/IndexRefine.cpp +139 -127
data/vendor/faiss/faiss/IndexRefine.h +32 -23
data/vendor/faiss/faiss/IndexReplicas.cpp +147 -153
data/vendor/faiss/faiss/IndexReplicas.h +62 -56
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +111 -172
data/vendor/faiss/faiss/IndexScalarQuantizer.h +41 -59
data/vendor/faiss/faiss/IndexShards.cpp +256 -240
data/vendor/faiss/faiss/IndexShards.h +85 -73
data/vendor/faiss/faiss/MatrixStats.cpp +112 -97
data/vendor/faiss/faiss/MatrixStats.h +7 -10
data/vendor/faiss/faiss/MetaIndexes.cpp +135 -157
data/vendor/faiss/faiss/MetaIndexes.h +40 -34
data/vendor/faiss/faiss/MetricType.h +7 -7
data/vendor/faiss/faiss/VectorTransform.cpp +654 -475
data/vendor/faiss/faiss/VectorTransform.h +64 -89
data/vendor/faiss/faiss/clone_index.cpp +78 -73
data/vendor/faiss/faiss/clone_index.h +4 -9
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +33 -38
data/vendor/faiss/faiss/gpu/GpuAutoTune.h +11 -9
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +198 -171
data/vendor/faiss/faiss/gpu/GpuCloner.h +53 -35
data/vendor/faiss/faiss/gpu/GpuClonerOptions.cpp +12 -14
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +27 -25
data/vendor/faiss/faiss/gpu/GpuDistance.h +116 -112
data/vendor/faiss/faiss/gpu/GpuFaissAssert.h +1 -2
data/vendor/faiss/faiss/gpu/GpuIcmEncoder.h +60 -0
data/vendor/faiss/faiss/gpu/GpuIndex.h +134 -137
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +76 -73
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +173 -162
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +67 -64
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +89 -86
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +150 -141
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +101 -103
data/vendor/faiss/faiss/gpu/GpuIndicesOptions.h +17 -16
data/vendor/faiss/faiss/gpu/GpuResources.cpp +116 -128
data/vendor/faiss/faiss/gpu/GpuResources.h +182 -186
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +433 -422
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +131 -130
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.cpp +468 -456
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.h +25 -19
data/vendor/faiss/faiss/gpu/impl/RemapIndices.cpp +22 -20
data/vendor/faiss/faiss/gpu/impl/RemapIndices.h +9 -8
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +39 -44
data/vendor/faiss/faiss/gpu/perf/IndexWrapper.h +16 -14
data/vendor/faiss/faiss/gpu/perf/PerfClustering.cpp +77 -71
data/vendor/faiss/faiss/gpu/perf/PerfIVFPQAdd.cpp +109 -88
data/vendor/faiss/faiss/gpu/perf/WriteIndex.cpp +75 -64
data/vendor/faiss/faiss/gpu/test/TestCodePacking.cpp +230 -215
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +80 -86
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +284 -277
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +416 -416
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFPQ.cpp +611 -517
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFScalarQuantizer.cpp +166 -164
data/vendor/faiss/faiss/gpu/test/TestGpuMemoryException.cpp +61 -53
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +274 -238
data/vendor/faiss/faiss/gpu/test/TestUtils.h +73 -57
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +47 -50
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +79 -72
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.cpp +140 -146
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.h +69 -71
data/vendor/faiss/faiss/gpu/utils/StaticUtils.h +21 -16
data/vendor/faiss/faiss/gpu/utils/Timer.cpp +25 -29
data/vendor/faiss/faiss/gpu/utils/Timer.h +30 -29
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +503 -0
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +175 -0
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +90 -120
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +81 -65
data/vendor/faiss/faiss/impl/FaissAssert.h +73 -58
data/vendor/faiss/faiss/impl/FaissException.cpp +56 -48
data/vendor/faiss/faiss/impl/FaissException.h +41 -29
data/vendor/faiss/faiss/impl/HNSW.cpp +606 -617
data/vendor/faiss/faiss/impl/HNSW.h +179 -200
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +855 -0
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +244 -0
data/vendor/faiss/faiss/impl/NNDescent.cpp +487 -0
data/vendor/faiss/faiss/impl/NNDescent.h +154 -0
data/vendor/faiss/faiss/impl/NSG.cpp +679 -0
data/vendor/faiss/faiss/impl/NSG.h +199 -0
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +484 -454
data/vendor/faiss/faiss/impl/PolysemousTraining.h +52 -55
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +26 -47
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +469 -459
data/vendor/faiss/faiss/impl/ProductQuantizer.h +76 -87
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +758 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +188 -0
data/vendor/faiss/faiss/impl/ResultHandler.h +96 -132
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +647 -707
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +48 -46
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +129 -131
data/vendor/faiss/faiss/impl/ThreadedIndex.h +61 -55
data/vendor/faiss/faiss/impl/index_read.cpp +631 -480
data/vendor/faiss/faiss/impl/index_write.cpp +547 -407
data/vendor/faiss/faiss/impl/io.cpp +76 -95
data/vendor/faiss/faiss/impl/io.h +31 -41
data/vendor/faiss/faiss/impl/io_macros.h +60 -29
data/vendor/faiss/faiss/impl/kmeans1d.cpp +301 -0
data/vendor/faiss/faiss/impl/kmeans1d.h +48 -0
data/vendor/faiss/faiss/impl/lattice_Zn.cpp +137 -186
data/vendor/faiss/faiss/impl/lattice_Zn.h +40 -51
data/vendor/faiss/faiss/impl/platform_macros.h +29 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +77 -124
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +39 -48
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +41 -52
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +80 -117
data/vendor/faiss/faiss/impl/simd_result_handlers.h +109 -137
data/vendor/faiss/faiss/index_factory.cpp +619 -397
data/vendor/faiss/faiss/index_factory.h +8 -6
data/vendor/faiss/faiss/index_io.h +23 -26
data/vendor/faiss/faiss/invlists/BlockInvertedLists.cpp +67 -75
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +22 -24
data/vendor/faiss/faiss/invlists/DirectMap.cpp +96 -112
data/vendor/faiss/faiss/invlists/DirectMap.h +29 -33
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +307 -364
data/vendor/faiss/faiss/invlists/InvertedLists.h +151 -151
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +29 -34
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.h +17 -18
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +257 -293
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +50 -45
data/vendor/faiss/faiss/python/python_callbacks.cpp +23 -26
data/vendor/faiss/faiss/python/python_callbacks.h +9 -16
data/vendor/faiss/faiss/utils/AlignedTable.h +79 -44
data/vendor/faiss/faiss/utils/Heap.cpp +40 -48
data/vendor/faiss/faiss/utils/Heap.h +186 -209
data/vendor/faiss/faiss/utils/WorkerThread.cpp +67 -76
data/vendor/faiss/faiss/utils/WorkerThread.h +32 -33
data/vendor/faiss/faiss/utils/distances.cpp +305 -312
data/vendor/faiss/faiss/utils/distances.h +170 -122
data/vendor/faiss/faiss/utils/distances_simd.cpp +498 -508
data/vendor/faiss/faiss/utils/extra_distances-inl.h +117 -0
data/vendor/faiss/faiss/utils/extra_distances.cpp +113 -232
data/vendor/faiss/faiss/utils/extra_distances.h +30 -29
data/vendor/faiss/faiss/utils/hamming-inl.h +260 -209
data/vendor/faiss/faiss/utils/hamming.cpp +375 -469
data/vendor/faiss/faiss/utils/hamming.h +62 -85
data/vendor/faiss/faiss/utils/ordered_key_value.h +16 -18
data/vendor/faiss/faiss/utils/partitioning.cpp +393 -318
data/vendor/faiss/faiss/utils/partitioning.h +26 -21
data/vendor/faiss/faiss/utils/quantize_lut.cpp +78 -66
data/vendor/faiss/faiss/utils/quantize_lut.h +22 -20
data/vendor/faiss/faiss/utils/random.cpp +39 -63
data/vendor/faiss/faiss/utils/random.h +13 -16
data/vendor/faiss/faiss/utils/simdlib.h +4 -2
data/vendor/faiss/faiss/utils/simdlib_avx2.h +88 -85
data/vendor/faiss/faiss/utils/simdlib_emulated.h +226 -165
data/vendor/faiss/faiss/utils/simdlib_neon.h +832 -0
data/vendor/faiss/faiss/utils/utils.cpp +304 -287
data/vendor/faiss/faiss/utils/utils.h +54 -49
metadata +29 -4

data/vendor/faiss/faiss/IndexIVFPQFastScan.h CHANGED Viewed

@@ -15,7 +15,6 @@
 namespace faiss {
 /** Fast scan version of IVFPQ. Works for 4-bit PQ for now.
  *
  * The codes in the inverted lists are not stored sequentially but
@@ -32,13 +31,12 @@ namespace faiss {
  * 13: idem, collect results in reservoir
  */
-struct IndexIVFPQFastScan: IndexIVF {
-    bool by_residual;              ///< Encode residual or plain vector?
-    ProductQuantizer pq;           ///< produces the codes
+struct IndexIVFPQFastScan : IndexIVF {
+    bool by_residual;    ///< Encode residual or plain vector?
+    ProductQuantizer pq; ///< produces the codes
     // size of the kernel
-    int bbs;  // set at build time
+    int bbs; // set at build time
     // M rounded up to a multiple of 2
     size_t M2;
@@ -57,88 +55,114 @@ struct IndexIVFPQFastScan: IndexIVF {
     int qbs = 0;
     size_t qbs2 = 0;
-    IndexIVFPQFastScan (
-            Index * quantizer, size_t d, size_t nlist,
-            size_t M, size_t nbits_per_idx,
-            MetricType metric = METRIC_L2, int bbs = 32);
+    IndexIVFPQFastScan(
+            Index* quantizer,
+            size_t d,
+            size_t nlist,
+            size_t M,
+            size_t nbits_per_idx,
+            MetricType metric = METRIC_L2,
+            int bbs = 32);
-    IndexIVFPQFastScan ();
+    IndexIVFPQFastScan();
     // built from an IndexIVFPQ
-    explicit IndexIVFPQFastScan(const IndexIVFPQ & orig, int bbs = 32);
+    explicit IndexIVFPQFastScan(const IndexIVFPQ& orig, int bbs = 32);
     /// orig's inverted lists (for debugging)
-    InvertedLists * orig_invlists = nullptr;
+    InvertedLists* orig_invlists = nullptr;
-    void train_residual (idx_t n, const float *x) override;
+    void train_residual(idx_t n, const float* x) override;
     /// build precomputed table, possibly updating use_precomputed_table
-    void precompute_table ();
+    void precompute_table();
     /// same as the regular IVFPQ encoder. The codes are not reorganized by
     /// blocks a that point
     void encode_vectors(
-            idx_t n, const float* x,
-            const idx_t *list_nos, uint8_t * codes,
+            idx_t n,
+            const float* x,
+            const idx_t* list_nos,
+            uint8_t* codes,
             bool include_listno = false) const override;
-    void add_with_ids (
-        idx_t n, const float * x, const idx_t *xids) override;
+    void add_with_ids(idx_t n, const float* x, const idx_t* xids) override;
     void search(
-            idx_t n, const float* x, idx_t k,
-            float* distances, idx_t* labels) const override;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const override;
     // prepare look-up tables
     void compute_LUT(
-        size_t n, const float *x,
-        const idx_t *coarse_ids, const float *coarse_dis,
-        AlignedTable<float> & dis_tables,
-        AlignedTable<float> & biases
-    ) const;
+            size_t n,
+            const float* x,
+            const idx_t* coarse_ids,
+            const float* coarse_dis,
+            AlignedTable<float>& dis_tables,
+            AlignedTable<float>& biases) const;
     void compute_LUT_uint8(
-        size_t n, const float *x,
-        const idx_t *coarse_ids, const float *coarse_dis,
-        AlignedTable<uint8_t> & dis_tables,
-        AlignedTable<uint16_t> & biases,
-        float * normalizers
-    ) const;
+            size_t n,
+            const float* x,
+            const idx_t* coarse_ids,
+            const float* coarse_dis,
+            AlignedTable<uint8_t>& dis_tables,
+            AlignedTable<uint16_t>& biases,
+            float* normalizers) const;
     // internal search funcs
-    template<bool is_max>
+    template <bool is_max>
     void search_dispatch_implem(
-            idx_t n, const float* x, idx_t k,
-            float* distances, idx_t* labels) const;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const;
-    template<class C>
+    template <class C>
     void search_implem_1(
-            idx_t n, const float* x, idx_t k,
-            float* distances, idx_t* labels) const;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const;
-    template<class C>
+    template <class C>
     void search_implem_2(
-            idx_t n, const float* x, idx_t k,
-            float* distances, idx_t* labels) const;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const;
     // implem 10 and 12 are not multithreaded internally, so
     // export search stats
-    template<class C>
+    template <class C>
     void search_implem_10(
-            idx_t n, const float* x, idx_t k,
-            float* distances, idx_t* labels,
-            int impl, size_t *ndis_out, size_t *nlist_out) const;
-    template<class C>
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels,
+            int impl,
+            size_t* ndis_out,
+            size_t* nlist_out) const;
+    template <class C>
     void search_implem_12(
-            idx_t n, const float* x, idx_t k,
-            float* distances, idx_t* labels,
-            int impl, size_t *ndis_out, size_t *nlist_out) const;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels,
+            int impl,
+            size_t* ndis_out,
+            size_t* nlist_out) const;
 };
 struct IVFFastScanStats {
@@ -148,13 +172,15 @@ struct IVFFastScanStats {
     uint64_t reservoir_times[4];
     double Mcy_at(int i) {
-        return times[i] / (1000*1000.0);
+        return times[i] / (1000 * 1000.0);
     }
     double Mcy_reservoir_at(int i) {
-        return reservoir_times[i] / (1000*1000.0);
+        return reservoir_times[i] / (1000 * 1000.0);
+    }
+    IVFFastScanStats() {
+        reset();
     }
-    IVFFastScanStats() {reset();}
     void reset() {
         memset(this, 0, sizeof(*this));
     }
@@ -162,5 +188,4 @@ struct IVFFastScanStats {
 FAISS_API extern IVFFastScanStats IVFFastScan_stats;
 } // namespace faiss

data/vendor/faiss/faiss/IndexIVFPQR.cpp CHANGED Viewed

@@ -12,115 +12,116 @@
 #include <cinttypes>
 #include <faiss/utils/Heap.h>
-#include <faiss/utils/utils.h>
 #include <faiss/utils/distances.h>
+#include <faiss/utils/utils.h>
 #include <faiss/impl/FaissAssert.h>
 namespace faiss {
 /*****************************************
  * IndexIVFPQR implementation
  ******************************************/
-IndexIVFPQR::IndexIVFPQR (
-            Index * quantizer, size_t d, size_t nlist,
-            size_t M, size_t nbits_per_idx,
-            size_t M_refine, size_t nbits_per_idx_refine):
-    IndexIVFPQ (quantizer, d, nlist, M, nbits_per_idx),
-    refine_pq (d, M_refine, nbits_per_idx_refine),
-    k_factor (4)
-{
+IndexIVFPQR::IndexIVFPQR(
+        Index* quantizer,
+        size_t d,
+        size_t nlist,
+        size_t M,
+        size_t nbits_per_idx,
+        size_t M_refine,
+        size_t nbits_per_idx_refine)
+        : IndexIVFPQ(quantizer, d, nlist, M, nbits_per_idx),
+          refine_pq(d, M_refine, nbits_per_idx_refine),
+          k_factor(4) {
     by_residual = true;
 }
-IndexIVFPQR::IndexIVFPQR ():
-    k_factor (1)
-{
+IndexIVFPQR::IndexIVFPQR() : k_factor(1) {
     by_residual = true;
 }
-void IndexIVFPQR::reset()
-{
+void IndexIVFPQR::reset() {
     IndexIVFPQ::reset();
     refine_codes.clear();
 }
+void IndexIVFPQR::train_residual(idx_t n, const float* x) {
+    float* residual_2 = new float[n * d];
+    ScopeDeleter<float> del(residual_2);
-void IndexIVFPQR::train_residual (idx_t n, const float *x)
-{
-    float * residual_2 = new float [n * d];
-    ScopeDeleter <float> del(residual_2);
-    train_residual_o (n, x, residual_2);
+    train_residual_o(n, x, residual_2);
     if (verbose)
-        printf ("training %zdx%zd 2nd level PQ quantizer on %" PRId64 " %dD-vectors\n",
-                refine_pq.M, refine_pq.ksub, n, d);
+        printf("training %zdx%zd 2nd level PQ quantizer on %" PRId64
+               " %dD-vectors\n",
+               refine_pq.M,
+               refine_pq.ksub,
+               n,
+               d);
     refine_pq.cp.max_points_per_centroid = 1000;
     refine_pq.cp.verbose = verbose;
-    refine_pq.train (n, residual_2);
+    refine_pq.train(n, residual_2);
 }
-void IndexIVFPQR::add_with_ids (idx_t n, const float *x, const idx_t *xids) {
-    add_core (n, x, xids, nullptr);
+void IndexIVFPQR::add_with_ids(idx_t n, const float* x, const idx_t* xids) {
+    add_core(n, x, xids, nullptr);
 }
-void IndexIVFPQR::add_core (idx_t n, const float *x, const idx_t *xids,
-                                const idx_t *precomputed_idx) {
-    float * residual_2 = new float [n * d];
-    ScopeDeleter <float> del(residual_2);
+void IndexIVFPQR::add_core(
+        idx_t n,
+        const float* x,
+        const idx_t* xids,
+        const idx_t* precomputed_idx) {
+    float* residual_2 = new float[n * d];
+    ScopeDeleter<float> del(residual_2);
     idx_t n0 = ntotal;
-    add_core_o (n, x, xids, residual_2, precomputed_idx);
-    refine_codes.resize (ntotal * refine_pq.code_size);
-    refine_pq.compute_codes (
-        residual_2, &refine_codes[n0 * refine_pq.code_size], n);
+    add_core_o(n, x, xids, residual_2, precomputed_idx);
+    refine_codes.resize(ntotal * refine_pq.code_size);
+    refine_pq.compute_codes(
+            residual_2, &refine_codes[n0 * refine_pq.code_size], n);
 }
 #define TIC t0 = get_cycles()
-#define TOC get_cycles () - t0
-void IndexIVFPQR::search_preassigned (
-        idx_t n, const float *x, idx_t k,
-        const idx_t *idx, const float *L1_dis,
-        float *distances, idx_t *labels,
+#define TOC get_cycles() - t0
+void IndexIVFPQR::search_preassigned(
+        idx_t n,
+        const float* x,
+        idx_t k,
+        const idx_t* idx,
+        const float* L1_dis,
+        float* distances,
+        idx_t* labels,
         bool store_pairs,
-        const IVFSearchParameters *params, IndexIVFStats *stats
-        ) const
-{
+        const IVFSearchParameters* params,
+        IndexIVFStats* stats) const {
     uint64_t t0;
     TIC;
     size_t k_coarse = long(k * k_factor);
-    idx_t *coarse_labels = new idx_t [k_coarse * n];
-    ScopeDeleter<idx_t> del1 (coarse_labels);
+    idx_t* coarse_labels = new idx_t[k_coarse * n];
+    ScopeDeleter<idx_t> del1(coarse_labels);
     { // query with quantizer levels 1 and 2.
-        float *coarse_distances = new float [k_coarse * n];
+        float* coarse_distances = new float[k_coarse * n];
         ScopeDeleter<float> del(coarse_distances);
-        IndexIVFPQ::search_preassigned (
-                   n, x, k_coarse,
-                   idx, L1_dis, coarse_distances, coarse_labels,
-                   true, params);
+        IndexIVFPQ::search_preassigned(
+                n,
+                x,
+                k_coarse,
+                idx,
+                L1_dis,
+                coarse_distances,
+                coarse_labels,
+                true,
+                params);
     }
     indexIVFPQ_stats.search_cycles += TOC;
     TIC;
@@ -130,91 +131,92 @@ void IndexIVFPQR::search_preassigned (
 #pragma omp parallel reduction(+ : n_refine)
     {
         // tmp buffers
-        float *residual_1 = new float [2 * d];
-        ScopeDeleter<float> del (residual_1);
-        float *residual_2 = residual_1 + d;
+        float* residual_1 = new float[2 * d];
+        ScopeDeleter<float> del(residual_1);
+        float* residual_2 = residual_1 + d;
 #pragma omp for
         for (idx_t i = 0; i < n; i++) {
-            const float *xq = x + i * d;
-            const idx_t * shortlist = coarse_labels + k_coarse * i;
-            float * heap_sim = distances + k * i;
-            idx_t * heap_ids = labels + k * i;
-            maxheap_heapify (k, heap_sim, heap_ids);
+            const float* xq = x + i * d;
+            const idx_t* shortlist = coarse_labels + k_coarse * i;
+            float* heap_sim = distances + k * i;
+            idx_t* heap_ids = labels + k * i;
+            maxheap_heapify(k, heap_sim, heap_ids);
             for (int j = 0; j < k_coarse; j++) {
                 idx_t sl = shortlist[j];
-                if (sl == -1) continue;
+                if (sl == -1)
+                    continue;
                 int list_no = lo_listno(sl);
                 int ofs = lo_offset(sl);
-                assert (list_no >= 0 && list_no < nlist);
-                assert (ofs >= 0 && ofs < invlists->list_size (list_no));
+                assert(list_no >= 0 && list_no < nlist);
+                assert(ofs >= 0 && ofs < invlists->list_size(list_no));
                 // 1st level residual
-                quantizer->compute_residual (xq, residual_1, list_no);
+                quantizer->compute_residual(xq, residual_1, list_no);
                 // 2nd level residual
-                const uint8_t * l2code =
-                    invlists->get_single_code (list_no, ofs);
+                const uint8_t* l2code = invlists->get_single_code(list_no, ofs);
-                pq.decode (l2code, residual_2);
+                pq.decode(l2code, residual_2);
                 for (int l = 0; l < d; l++)
                     residual_2[l] = residual_1[l] - residual_2[l];
                 // 3rd level residual's approximation
-                idx_t id = invlists->get_single_id (list_no, ofs);
-                assert (0 <= id && id < ntotal);
-                refine_pq.decode (&refine_codes [id * refine_pq.code_size],
-                                  residual_1);
+                idx_t id = invlists->get_single_id(list_no, ofs);
+                assert(0 <= id && id < ntotal);
+                refine_pq.decode(
+                        &refine_codes[id * refine_pq.code_size], residual_1);
-                float dis = fvec_L2sqr (residual_1, residual_2, d);
+                float dis = fvec_L2sqr(residual_1, residual_2, d);
                 if (dis < heap_sim[0]) {
                     idx_t id_or_pair = store_pairs ? sl : id;
-                    maxheap_replace_top (k, heap_sim, heap_ids, dis, id_or_pair);
+                    maxheap_replace_top(k, heap_sim, heap_ids, dis, id_or_pair);
                 }
-                n_refine ++;
+                n_refine++;
             }
-            maxheap_reorder (k, heap_sim, heap_ids);
+            maxheap_reorder(k, heap_sim, heap_ids);
         }
     }
     indexIVFPQ_stats.nrefine += n_refine;
     indexIVFPQ_stats.refine_cycles += TOC;
 }
-void IndexIVFPQR::reconstruct_from_offset (int64_t list_no, int64_t offset,
-                                           float* recons) const
-{
-    IndexIVFPQ::reconstruct_from_offset (list_no, offset, recons);
+void IndexIVFPQR::reconstruct_from_offset(
+        int64_t list_no,
+        int64_t offset,
+        float* recons) const {
+    IndexIVFPQ::reconstruct_from_offset(list_no, offset, recons);
-    idx_t id = invlists->get_single_id (list_no, offset);
-    assert (0 <= id && id < ntotal);
+    idx_t id = invlists->get_single_id(list_no, offset);
+    assert(0 <= id && id < ntotal);
     std::vector<float> r3(d);
-    refine_pq.decode (&refine_codes [id * refine_pq.code_size], r3.data());
+    refine_pq.decode(&refine_codes[id * refine_pq.code_size], r3.data());
     for (int i = 0; i < d; ++i) {
-      recons[i] += r3[i];
+        recons[i] += r3[i];
     }
 }
-void IndexIVFPQR::merge_from (IndexIVF &other_in, idx_t add_id)
-{
-    IndexIVFPQR *other = dynamic_cast<IndexIVFPQR *> (&other_in);
+void IndexIVFPQR::merge_from(IndexIVF& other_in, idx_t add_id) {
+    IndexIVFPQR* other = dynamic_cast<IndexIVFPQR*>(&other_in);
     FAISS_THROW_IF_NOT(other);
-    IndexIVF::merge_from (other_in, add_id);
+    IndexIVF::merge_from(other_in, add_id);
-    refine_codes.insert (refine_codes.end(),
-                         other->refine_codes.begin(),
-                         other->refine_codes.end());
+    refine_codes.insert(
+            refine_codes.end(),
+            other->refine_codes.begin(),
+            other->refine_codes.end());
     other->refine_codes.clear();
 }
 size_t IndexIVFPQR::remove_ids(const IDSelector& /*sel*/) {
-  FAISS_THROW_MSG("not implemented");
-  return 0;
+    FAISS_THROW_MSG("not implemented");
+    return 0;
 }
 } // namespace faiss

data/vendor/faiss/faiss/IndexIVFPQR.h CHANGED Viewed

@@ -13,23 +13,24 @@
 #include <faiss/IndexIVFPQ.h>
 namespace faiss {
 /** Index with an additional level of PQ refinement */
-struct IndexIVFPQR: IndexIVFPQ {
-    ProductQuantizer refine_pq;           ///< 3rd level quantizer
-    std::vector <uint8_t> refine_codes;   ///< corresponding codes
+struct IndexIVFPQR : IndexIVFPQ {
+    ProductQuantizer refine_pq;        ///< 3rd level quantizer
+    std::vector<uint8_t> refine_codes; ///< corresponding codes
     /// factor between k requested in search and the k requested from the IVFPQ
     float k_factor;
-    IndexIVFPQR (
-            Index * quantizer, size_t d, size_t nlist,
-            size_t M, size_t nbits_per_idx,
-            size_t M_refine, size_t nbits_per_idx_refine);
+    IndexIVFPQR(
+            Index* quantizer,
+            size_t d,
+            size_t nlist,
+            size_t M,
+            size_t nbits_per_idx,
+            size_t M_refine,
+            size_t nbits_per_idx_refine);
     void reset() override;
@@ -41,26 +42,30 @@ struct IndexIVFPQR: IndexIVFPQ {
     void add_with_ids(idx_t n, const float* x, const idx_t* xids) override;
     /// same as add_with_ids, but optionally use the precomputed list ids
-    void add_core (idx_t n, const float *x, const idx_t *xids,
-                     const idx_t *precomputed_idx = nullptr);
-    void reconstruct_from_offset (int64_t list_no, int64_t offset,
-                                  float* recons) const override;
-    void merge_from (IndexIVF &other, idx_t add_id) override;
-    void search_preassigned (idx_t n, const float *x, idx_t k,
-                             const idx_t *assign,
-                             const float *centroid_dis,
-                             float *distances, idx_t *labels,
-                             bool store_pairs,
-                             const IVFSearchParameters *params=nullptr,
-                             IndexIVFStats *stats=nullptr
-                             ) const override;
+    void add_core(
+            idx_t n,
+            const float* x,
+            const idx_t* xids,
+            const idx_t* precomputed_idx) override;
+    void reconstruct_from_offset(int64_t list_no, int64_t offset, float* recons)
+            const override;
+    void merge_from(IndexIVF& other, idx_t add_id) override;
+    void search_preassigned(
+            idx_t n,
+            const float* x,
+            idx_t k,
+            const idx_t* assign,
+            const float* centroid_dis,
+            float* distances,
+            idx_t* labels,
+            bool store_pairs,
+            const IVFSearchParameters* params = nullptr,
+            IndexIVFStats* stats = nullptr) const override;
     IndexIVFPQR();
 };
 } // namespace faiss