RubyGems - faiss - Versions diffs - 0.2.0 → 0.2.4 - Mend

faiss 0.2.0 → 0.2.4

Files changed (215)

checksums.yaml +4 -4
data/CHANGELOG.md +16 -0
data/LICENSE.txt +1 -1
data/README.md +7 -7
data/ext/faiss/extconf.rb +6 -3
data/ext/faiss/numo.hpp +4 -4
data/ext/faiss/utils.cpp +1 -1
data/ext/faiss/utils.h +1 -1
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +292 -291
data/vendor/faiss/faiss/AutoTune.h +55 -56
data/vendor/faiss/faiss/Clustering.cpp +365 -194
data/vendor/faiss/faiss/Clustering.h +102 -35
data/vendor/faiss/faiss/IVFlib.cpp +171 -195
data/vendor/faiss/faiss/IVFlib.h +48 -51
data/vendor/faiss/faiss/Index.cpp +85 -103
data/vendor/faiss/faiss/Index.h +54 -48
data/vendor/faiss/faiss/Index2Layer.cpp +126 -224
data/vendor/faiss/faiss/Index2Layer.h +22 -36
data/vendor/faiss/faiss/IndexAdditiveQuantizer.cpp +407 -0
data/vendor/faiss/faiss/IndexAdditiveQuantizer.h +195 -0
data/vendor/faiss/faiss/IndexBinary.cpp +45 -37
data/vendor/faiss/faiss/IndexBinary.h +140 -132
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +73 -53
data/vendor/faiss/faiss/IndexBinaryFlat.h +29 -24
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +46 -43
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +16 -15
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +215 -232
data/vendor/faiss/faiss/IndexBinaryHNSW.h +25 -24
data/vendor/faiss/faiss/IndexBinaryHash.cpp +182 -177
data/vendor/faiss/faiss/IndexBinaryHash.h +41 -34
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +489 -461
data/vendor/faiss/faiss/IndexBinaryIVF.h +97 -68
data/vendor/faiss/faiss/IndexFlat.cpp +115 -176
data/vendor/faiss/faiss/IndexFlat.h +42 -59
data/vendor/faiss/faiss/IndexFlatCodes.cpp +67 -0
data/vendor/faiss/faiss/IndexFlatCodes.h +47 -0
data/vendor/faiss/faiss/IndexHNSW.cpp +372 -348
data/vendor/faiss/faiss/IndexHNSW.h +57 -41
data/vendor/faiss/faiss/IndexIVF.cpp +545 -453
data/vendor/faiss/faiss/IndexIVF.h +169 -118
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +316 -0
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.h +121 -0
data/vendor/faiss/faiss/IndexIVFFlat.cpp +247 -252
data/vendor/faiss/faiss/IndexIVFFlat.h +48 -51
data/vendor/faiss/faiss/IndexIVFPQ.cpp +459 -517
data/vendor/faiss/faiss/IndexIVFPQ.h +75 -67
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +406 -372
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +82 -57
data/vendor/faiss/faiss/IndexIVFPQR.cpp +104 -102
data/vendor/faiss/faiss/IndexIVFPQR.h +33 -28
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +163 -150
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +38 -25
data/vendor/faiss/faiss/IndexLSH.cpp +66 -113
data/vendor/faiss/faiss/IndexLSH.h +20 -38
data/vendor/faiss/faiss/IndexLattice.cpp +42 -56
data/vendor/faiss/faiss/IndexLattice.h +11 -16
data/vendor/faiss/faiss/IndexNNDescent.cpp +229 -0
data/vendor/faiss/faiss/IndexNNDescent.h +72 -0
data/vendor/faiss/faiss/IndexNSG.cpp +301 -0
data/vendor/faiss/faiss/IndexNSG.h +85 -0
data/vendor/faiss/faiss/IndexPQ.cpp +387 -495
data/vendor/faiss/faiss/IndexPQ.h +64 -82
data/vendor/faiss/faiss/IndexPQFastScan.cpp +143 -170
data/vendor/faiss/faiss/IndexPQFastScan.h +46 -32
data/vendor/faiss/faiss/IndexPreTransform.cpp +120 -150
data/vendor/faiss/faiss/IndexPreTransform.h +33 -36
data/vendor/faiss/faiss/IndexRefine.cpp +139 -127
data/vendor/faiss/faiss/IndexRefine.h +32 -23
data/vendor/faiss/faiss/IndexReplicas.cpp +147 -153
data/vendor/faiss/faiss/IndexReplicas.h +62 -56
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +111 -172
data/vendor/faiss/faiss/IndexScalarQuantizer.h +41 -59
data/vendor/faiss/faiss/IndexShards.cpp +256 -240
data/vendor/faiss/faiss/IndexShards.h +85 -73
data/vendor/faiss/faiss/MatrixStats.cpp +112 -97
data/vendor/faiss/faiss/MatrixStats.h +7 -10
data/vendor/faiss/faiss/MetaIndexes.cpp +135 -157
data/vendor/faiss/faiss/MetaIndexes.h +40 -34
data/vendor/faiss/faiss/MetricType.h +7 -7
data/vendor/faiss/faiss/VectorTransform.cpp +654 -475
data/vendor/faiss/faiss/VectorTransform.h +64 -89
data/vendor/faiss/faiss/clone_index.cpp +78 -73
data/vendor/faiss/faiss/clone_index.h +4 -9
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +33 -38
data/vendor/faiss/faiss/gpu/GpuAutoTune.h +11 -9
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +198 -171
data/vendor/faiss/faiss/gpu/GpuCloner.h +53 -35
data/vendor/faiss/faiss/gpu/GpuClonerOptions.cpp +12 -14
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +27 -25
data/vendor/faiss/faiss/gpu/GpuDistance.h +116 -112
data/vendor/faiss/faiss/gpu/GpuFaissAssert.h +1 -2
data/vendor/faiss/faiss/gpu/GpuIcmEncoder.h +60 -0
data/vendor/faiss/faiss/gpu/GpuIndex.h +134 -137
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +76 -73
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +173 -162
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +67 -64
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +89 -86
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +150 -141
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +101 -103
data/vendor/faiss/faiss/gpu/GpuIndicesOptions.h +17 -16
data/vendor/faiss/faiss/gpu/GpuResources.cpp +116 -128
data/vendor/faiss/faiss/gpu/GpuResources.h +182 -186
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +433 -422
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +131 -130
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.cpp +468 -456
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.h +25 -19
data/vendor/faiss/faiss/gpu/impl/RemapIndices.cpp +22 -20
data/vendor/faiss/faiss/gpu/impl/RemapIndices.h +9 -8
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +39 -44
data/vendor/faiss/faiss/gpu/perf/IndexWrapper.h +16 -14
data/vendor/faiss/faiss/gpu/perf/PerfClustering.cpp +77 -71
data/vendor/faiss/faiss/gpu/perf/PerfIVFPQAdd.cpp +109 -88
data/vendor/faiss/faiss/gpu/perf/WriteIndex.cpp +75 -64
data/vendor/faiss/faiss/gpu/test/TestCodePacking.cpp +230 -215
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +80 -86
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +284 -277
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +416 -416
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFPQ.cpp +611 -517
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFScalarQuantizer.cpp +166 -164
data/vendor/faiss/faiss/gpu/test/TestGpuMemoryException.cpp +61 -53
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +274 -238
data/vendor/faiss/faiss/gpu/test/TestUtils.h +73 -57
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +47 -50
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +79 -72
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.cpp +140 -146
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.h +69 -71
data/vendor/faiss/faiss/gpu/utils/StaticUtils.h +21 -16
data/vendor/faiss/faiss/gpu/utils/Timer.cpp +25 -29
data/vendor/faiss/faiss/gpu/utils/Timer.h +30 -29
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +503 -0
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +175 -0
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +90 -120
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +81 -65
data/vendor/faiss/faiss/impl/FaissAssert.h +73 -58
data/vendor/faiss/faiss/impl/FaissException.cpp +56 -48
data/vendor/faiss/faiss/impl/FaissException.h +41 -29
data/vendor/faiss/faiss/impl/HNSW.cpp +606 -617
data/vendor/faiss/faiss/impl/HNSW.h +179 -200
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +855 -0
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +244 -0
data/vendor/faiss/faiss/impl/NNDescent.cpp +487 -0
data/vendor/faiss/faiss/impl/NNDescent.h +154 -0
data/vendor/faiss/faiss/impl/NSG.cpp +679 -0
data/vendor/faiss/faiss/impl/NSG.h +199 -0
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +484 -454
data/vendor/faiss/faiss/impl/PolysemousTraining.h +52 -55
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +26 -47
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +469 -459
data/vendor/faiss/faiss/impl/ProductQuantizer.h +76 -87
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +758 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +188 -0
data/vendor/faiss/faiss/impl/ResultHandler.h +96 -132
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +647 -707
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +48 -46
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +129 -131
data/vendor/faiss/faiss/impl/ThreadedIndex.h +61 -55
data/vendor/faiss/faiss/impl/index_read.cpp +631 -480
data/vendor/faiss/faiss/impl/index_write.cpp +547 -407
data/vendor/faiss/faiss/impl/io.cpp +76 -95
data/vendor/faiss/faiss/impl/io.h +31 -41
data/vendor/faiss/faiss/impl/io_macros.h +60 -29
data/vendor/faiss/faiss/impl/kmeans1d.cpp +301 -0
data/vendor/faiss/faiss/impl/kmeans1d.h +48 -0
data/vendor/faiss/faiss/impl/lattice_Zn.cpp +137 -186
data/vendor/faiss/faiss/impl/lattice_Zn.h +40 -51
data/vendor/faiss/faiss/impl/platform_macros.h +29 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +77 -124
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +39 -48
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +41 -52
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +80 -117
data/vendor/faiss/faiss/impl/simd_result_handlers.h +109 -137
data/vendor/faiss/faiss/index_factory.cpp +619 -397
data/vendor/faiss/faiss/index_factory.h +8 -6
data/vendor/faiss/faiss/index_io.h +23 -26
data/vendor/faiss/faiss/invlists/BlockInvertedLists.cpp +67 -75
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +22 -24
data/vendor/faiss/faiss/invlists/DirectMap.cpp +96 -112
data/vendor/faiss/faiss/invlists/DirectMap.h +29 -33
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +307 -364
data/vendor/faiss/faiss/invlists/InvertedLists.h +151 -151
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +29 -34
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.h +17 -18
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +257 -293
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +50 -45
data/vendor/faiss/faiss/python/python_callbacks.cpp +23 -26
data/vendor/faiss/faiss/python/python_callbacks.h +9 -16
data/vendor/faiss/faiss/utils/AlignedTable.h +79 -44
data/vendor/faiss/faiss/utils/Heap.cpp +40 -48
data/vendor/faiss/faiss/utils/Heap.h +186 -209
data/vendor/faiss/faiss/utils/WorkerThread.cpp +67 -76
data/vendor/faiss/faiss/utils/WorkerThread.h +32 -33
data/vendor/faiss/faiss/utils/distances.cpp +305 -312
data/vendor/faiss/faiss/utils/distances.h +170 -122
data/vendor/faiss/faiss/utils/distances_simd.cpp +498 -508
data/vendor/faiss/faiss/utils/extra_distances-inl.h +117 -0
data/vendor/faiss/faiss/utils/extra_distances.cpp +113 -232
data/vendor/faiss/faiss/utils/extra_distances.h +30 -29
data/vendor/faiss/faiss/utils/hamming-inl.h +260 -209
data/vendor/faiss/faiss/utils/hamming.cpp +375 -469
data/vendor/faiss/faiss/utils/hamming.h +62 -85
data/vendor/faiss/faiss/utils/ordered_key_value.h +16 -18
data/vendor/faiss/faiss/utils/partitioning.cpp +393 -318
data/vendor/faiss/faiss/utils/partitioning.h +26 -21
data/vendor/faiss/faiss/utils/quantize_lut.cpp +78 -66
data/vendor/faiss/faiss/utils/quantize_lut.h +22 -20
data/vendor/faiss/faiss/utils/random.cpp +39 -63
data/vendor/faiss/faiss/utils/random.h +13 -16
data/vendor/faiss/faiss/utils/simdlib.h +4 -2
data/vendor/faiss/faiss/utils/simdlib_avx2.h +88 -85
data/vendor/faiss/faiss/utils/simdlib_emulated.h +226 -165
data/vendor/faiss/faiss/utils/simdlib_neon.h +832 -0
data/vendor/faiss/faiss/utils/utils.cpp +304 -287
data/vendor/faiss/faiss/utils/utils.h +54 -49
metadata +29 -4

data/vendor/faiss/faiss/IndexIVFPQ.cpp CHANGED

@@ -9,17 +9,17 @@
 #include <faiss/IndexIVFPQ.h>
+#include <stdint.h>
+#include <cassert>
 #include <cinttypes>
 #include <cmath>
 #include <cstdio>
-#include <cassert>
-#include <stdint.h>
 #include <algorithm>
 #include <faiss/utils/Heap.h>
-#include <faiss/utils/utils.h>
 #include <faiss/utils/distances.h>
+#include <faiss/utils/utils.h>
 #include <faiss/Clustering.h>
 #include <faiss/IndexFlat.h>
@@ -36,12 +36,15 @@ namespace faiss {
  * IndexIVFPQ implementation
  ******************************************/
-IndexIVFPQ::IndexIVFPQ (Index * quantizer, size_t d, size_t nlist,
-                        size_t M, size_t nbits_per_idx, MetricType metric):
-    IndexIVF (quantizer, d, nlist, 0, metric),
-    pq (d, M, nbits_per_idx)
-{
-    FAISS_THROW_IF_NOT (nbits_per_idx <= 8);
+IndexIVFPQ::IndexIVFPQ(
+        Index* quantizer,
+        size_t d,
+        size_t nlist,
+        size_t M,
+        size_t nbits_per_idx,
+        MetricType metric)
+        : IndexIVF(quantizer, d, nlist, 0, metric), pq(d, M, nbits_per_idx) {
+    FAISS_THROW_IF_NOT(nbits_per_idx <= 8);
     code_size = pq.code_size;
     invlists->code_size = code_size;
     is_trained = false;
@@ -52,202 +55,197 @@ IndexIVFPQ::IndexIVFPQ (Index * quantizer, size_t d, size_t nlist,
     polysemous_training = nullptr;
     do_polysemous_training = false;
     polysemous_ht = 0;
 }
 /****************************************************************
  * training                                                     */
-void IndexIVFPQ::train_residual (idx_t n, const float *x)
-{
-    train_residual_o (n, x, nullptr);
+void IndexIVFPQ::train_residual(idx_t n, const float* x) {
+    train_residual_o(n, x, nullptr);
 }
+void IndexIVFPQ::train_residual_o(idx_t n, const float* x, float* residuals_2) {
+    const float* x_in = x;
-void IndexIVFPQ::train_residual_o (idx_t n, const float *x, float *residuals_2)
-{
-    const float * x_in = x;
-    x = fvecs_maybe_subsample (
-         d, (size_t*)&n, pq.cp.max_points_per_centroid * pq.ksub,
-         x, verbose, pq.cp.seed);
+    x = fvecs_maybe_subsample(
+            d,
+            (size_t*)&n,
+            pq.cp.max_points_per_centroid * pq.ksub,
+            x,
+            verbose,
+            pq.cp.seed);
-    ScopeDeleter<float> del_x (x_in == x ? nullptr : x);
+    ScopeDeleter<float> del_x(x_in == x ? nullptr : x);
-    const float *trainset;
+    const float* trainset;
     ScopeDeleter<float> del_residuals;
     if (by_residual) {
-        if(verbose) printf("computing residuals\n");
-        idx_t * assign = new idx_t [n]; // assignement to coarse centroids
-        ScopeDeleter<idx_t> del (assign);
-        quantizer->assign (n, x, assign);
-        float *residuals = new float [n * d];
-        del_residuals.set (residuals);
+        if (verbose)
+            printf("computing residuals\n");
+        idx_t* assign = new idx_t[n]; // assignement to coarse centroids
+        ScopeDeleter<idx_t> del(assign);
+        quantizer->assign(n, x, assign);
+        float* residuals = new float[n * d];
+        del_residuals.set(residuals);
         for (idx_t i = 0; i < n; i++)
-           quantizer->compute_residual (x + i * d, residuals+i*d, assign[i]);
+            quantizer->compute_residual(
+                    x + i * d, residuals + i * d, assign[i]);
         trainset = residuals;
     } else {
         trainset = x;
     }
     if (verbose)
-        printf ("training %zdx%zd product quantizer on %" PRId64 " vectors in %dD\n",
-                pq.M, pq.ksub, n, d);
+        printf("training %zdx%zd product quantizer on %" PRId64
+               " vectors in %dD\n",
+               pq.M,
+               pq.ksub,
+               n,
+               d);
     pq.verbose = verbose;
-    pq.train (n, trainset);
+    pq.train(n, trainset);
     if (do_polysemous_training) {
         if (verbose)
             printf("doing polysemous training for PQ\n");
         PolysemousTraining default_pt;
-        PolysemousTraining *pt = polysemous_training;
-        if (!pt) pt = &default_pt;
-        pt->optimize_pq_for_hamming (pq, n, trainset);
+        PolysemousTraining* pt = polysemous_training;
+        if (!pt)
+            pt = &default_pt;
+        pt->optimize_pq_for_hamming(pq, n, trainset);
     }
     // prepare second-level residuals for refine PQ
     if (residuals_2) {
-        uint8_t *train_codes = new uint8_t [pq.code_size * n];
-        ScopeDeleter<uint8_t> del (train_codes);
-        pq.compute_codes (trainset, train_codes, n);
+        uint8_t* train_codes = new uint8_t[pq.code_size * n];
+        ScopeDeleter<uint8_t> del(train_codes);
+        pq.compute_codes(trainset, train_codes, n);
         for (idx_t i = 0; i < n; i++) {
-            const float *xx = trainset + i * d;
-            float * res = residuals_2 + i * d;
-            pq.decode (train_codes + i * pq.code_size, res);
+            const float* xx = trainset + i * d;
+            float* res = residuals_2 + i * d;
+            pq.decode(train_codes + i * pq.code_size, res);
             for (int j = 0; j < d; j++)
                 res[j] = xx[j] - res[j];
         }
     }
     if (by_residual) {
-        precompute_table ();
+        precompute_table();
     }
 }
 /****************************************************************
  * IVFPQ as codec                                               */
 /* produce a binary signature based on the residual vector */
-void IndexIVFPQ::encode (idx_t key, const float * x, uint8_t * code) const
-{
+void IndexIVFPQ::encode(idx_t key, const float* x, uint8_t* code) const {
     if (by_residual) {
         std::vector<float> residual_vec(d);
-        quantizer->compute_residual (x, residual_vec.data(), key);
-        pq.compute_code (residual_vec.data(), code);
-    }
-    else pq.compute_code (x, code);
+        quantizer->compute_residual(x, residual_vec.data(), key);
+        pq.compute_code(residual_vec.data(), code);
+    } else
+        pq.compute_code(x, code);
 }
-void IndexIVFPQ::encode_multiple (size_t n, idx_t *keys,
-                                  const float * x, uint8_t * xcodes,
-                                  bool compute_keys) const
-{
+void IndexIVFPQ::encode_multiple(
+        size_t n,
+        idx_t* keys,
+        const float* x,
+        uint8_t* xcodes,
+        bool compute_keys) const {
     if (compute_keys)
-        quantizer->assign (n, x, keys);
+        quantizer->assign(n, x, keys);
-    encode_vectors (n, x, keys, xcodes);
+    encode_vectors(n, x, keys, xcodes);
 }
-void IndexIVFPQ::decode_multiple (size_t n, const idx_t *keys,
-                                  const uint8_t * xcodes, float * x) const
-{
-    pq.decode (xcodes, x, n);
+void IndexIVFPQ::decode_multiple(
+        size_t n,
+        const idx_t* keys,
+        const uint8_t* xcodes,
+        float* x) const {
+    pq.decode(xcodes, x, n);
     if (by_residual) {
-        std::vector<float> centroid (d);
+        std::vector<float> centroid(d);
         for (size_t i = 0; i < n; i++) {
-            quantizer->reconstruct (keys[i], centroid.data());
-            float *xi = x + i * d;
+            quantizer->reconstruct(keys[i], centroid.data());
+            float* xi = x + i * d;
             for (size_t j = 0; j < d; j++) {
-                xi [j] += centroid [j];
+                xi[j] += centroid[j];
             }
         }
     }
 }
 /****************************************************************
  * add                                                          */
-void IndexIVFPQ::add_with_ids (idx_t n, const float * x, const idx_t *xids)
-{
-    add_core_o (n, x, xids, nullptr);
+void IndexIVFPQ::add_core(
+        idx_t n,
+        const float* x,
+        const idx_t* xids,
+        const idx_t* coarse_idx) {
+    add_core_o(n, x, xids, nullptr, coarse_idx);
 }
-static float * compute_residuals (
-        const Index *quantizer,
-        Index::idx_t n, const float* x,
-        const Index::idx_t *list_nos)
-{
+static float* compute_residuals(
+        const Index* quantizer,
+        Index::idx_t n,
+        const float* x,
+        const Index::idx_t* list_nos) {
     size_t d = quantizer->d;
-    float *residuals = new float [n * d];
+    float* residuals = new float[n * d];
     // TODO: parallelize?
     for (size_t i = 0; i < n; i++) {
         if (list_nos[i] < 0)
-            memset (residuals + i * d, 0, sizeof(*residuals) * d);
+            memset(residuals + i * d, 0, sizeof(*residuals) * d);
         else
-            quantizer->compute_residual (
-                 x + i * d, residuals + i * d, list_nos[i]);
+            quantizer->compute_residual(
+                    x + i * d, residuals + i * d, list_nos[i]);
     }
     return residuals;
 }
-void IndexIVFPQ::encode_vectors(idx_t n, const float* x,
-                                const idx_t *list_nos,
-                                uint8_t * codes,
-                                bool include_listnos) const
-{
+void IndexIVFPQ::encode_vectors(
+        idx_t n,
+        const float* x,
+        const idx_t* list_nos,
+        uint8_t* codes,
+        bool include_listnos) const {
     if (by_residual) {
-        float *to_encode = compute_residuals (quantizer, n, x, list_nos);
-        ScopeDeleter<float> del (to_encode);
-        pq.compute_codes (to_encode, codes, n);
+        float* to_encode = compute_residuals(quantizer, n, x, list_nos);
+        ScopeDeleter<float> del(to_encode);
+        pq.compute_codes(to_encode, codes, n);
     } else {
-        pq.compute_codes (x, codes, n);
+        pq.compute_codes(x, codes, n);
     }
     if (include_listnos) {
         size_t coarse_size = coarse_code_size();
         for (idx_t i = n - 1; i >= 0; i--) {
-            uint8_t * code = codes + i * (coarse_size + code_size);
-            memmove (code + coarse_size,
-                     codes + i * code_size, code_size);
-            encode_listno (list_nos[i], code);
+            uint8_t* code = codes + i * (coarse_size + code_size);
+            memmove(code + coarse_size, codes + i * code_size, code_size);
+            encode_listno(list_nos[i], code);
         }
     }
 }
-void IndexIVFPQ::sa_decode (idx_t n, const uint8_t *codes,
-                            float *x) const
-{
-    size_t coarse_size = coarse_code_size ();
+void IndexIVFPQ::sa_decode(idx_t n, const uint8_t* codes, float* x) const {
+    size_t coarse_size = coarse_code_size();
 #pragma omp parallel
     {
-        std::vector<float> residual (d);
+        std::vector<float> residual(d);
 #pragma omp for
         for (idx_t i = 0; i < n; i++) {
-            const uint8_t *code = codes + i * (code_size + coarse_size);
-            int64_t list_no = decode_listno (code);
-            float *xi = x + i * d;
-            pq.decode (code + coarse_size, xi);
+            const uint8_t* code = codes + i * (code_size + coarse_size);
+            int64_t list_no = decode_listno(code);
+            float* xi = x + i * d;
+            pq.decode(code + coarse_size, xi);
             if (by_residual) {
-                quantizer->reconstruct (list_no, residual.data());
+                quantizer->reconstruct(list_no, residual.data());
                 for (size_t j = 0; j < d; j++) {
                     xi[j] += residual[j];
                 }
@@ -256,120 +254,127 @@ void IndexIVFPQ::sa_decode (idx_t n, const uint8_t *codes,
     }
 }
-void IndexIVFPQ::add_core_o (idx_t n, const float * x, const idx_t *xids,
-                             float *residuals_2, const idx_t *precomputed_idx)
-{
+void IndexIVFPQ::add_core_o(
+        idx_t n,
+        const float* x,
+        const idx_t* xids,
+        float* residuals_2,
+        const idx_t* precomputed_idx) {
     idx_t bs = 32768;
     if (n > bs) {
         for (idx_t i0 = 0; i0 < n; i0 += bs) {
             idx_t i1 = std::min(i0 + bs, n);
             if (verbose) {
-                printf("IndexIVFPQ::add_core_o: adding %" PRId64 ":%" PRId64 " / %" PRId64 "\n",
-                       i0, i1, n);
+                printf("IndexIVFPQ::add_core_o: adding %" PRId64 ":%" PRId64
+                       " / %" PRId64 "\n",
+                       i0,
+                       i1,
+                       n);
             }
-            add_core_o (i1 - i0, x + i0 * d,
-                        xids ? xids + i0 : nullptr,
-                        residuals_2 ? residuals_2 + i0 * d : nullptr,
-                        precomputed_idx ? precomputed_idx + i0 : nullptr);
+            add_core_o(
+                    i1 - i0,
+                    x + i0 * d,
+                    xids ? xids + i0 : nullptr,
+                    residuals_2 ? residuals_2 + i0 * d : nullptr,
+                    precomputed_idx ? precomputed_idx + i0 : nullptr);
         }
         return;
     }
     InterruptCallback::check();
-    direct_map.check_can_add (xids);
+    direct_map.check_can_add(xids);
-    FAISS_THROW_IF_NOT (is_trained);
-    double t0 = getmillisecs ();
-    const idx_t * idx;
+    FAISS_THROW_IF_NOT(is_trained);
+    double t0 = getmillisecs();
+    const idx_t* idx;
     ScopeDeleter<idx_t> del_idx;
     if (precomputed_idx) {
         idx = precomputed_idx;
     } else {
-        idx_t * idx0 = new idx_t [n];
-        del_idx.set (idx0);
-        quantizer->assign (n, x, idx0);
+        idx_t* idx0 = new idx_t[n];
+        del_idx.set(idx0);
+        quantizer->assign(n, x, idx0);
         idx = idx0;
     }
-    double t1 = getmillisecs ();
-    uint8_t * xcodes = new uint8_t [n * code_size];
-    ScopeDeleter<uint8_t> del_xcodes (xcodes);
+    double t1 = getmillisecs();
+    uint8_t* xcodes = new uint8_t[n * code_size];
+    ScopeDeleter<uint8_t> del_xcodes(xcodes);
-    const float *to_encode = nullptr;
+    const float* to_encode = nullptr;
     ScopeDeleter<float> del_to_encode;
     if (by_residual) {
-        to_encode = compute_residuals (quantizer, n, x, idx);
-        del_to_encode.set (to_encode);
+        to_encode = compute_residuals(quantizer, n, x, idx);
+        del_to_encode.set(to_encode);
     } else {
         to_encode = x;
     }
-    pq.compute_codes (to_encode, xcodes, n);
+    pq.compute_codes(to_encode, xcodes, n);
-    double t2 = getmillisecs ();
+    double t2 = getmillisecs();
     // TODO: parallelize?
     size_t n_ignore = 0;
     for (size_t i = 0; i < n; i++) {
         idx_t key = idx[i];
         idx_t id = xids ? xids[i] : ntotal + i;
         if (key < 0) {
-            direct_map.add_single_id (id, -1, 0);
-            n_ignore ++;
+            direct_map.add_single_id(id, -1, 0);
+            n_ignore++;
             if (residuals_2)
-                memset (residuals_2, 0, sizeof(*residuals_2) * d);
+                memset(residuals_2, 0, sizeof(*residuals_2) * d);
             continue;
         }
-        uint8_t *code = xcodes + i * code_size;
-        size_t offset = invlists->add_entry (key, id, code);
+        uint8_t* code = xcodes + i * code_size;
+        size_t offset = invlists->add_entry(key, id, code);
         if (residuals_2) {
-            float *res2 = residuals_2 + i * d;
-            const float *xi = to_encode + i * d;
-            pq.decode (code, res2);
+            float* res2 = residuals_2 + i * d;
+            const float* xi = to_encode + i * d;
+            pq.decode(code, res2);
             for (int j = 0; j < d; j++)
                 res2[j] = xi[j] - res2[j];
         }
-        direct_map.add_single_id (id, key, offset);
+        direct_map.add_single_id(id, key, offset);
     }
-    double t3 = getmillisecs ();
-    if(verbose) {
+    double t3 = getmillisecs();
+    if (verbose) {
         char comment[100] = {0};
         if (n_ignore > 0)
-            snprintf (comment, 100, "(%zd vectors ignored)", n_ignore);
+            snprintf(comment, 100, "(%zd vectors ignored)", n_ignore);
         printf(" add_core times: %.3f %.3f %.3f %s\n",
-               t1 - t0, t2 - t1, t3 - t2, comment);
+               t1 - t0,
+               t2 - t1,
+               t3 - t2,
+               comment);
     }
     ntotal += n;
 }
-void IndexIVFPQ::reconstruct_from_offset (int64_t list_no, int64_t offset,
-                                          float* recons) const
-{
-    const uint8_t* code = invlists->get_single_code (list_no, offset);
+void IndexIVFPQ::reconstruct_from_offset(
+        int64_t list_no,
+        int64_t offset,
+        float* recons) const {
+    const uint8_t* code = invlists->get_single_code(list_no, offset);
     if (by_residual) {
         std::vector<float> centroid(d);
-        quantizer->reconstruct (list_no, centroid.data());
+        quantizer->reconstruct(list_no, centroid.data());
-        pq.decode (code, recons);
+        pq.decode(code, recons);
         for (int i = 0; i < d; ++i) {
             recons[i] += centroid[i];
         }
     } else {
-        pq.decode (code, recons);
+        pq.decode(code, recons);
     }
 }
 /// 2G by default, accommodates tables up to PQ32 w/ 65536 centroids
 size_t precomputed_table_max_bytes = ((size_t)1) << 31;
@@ -403,20 +408,18 @@ size_t precomputed_table_max_bytes = ((size_t)1) << 31;
  * is faster when the length of the lists is > ksub * M.
  */
-void initialize_IVFPQ_precomputed_table (
-    int &use_precomputed_table,
-    const Index *quantizer,
-    const ProductQuantizer &pq,
-    AlignedTable<float> & precomputed_table,
-    bool verbose
-)
-{
+void initialize_IVFPQ_precomputed_table(
+        int& use_precomputed_table,
+        const Index* quantizer,
+        const ProductQuantizer& pq,
+        AlignedTable<float>& precomputed_table,
+        bool verbose) {
     size_t nlist = quantizer->ntotal;
     size_t d = quantizer->d;
     FAISS_THROW_IF_NOT(d == pq.d);
     if (use_precomputed_table == -1) {
-        precomputed_table.resize (0);
+        precomputed_table.resize(0);
         return;
     }
@@ -424,23 +427,23 @@ void initialize_IVFPQ_precomputed_table (
         if (quantizer->metric_type == METRIC_INNER_PRODUCT) {
             if (verbose) {
                 printf("IndexIVFPQ::precompute_table: precomputed "
-                        "tables not needed for inner product quantizers\n");
+                       "tables not needed for inner product quantizers\n");
             }
-            precomputed_table.resize (0);
+            precomputed_table.resize(0);
             return;
         }
-        const MultiIndexQuantizer *miq =
-            dynamic_cast<const MultiIndexQuantizer *> (quantizer);
+        const MultiIndexQuantizer* miq =
+                dynamic_cast<const MultiIndexQuantizer*>(quantizer);
         if (miq && pq.M % miq->pq.M == 0)
             use_precomputed_table = 2;
         else {
             size_t table_size = pq.M * pq.ksub * nlist * sizeof(float);
             if (table_size > precomputed_table_max_bytes) {
                 if (verbose) {
-                    printf(
-                       "IndexIVFPQ::precompute_table: not precomputing table, "
-                       "it would be too big: %zd bytes (max %zd)\n",
-                       table_size, precomputed_table_max_bytes);
+                    printf("IndexIVFPQ::precompute_table: not precomputing table, "
+                           "it would be too big: %zd bytes (max %zd)\n",
+                           table_size,
+                           precomputed_table_max_bytes);
                     use_precomputed_table = 0;
                 }
                 return;
@@ -450,80 +453,68 @@ void initialize_IVFPQ_precomputed_table (
     } // otherwise assume user has set appropriate flag on input
     if (verbose) {
-        printf ("precomputing IVFPQ tables type %d\n",
-                use_precomputed_table);
+        printf("precomputing IVFPQ tables type %d\n", use_precomputed_table);
     }
     // squared norms of the PQ centroids
-    std::vector<float> r_norms (pq.M * pq.ksub, NAN);
+    std::vector<float> r_norms(pq.M * pq.ksub, NAN);
     for (int m = 0; m < pq.M; m++)
         for (int j = 0; j < pq.ksub; j++)
-            r_norms [m * pq.ksub + j] =
-                fvec_norm_L2sqr (pq.get_centroids (m, j), pq.dsub);
+            r_norms[m * pq.ksub + j] =
+                    fvec_norm_L2sqr(pq.get_centroids(m, j), pq.dsub);
     if (use_precomputed_table == 1) {
-        precomputed_table.resize (nlist * pq.M * pq.ksub);
-        std::vector<float> centroid (d);
+        precomputed_table.resize(nlist * pq.M * pq.ksub);
+        std::vector<float> centroid(d);
         for (size_t i = 0; i < nlist; i++) {
-            quantizer->reconstruct (i, centroid.data());
+            quantizer->reconstruct(i, centroid.data());
-            float *tab = &precomputed_table[i * pq.M * pq.ksub];
-            pq.compute_inner_prod_table (centroid.data(), tab);
-            fvec_madd (pq.M * pq.ksub, r_norms.data(), 2.0, tab, tab);
+            float* tab = &precomputed_table[i * pq.M * pq.ksub];
+            pq.compute_inner_prod_table(centroid.data(), tab);
+            fvec_madd(pq.M * pq.ksub, r_norms.data(), 2.0, tab, tab);
         }
     } else if (use_precomputed_table == 2) {
-        const MultiIndexQuantizer *miq =
-           dynamic_cast<const MultiIndexQuantizer *> (quantizer);
-        FAISS_THROW_IF_NOT (miq);
-        const ProductQuantizer &cpq = miq->pq;
-        FAISS_THROW_IF_NOT (pq.M % cpq.M == 0);
+        const MultiIndexQuantizer* miq =
+                dynamic_cast<const MultiIndexQuantizer*>(quantizer);
+        FAISS_THROW_IF_NOT(miq);
+        const ProductQuantizer& cpq = miq->pq;
+        FAISS_THROW_IF_NOT(pq.M % cpq.M == 0);
         precomputed_table.resize(cpq.ksub * pq.M * pq.ksub);
         // reorder PQ centroid table
-        std::vector<float> centroids (d * cpq.ksub, NAN);
+        std::vector<float> centroids(d * cpq.ksub, NAN);
         for (int m = 0; m < cpq.M; m++) {
             for (size_t i = 0; i < cpq.ksub; i++) {
-                memcpy (centroids.data() + i * d + m * cpq.dsub,
-                        cpq.get_centroids (m, i),
-                        sizeof (*centroids.data()) * cpq.dsub);
+                memcpy(centroids.data() + i * d + m * cpq.dsub,
+                       cpq.get_centroids(m, i),
+                       sizeof(*centroids.data()) * cpq.dsub);
             }
         }
-        pq.compute_inner_prod_tables (cpq.ksub, centroids.data (),
-                                      precomputed_table.data ());
+        pq.compute_inner_prod_tables(
+                cpq.ksub, centroids.data(), precomputed_table.data());
         for (size_t i = 0; i < cpq.ksub; i++) {
-            float *tab = &precomputed_table[i * pq.M * pq.ksub];
-            fvec_madd (pq.M * pq.ksub, r_norms.data(), 2.0, tab, tab);
+            float* tab = &precomputed_table[i * pq.M * pq.ksub];
+            fvec_madd(pq.M * pq.ksub, r_norms.data(), 2.0, tab, tab);
         }
     }
 }
-void IndexIVFPQ::precompute_table ()
-{
-    initialize_IVFPQ_precomputed_table (
-        use_precomputed_table, quantizer, pq, precomputed_table,
-        verbose
-    );
+void IndexIVFPQ::precompute_table() {
+    initialize_IVFPQ_precomputed_table(
+            use_precomputed_table, quantizer, pq, precomputed_table, verbose);
 }
 namespace {
 using idx_t = Index::idx_t;
 #define TIC t0 = get_cycles()
-#define TOC get_cycles () - t0
+#define TOC get_cycles() - t0
 /** QueryTables manages the various ways of searching an
  * IndexIVFPQ. The code contains a lot of branches, depending on:
@@ -533,43 +524,42 @@ using idx_t = Index::idx_t;
  * - polysemous_ht: are we filtering with polysemous codes?
  */
 struct QueryTables {
     /*****************************************************
      * General data from the IVFPQ
      *****************************************************/
-    const IndexIVFPQ & ivfpq;
-    const IVFSearchParameters *params;
+    const IndexIVFPQ& ivfpq;
+    const IVFSearchParameters* params;
     // copied from IndexIVFPQ for easier access
     int d;
-    const ProductQuantizer & pq;
+    const ProductQuantizer& pq;
     MetricType metric_type;
     bool by_residual;
     int use_precomputed_table;
     int polysemous_ht;
     // pre-allocated data buffers
-    float * sim_table, * sim_table_2;
-    float * residual_vec, *decoded_vec;
+    float *sim_table, *sim_table_2;
+    float *residual_vec, *decoded_vec;
     // single data buffer
     std::vector<float> mem;
     // for table pointers
-    std::vector<const float *> sim_table_ptrs;
-    explicit QueryTables (const IndexIVFPQ & ivfpq,
-                          const IVFSearchParameters *params):
-        ivfpq(ivfpq),
-        d(ivfpq.d),
-        pq (ivfpq.pq),
-        metric_type (ivfpq.metric_type),
-        by_residual (ivfpq.by_residual),
-        use_precomputed_table (ivfpq.use_precomputed_table)
-    {
-        mem.resize (pq.ksub * pq.M * 2 + d * 2);
-        sim_table = mem.data ();
+    std::vector<const float*> sim_table_ptrs;
+    explicit QueryTables(
+            const IndexIVFPQ& ivfpq,
+            const IVFSearchParameters* params)
+            : ivfpq(ivfpq),
+              d(ivfpq.d),
+              pq(ivfpq.pq),
+              metric_type(ivfpq.metric_type),
+              by_residual(ivfpq.by_residual),
+              use_precomputed_table(ivfpq.use_precomputed_table) {
+        mem.resize(pq.ksub * pq.M * 2 + d * 2);
+        sim_table = mem.data();
         sim_table_2 = sim_table + pq.ksub * pq.M;
         residual_vec = sim_table_2 + pq.ksub * pq.M;
         decoded_vec = residual_vec + d;
@@ -577,14 +567,14 @@ struct QueryTables {
         // for polysemous
         polysemous_ht = ivfpq.polysemous_ht;
         if (auto ivfpq_params =
-            dynamic_cast<const IVFPQSearchParameters *>(params)) {
+                    dynamic_cast<const IVFPQSearchParameters*>(params)) {
             polysemous_ht = ivfpq_params->polysemous_ht;
         }
-        if (polysemous_ht != 0)  {
-            q_code.resize (pq.code_size);
+        if (polysemous_ht != 0) {
+            q_code.resize(pq.code_size);
         }
         init_list_cycles = 0;
-        sim_table_ptrs.resize (pq.M);
+        sim_table_ptrs.resize(pq.M);
     }
     /*****************************************************
@@ -592,29 +582,29 @@ struct QueryTables {
      *****************************************************/
     // field specific to query
-    const float * qi;
+    const float* qi;
-    // query-specific intialization
-    void init_query (const float * qi) {
+    // query-specific initialization
+    void init_query(const float* qi) {
         this->qi = qi;
         if (metric_type == METRIC_INNER_PRODUCT)
-            init_query_IP ();
+            init_query_IP();
         else
-            init_query_L2 ();
+            init_query_L2();
         if (!by_residual && polysemous_ht != 0)
-            pq.compute_code (qi, q_code.data());
+            pq.compute_code(qi, q_code.data());
     }
-    void init_query_IP () {
+    void init_query_IP() {
         // precompute some tables specific to the query qi
-        pq.compute_inner_prod_table (qi, sim_table);
+        pq.compute_inner_prod_table(qi, sim_table);
     }
-    void init_query_L2 () {
+    void init_query_L2() {
         if (!by_residual) {
-            pq.compute_distance_table (qi, sim_table);
+            pq.compute_distance_table(qi, sim_table);
         } else if (use_precomputed_table) {
-            pq.compute_inner_prod_table (qi, sim_table_2);
+            pq.compute_inner_prod_table(qi, sim_table_2);
         }
     }
@@ -632,96 +622,95 @@ struct QueryTables {
     /// once we know the query and the centroid, we can prepare the
     /// sim_table that will be used for accumulation
     /// and dis0, the initial value
-    float precompute_list_tables () {
+    float precompute_list_tables() {
         float dis0 = 0;
-        uint64_t t0; TIC;
+        uint64_t t0;
+        TIC;
         if (by_residual) {
             if (metric_type == METRIC_INNER_PRODUCT)
-                dis0 = precompute_list_tables_IP ();
+                dis0 = precompute_list_tables_IP();
             else
-                dis0 = precompute_list_tables_L2 ();
+                dis0 = precompute_list_tables_L2();
         }
         init_list_cycles += TOC;
         return dis0;
-     }
+    }
-    float precompute_list_table_pointers () {
+    float precompute_list_table_pointers() {
         float dis0 = 0;
-        uint64_t t0; TIC;
+        uint64_t t0;
+        TIC;
         if (by_residual) {
             if (metric_type == METRIC_INNER_PRODUCT)
-              FAISS_THROW_MSG ("not implemented");
+                FAISS_THROW_MSG("not implemented");
             else
-              dis0 = precompute_list_table_pointers_L2 ();
+                dis0 = precompute_list_table_pointers_L2();
         }
         init_list_cycles += TOC;
         return dis0;
-     }
+    }
     /*****************************************************
      * compute tables for inner prod
      *****************************************************/
-    float precompute_list_tables_IP ()
-    {
+    float precompute_list_tables_IP() {
         // prepare the sim_table that will be used for accumulation
         // and dis0, the initial value
-        ivfpq.quantizer->reconstruct (key, decoded_vec);
+        ivfpq.quantizer->reconstruct(key, decoded_vec);
         // decoded_vec = centroid
-        float dis0 = fvec_inner_product (qi, decoded_vec, d);
+        float dis0 = fvec_inner_product(qi, decoded_vec, d);
         if (polysemous_ht) {
             for (int i = 0; i < d; i++) {
-                residual_vec [i] = qi[i] - decoded_vec[i];
+                residual_vec[i] = qi[i] - decoded_vec[i];
             }
-            pq.compute_code (residual_vec, q_code.data());
+            pq.compute_code(residual_vec, q_code.data());
         }
         return dis0;
     }
     /*****************************************************
      * compute tables for L2 distance
      *****************************************************/
-    float precompute_list_tables_L2 ()
-    {
+    float precompute_list_tables_L2() {
         float dis0 = 0;
         if (use_precomputed_table == 0 || use_precomputed_table == -1) {
-            ivfpq.quantizer->compute_residual (qi, residual_vec, key);
-            pq.compute_distance_table (residual_vec, sim_table);
+            ivfpq.quantizer->compute_residual(qi, residual_vec, key);
+            pq.compute_distance_table(residual_vec, sim_table);
             if (polysemous_ht != 0) {
-                pq.compute_code (residual_vec, q_code.data());
+                pq.compute_code(residual_vec, q_code.data());
             }
         } else if (use_precomputed_table == 1) {
             dis0 = coarse_dis;
-            fvec_madd (
+            fvec_madd(
                     pq.M * pq.ksub,
                     ivfpq.precomputed_table.data() + key * pq.ksub * pq.M,
-                    -2.0, sim_table_2,
-                    sim_table
-            );
+                    -2.0,
+                    sim_table_2,
+                    sim_table);
             if (polysemous_ht != 0) {
-                ivfpq.quantizer->compute_residual (qi, residual_vec, key);
-                pq.compute_code (residual_vec, q_code.data());
+                ivfpq.quantizer->compute_residual(qi, residual_vec, key);
+                pq.compute_code(residual_vec, q_code.data());
             }
         } else if (use_precomputed_table == 2) {
             dis0 = coarse_dis;
-            const MultiIndexQuantizer *miq =
-                dynamic_cast<const MultiIndexQuantizer *> (ivfpq.quantizer);
-            FAISS_THROW_IF_NOT (miq);
-            const ProductQuantizer &cpq = miq->pq;
+            const MultiIndexQuantizer* miq =
+                    dynamic_cast<const MultiIndexQuantizer*>(ivfpq.quantizer);
+            FAISS_THROW_IF_NOT(miq);
+            const ProductQuantizer& cpq = miq->pq;
             int Mf = pq.M / cpq.M;
-            const float *qtab = sim_table_2; // query-specific table
-            float *ltab = sim_table; // (output) list-specific table
+            const float* qtab = sim_table_2; // query-specific table
+            float* ltab = sim_table;         // (output) list-specific table
             long k = key;
             for (int cm = 0; cm < cpq.M; cm++) {
@@ -730,54 +719,48 @@ struct QueryTables {
                 k >>= cpq.nbits;
                 // get corresponding table
-                const float *pc = ivfpq.precomputed_table.data() +
-                    (ki * pq.M + cm * Mf) * pq.ksub;
+                const float* pc = ivfpq.precomputed_table.data() +
+                        (ki * pq.M + cm * Mf) * pq.ksub;
                 if (polysemous_ht == 0) {
                     // sum up with query-specific table
-                    fvec_madd (Mf * pq.ksub,
-                               pc,
-                               -2.0, qtab,
-                               ltab);
+                    fvec_madd(Mf * pq.ksub, pc, -2.0, qtab, ltab);
                     ltab += Mf * pq.ksub;
                     qtab += Mf * pq.ksub;
                 } else {
                     for (int m = cm * Mf; m < (cm + 1) * Mf; m++) {
-                        q_code[m] = fvec_madd_and_argmin
-                            (pq.ksub, pc, -2, qtab, ltab);
+                        q_code[m] = fvec_madd_and_argmin(
+                                pq.ksub, pc, -2, qtab, ltab);
                         pc += pq.ksub;
                         ltab += pq.ksub;
                         qtab += pq.ksub;
                     }
                 }
             }
         }
         return dis0;
     }
-    float precompute_list_table_pointers_L2 ()
-    {
+    float precompute_list_table_pointers_L2() {
         float dis0 = 0;
         if (use_precomputed_table == 1) {
             dis0 = coarse_dis;
-            const float * s = ivfpq.precomputed_table.data() +
-                    key * pq.ksub * pq.M;
+            const float* s =
+                    ivfpq.precomputed_table.data() + key * pq.ksub * pq.M;
             for (int m = 0; m < pq.M; m++) {
-                sim_table_ptrs [m] = s;
+                sim_table_ptrs[m] = s;
                 s += pq.ksub;
             }
         } else if (use_precomputed_table == 2) {
             dis0 = coarse_dis;
-            const MultiIndexQuantizer *miq =
-                dynamic_cast<const MultiIndexQuantizer *> (ivfpq.quantizer);
-            FAISS_THROW_IF_NOT (miq);
-            const ProductQuantizer &cpq = miq->pq;
+            const MultiIndexQuantizer* miq =
+                    dynamic_cast<const MultiIndexQuantizer*>(ivfpq.quantizer);
+            FAISS_THROW_IF_NOT(miq);
+            const ProductQuantizer& cpq = miq->pq;
             int Mf = pq.M / cpq.M;
             long k = key;
@@ -786,21 +769,21 @@ struct QueryTables {
                 int ki = k & ((uint64_t(1) << cpq.nbits) - 1);
                 k >>= cpq.nbits;
-                const float *pc = ivfpq.precomputed_table.data() +
-                    (ki * pq.M + cm * Mf) * pq.ksub;
+                const float* pc = ivfpq.precomputed_table.data() +
+                        (ki * pq.M + cm * Mf) * pq.ksub;
                 for (int m = m0; m < m0 + Mf; m++) {
-                    sim_table_ptrs [m] = pc;
+                    sim_table_ptrs[m] = pc;
                     pc += pq.ksub;
                 }
                 m0 += Mf;
             }
         } else {
-          FAISS_THROW_MSG ("need precomputed tables");
+            FAISS_THROW_MSG("need precomputed tables");
         }
         if (polysemous_ht) {
-            FAISS_THROW_MSG ("not implemented");
+            FAISS_THROW_MSG("not implemented");
             // Not clear that it makes sense to implemente this,
             // because it costs M * ksub, which is what we wanted to
             // avoid with the tables pointers.
@@ -808,82 +791,72 @@ struct QueryTables {
         return dis0;
     }
 };
-template<class C>
+template <class C>
 struct KnnSearchResults {
     idx_t key;
-    const idx_t *ids;
+    const idx_t* ids;
     // heap params
     size_t k;
-    float * heap_sim;
-    idx_t * heap_ids;
+    float* heap_sim;
+    idx_t* heap_ids;
     size_t nup;
-    inline void add (idx_t j, float dis) {
-        if (C::cmp (heap_sim[0], dis)) {
-            idx_t id = ids ? ids[j] : lo_build (key, j);
-            heap_replace_top<C> (k, heap_sim, heap_ids, dis, id);
+    inline void add(idx_t j, float dis) {
+        if (C::cmp(heap_sim[0], dis)) {
+            idx_t id = ids ? ids[j] : lo_build(key, j);
+            heap_replace_top<C>(k, heap_sim, heap_ids, dis, id);
             nup++;
         }
     }
 };
-template<class C>
+template <class C>
 struct RangeSearchResults {
     idx_t key;
-    const idx_t *ids;
+    const idx_t* ids;
     // wrapped result structure
     float radius;
-    RangeQueryResult & rres;
+    RangeQueryResult& rres;
-    inline void add (idx_t j, float dis) {
-        if (C::cmp (radius, dis)) {
-            idx_t id = ids ? ids[j] : lo_build (key, j);
-            rres.add (dis, id);
+    inline void add(idx_t j, float dis) {
+        if (C::cmp(radius, dis)) {
+            idx_t id = ids ? ids[j] : lo_build(key, j);
+            rres.add(dis, id);
         }
     }
 };
 /*****************************************************
  * Scaning the codes.
  * The scanning functions call their favorite precompute_*
  * function to precompute the tables they need.
  *****************************************************/
 template <typename IDType, MetricType METRIC_TYPE, class PQDecoder>
-struct IVFPQScannerT: QueryTables {
-    const uint8_t * list_codes;
-    const IDType * list_ids;
+struct IVFPQScannerT : QueryTables {
+    const uint8_t* list_codes;
+    const IDType* list_ids;
     size_t list_size;
-    IVFPQScannerT (const IndexIVFPQ & ivfpq, const IVFSearchParameters *params):
-        QueryTables (ivfpq, params)
-    {
+    IVFPQScannerT(const IndexIVFPQ& ivfpq, const IVFSearchParameters* params)
+            : QueryTables(ivfpq, params) {
         assert(METRIC_TYPE == metric_type);
     }
     float dis0;
-    void init_list (idx_t list_no, float coarse_dis,
-                      int mode) {
+    void init_list(idx_t list_no, float coarse_dis, int mode) {
         this->key = list_no;
         this->coarse_dis = coarse_dis;
         if (mode == 2) {
-            dis0 = precompute_list_tables ();
+            dis0 = precompute_list_tables();
         } else if (mode == 1) {
-            dis0 = precompute_list_table_pointers ();
+            dis0 = precompute_list_table_pointers();
         }
     }
@@ -892,15 +865,16 @@ struct IVFPQScannerT: QueryTables {
      *****************************************************/
     /// version of the scan where we use precomputed tables
-    template<class SearchResultType>
-    void scan_list_with_table (size_t ncode, const uint8_t *codes,
-                               SearchResultType & res) const
-    {
+    template <class SearchResultType>
+    void scan_list_with_table(
+            size_t ncode,
+            const uint8_t* codes,
+            SearchResultType& res) const {
         for (size_t j = 0; j < ncode; j++) {
             PQDecoder decoder(codes, pq.nbits);
             codes += pq.code_size;
             float dis = dis0;
-            const float *tab = sim_table;
+            const float* tab = sim_table;
             for (size_t m = 0; m < pq.M; m++) {
                 dis += tab[decoder.decode()];
@@ -911,43 +885,43 @@ struct IVFPQScannerT: QueryTables {
         }
     }
     /// tables are not precomputed, but pointers are provided to the
     /// relevant X_c|x_r tables
-    template<class SearchResultType>
-    void scan_list_with_pointer (size_t ncode, const uint8_t *codes,
-                                 SearchResultType & res) const
-    {
+    template <class SearchResultType>
+    void scan_list_with_pointer(
+            size_t ncode,
+            const uint8_t* codes,
+            SearchResultType& res) const {
         for (size_t j = 0; j < ncode; j++) {
             PQDecoder decoder(codes, pq.nbits);
             codes += pq.code_size;
             float dis = dis0;
-            const float *tab = sim_table_2;
+            const float* tab = sim_table_2;
             for (size_t m = 0; m < pq.M; m++) {
                 int ci = decoder.decode();
-                dis += sim_table_ptrs [m][ci] - 2 * tab [ci];
+                dis += sim_table_ptrs[m][ci] - 2 * tab[ci];
                 tab += pq.ksub;
             }
-            res.add (j, dis);
+            res.add(j, dis);
         }
     }
     /// nothing is precomputed: access residuals on-the-fly
-    template<class SearchResultType>
-    void scan_on_the_fly_dist (size_t ncode, const uint8_t *codes,
-                                 SearchResultType &res) const
-    {
-        const float *dvec;
+    template <class SearchResultType>
+    void scan_on_the_fly_dist(
+            size_t ncode,
+            const uint8_t* codes,
+            SearchResultType& res) const {
+        const float* dvec;
         float dis0 = 0;
         if (by_residual) {
             if (METRIC_TYPE == METRIC_INNER_PRODUCT) {
-                ivfpq.quantizer->reconstruct (key, residual_vec);
-                dis0 = fvec_inner_product (residual_vec, qi, d);
+                ivfpq.quantizer->reconstruct(key, residual_vec);
+                dis0 = fvec_inner_product(residual_vec, qi, d);
             } else {
-                ivfpq.quantizer->compute_residual (qi, residual_vec, key);
+                ivfpq.quantizer->compute_residual(qi, residual_vec, key);
             }
             dvec = residual_vec;
         } else {
@@ -956,17 +930,16 @@ struct IVFPQScannerT: QueryTables {
         }
         for (size_t j = 0; j < ncode; j++) {
-            pq.decode (codes, decoded_vec);
+            pq.decode(codes, decoded_vec);
             codes += pq.code_size;
             float dis;
             if (METRIC_TYPE == METRIC_INNER_PRODUCT) {
-                dis = dis0 + fvec_inner_product (decoded_vec, qi, d);
+                dis = dis0 + fvec_inner_product(decoded_vec, qi, d);
             } else {
-                dis = fvec_L2sqr (decoded_vec, dvec, d);
+                dis = fvec_L2sqr(decoded_vec, dvec, d);
             }
-            res.add (j, dis);
+            res.add(j, dis);
         }
     }
@@ -975,110 +948,99 @@ struct IVFPQScannerT: QueryTables {
      *****************************************************/
     template <class HammingComputer, class SearchResultType>
-    void scan_list_polysemous_hc (
-             size_t ncode, const uint8_t *codes,
-             SearchResultType & res) const
-    {
+    void scan_list_polysemous_hc(
+            size_t ncode,
+            const uint8_t* codes,
+            SearchResultType& res) const {
         int ht = ivfpq.polysemous_ht;
         size_t n_hamming_pass = 0, nup = 0;
         int code_size = pq.code_size;
-        HammingComputer hc (q_code.data(), code_size);
+        HammingComputer hc(q_code.data(), code_size);
         for (size_t j = 0; j < ncode; j++) {
-            const uint8_t *b_code = codes;
-            int hd = hc.hamming (b_code);
+            const uint8_t* b_code = codes;
+            int hd = hc.hamming(b_code);
             if (hd < ht) {
-                n_hamming_pass ++;
+                n_hamming_pass++;
                 PQDecoder decoder(codes, pq.nbits);
                 float dis = dis0;
-                const float *tab = sim_table;
+                const float* tab = sim_table;
                 for (size_t m = 0; m < pq.M; m++) {
                     dis += tab[decoder.decode()];
                     tab += pq.ksub;
                 }
-                res.add (j, dis);
+                res.add(j, dis);
             }
             codes += code_size;
         }
 #pragma omp critical
-        {
-            indexIVFPQ_stats.n_hamming_pass += n_hamming_pass;
-        }
+        { indexIVFPQ_stats.n_hamming_pass += n_hamming_pass; }
     }
-    template<class SearchResultType>
-    void scan_list_polysemous (
-             size_t ncode, const uint8_t *codes,
-             SearchResultType &res) const
-    {
+    template <class SearchResultType>
+    void scan_list_polysemous(
+            size_t ncode,
+            const uint8_t* codes,
+            SearchResultType& res) const {
         switch (pq.code_size) {
 #define HANDLE_CODE_SIZE(cs)                                            \
-        case cs:                                                        \
-            scan_list_polysemous_hc \
-            <HammingComputer ## cs, SearchResultType>   \
-                (ncode, codes, res);             \
-            break
-        HANDLE_CODE_SIZE(4);
-        HANDLE_CODE_SIZE(8);
-        HANDLE_CODE_SIZE(16);
-        HANDLE_CODE_SIZE(20);
-        HANDLE_CODE_SIZE(32);
-        HANDLE_CODE_SIZE(64);
+    case cs:                                                            \
+        scan_list_polysemous_hc<HammingComputer##cs, SearchResultType>( \
+                ncode, codes, res);                                     \
+        break
+            HANDLE_CODE_SIZE(4);
+            HANDLE_CODE_SIZE(8);
+            HANDLE_CODE_SIZE(16);
+            HANDLE_CODE_SIZE(20);
+            HANDLE_CODE_SIZE(32);
+            HANDLE_CODE_SIZE(64);
 #undef HANDLE_CODE_SIZE
-        default:
-            if (pq.code_size % 8 == 0)
-                scan_list_polysemous_hc
-                    <HammingComputerM8, SearchResultType>
-                    (ncode, codes, res);
-            else
-                scan_list_polysemous_hc
-                    <HammingComputerM4, SearchResultType>
-                    (ncode, codes, res);
-            break;
+            default:
+                scan_list_polysemous_hc<
+                        HammingComputerDefault,
+                        SearchResultType>(ncode, codes, res);
+                break;
         }
     }
 };
 /* We put as many parameters as possible in template. Hopefully the
  * gain in runtime is worth the code bloat. C is the comparator < or
  * >, it is directly related to METRIC_TYPE. precompute_mode is how
  * much we precompute (2 = precompute distance tables, 1 = precompute
  * pointers to distances, 0 = compute distances one by one).
  * Currently only 2 is supported */
-template<MetricType METRIC_TYPE, class C, class PQDecoder>
-struct IVFPQScanner:
-    IVFPQScannerT<Index::idx_t, METRIC_TYPE, PQDecoder>,
-    InvertedListScanner
-{
-    bool store_pairs;
+template <MetricType METRIC_TYPE, class C, class PQDecoder>
+struct IVFPQScanner : IVFPQScannerT<Index::idx_t, METRIC_TYPE, PQDecoder>,
+                      InvertedListScanner {
     int precompute_mode;
-    IVFPQScanner(const IndexIVFPQ & ivfpq, bool store_pairs,
-                 int precompute_mode):
-        IVFPQScannerT<Index::idx_t, METRIC_TYPE, PQDecoder>(ivfpq, nullptr),
-        store_pairs(store_pairs), precompute_mode(precompute_mode)
-    {
+    IVFPQScanner(const IndexIVFPQ& ivfpq, bool store_pairs, int precompute_mode)
+            : IVFPQScannerT<Index::idx_t, METRIC_TYPE, PQDecoder>(
+                      ivfpq,
+                      nullptr),
+              precompute_mode(precompute_mode) {
+        this->store_pairs = store_pairs;
     }
-    void set_query (const float *query) override {
-        this->init_query (query);
+    void set_query(const float* query) override {
+        this->init_query(query);
     }
-    void set_list (idx_t list_no, float coarse_dis) override {
-        this->init_list (list_no, coarse_dis, precompute_mode);
+    void set_list(idx_t list_no, float coarse_dis) override {
+        this->list_no = list_no;
+        this->init_list(list_no, coarse_dis, precompute_mode);
     }
-    float distance_to_code (const uint8_t *code) const override {
+    float distance_to_code(const uint8_t* code) const override {
         assert(precompute_mode == 2);
         float dis = this->dis0;
-        const float *tab = this->sim_table;
+        const float* tab = this->sim_table;
         PQDecoder decoder(code, this->pq.nbits);
         for (size_t m = 0; m < this->pq.M; m++) {
@@ -1088,112 +1050,100 @@ struct IVFPQScanner:
         return dis;
     }
-    size_t scan_codes (size_t ncode,
-                       const uint8_t *codes,
-                       const idx_t *ids,
-                       float *heap_sim, idx_t *heap_ids,
-                       size_t k) const override
-    {
+    size_t scan_codes(
+            size_t ncode,
+            const uint8_t* codes,
+            const idx_t* ids,
+            float* heap_sim,
+            idx_t* heap_ids,
+            size_t k) const override {
         KnnSearchResults<C> res = {
-            /* key */      this->key,
-            /* ids */      this->store_pairs ? nullptr : ids,
-            /* k */        k,
-            /* heap_sim */ heap_sim,
-            /* heap_ids */ heap_ids,
-            /* nup */      0
-        };
+                /* key */ this->key,
+                /* ids */ this->store_pairs ? nullptr : ids,
+                /* k */ k,
+                /* heap_sim */ heap_sim,
+                /* heap_ids */ heap_ids,
+                /* nup */ 0};
         if (this->polysemous_ht > 0) {
             assert(precompute_mode == 2);
-            this->scan_list_polysemous (ncode, codes, res);
+            this->scan_list_polysemous(ncode, codes, res);
         } else if (precompute_mode == 2) {
-            this->scan_list_with_table (ncode, codes, res);
+            this->scan_list_with_table(ncode, codes, res);
         } else if (precompute_mode == 1) {
-            this->scan_list_with_pointer (ncode, codes, res);
+            this->scan_list_with_pointer(ncode, codes, res);
         } else if (precompute_mode == 0) {
-            this->scan_on_the_fly_dist (ncode, codes, res);
+            this->scan_on_the_fly_dist(ncode, codes, res);
         } else {
             FAISS_THROW_MSG("bad precomp mode");
         }
         return res.nup;
     }
-    void scan_codes_range (size_t ncode,
-                           const uint8_t *codes,
-                           const idx_t *ids,
-                           float radius,
-                           RangeQueryResult & rres) const override
-    {
+    void scan_codes_range(
+            size_t ncode,
+            const uint8_t* codes,
+            const idx_t* ids,
+            float radius,
+            RangeQueryResult& rres) const override {
         RangeSearchResults<C> res = {
-            /* key */      this->key,
-            /* ids */      this->store_pairs ? nullptr : ids,
-            /* radius */   radius,
-            /* rres */     rres
-        };
+                /* key */ this->key,
+                /* ids */ this->store_pairs ? nullptr : ids,
+                /* radius */ radius,
+                /* rres */ rres};
         if (this->polysemous_ht > 0) {
             assert(precompute_mode == 2);
-            this->scan_list_polysemous (ncode, codes, res);
+            this->scan_list_polysemous(ncode, codes, res);
         } else if (precompute_mode == 2) {
-            this->scan_list_with_table (ncode, codes, res);
+            this->scan_list_with_table(ncode, codes, res);
         } else if (precompute_mode == 1) {
-            this->scan_list_with_pointer (ncode, codes, res);
+            this->scan_list_with_pointer(ncode, codes, res);
         } else if (precompute_mode == 0) {
-            this->scan_on_the_fly_dist (ncode, codes, res);
+            this->scan_on_the_fly_dist(ncode, codes, res);
         } else {
             FAISS_THROW_MSG("bad precomp mode");
         }
     }
 };
-template<class PQDecoder>
-InvertedListScanner *get_InvertedListScanner1 (const IndexIVFPQ &index,
-                                               bool store_pairs)
-{
-   if (index.metric_type == METRIC_INNER_PRODUCT) {
-        return new IVFPQScanner
-            <METRIC_INNER_PRODUCT, CMin<float, idx_t>, PQDecoder>
-            (index, store_pairs, 2);
+template <class PQDecoder>
+InvertedListScanner* get_InvertedListScanner1(
+        const IndexIVFPQ& index,
+        bool store_pairs) {
+    if (index.metric_type == METRIC_INNER_PRODUCT) {
+        return new IVFPQScanner<
+                METRIC_INNER_PRODUCT,
+                CMin<float, idx_t>,
+                PQDecoder>(index, store_pairs, 2);
     } else if (index.metric_type == METRIC_L2) {
-        return new IVFPQScanner
-            <METRIC_L2, CMax<float, idx_t>, PQDecoder>
-            (index, store_pairs, 2);
+        return new IVFPQScanner<METRIC_L2, CMax<float, idx_t>, PQDecoder>(
+                index, store_pairs, 2);
     }
     return nullptr;
 }
 } // anonymous namespace
-InvertedListScanner *
-IndexIVFPQ::get_InvertedListScanner (bool store_pairs) const
-{
+InvertedListScanner* IndexIVFPQ::get_InvertedListScanner(
+        bool store_pairs) const {
     if (pq.nbits == 8) {
-        return get_InvertedListScanner1<PQDecoder8> (*this, store_pairs);
+        return get_InvertedListScanner1<PQDecoder8>(*this, store_pairs);
     } else if (pq.nbits == 16) {
-        return get_InvertedListScanner1<PQDecoder16> (*this, store_pairs);
+        return get_InvertedListScanner1<PQDecoder16>(*this, store_pairs);
     } else {
-        return get_InvertedListScanner1<PQDecoderGeneric> (*this, store_pairs);
+        return get_InvertedListScanner1<PQDecoderGeneric>(*this, store_pairs);
     }
     return nullptr;
 }
 IndexIVFPQStats indexIVFPQ_stats;
-void IndexIVFPQStats::reset () {
-    memset (this, 0, sizeof (*this));
+void IndexIVFPQStats::reset() {
+    memset(this, 0, sizeof(*this));
 }
-IndexIVFPQ::IndexIVFPQ ()
-{
+IndexIVFPQ::IndexIVFPQ() {
     // initialize some runtime values
     use_precomputed_table = 0;
     scan_table_threshold = 0;
@@ -1202,43 +1152,40 @@ IndexIVFPQ::IndexIVFPQ ()
     polysemous_training = nullptr;
 }
 struct CodeCmp {
-    const uint8_t *tab;
+    const uint8_t* tab;
     size_t code_size;
-    bool operator () (int a, int b) const {
-        return cmp (a, b) > 0;
+    bool operator()(int a, int b) const {
+        return cmp(a, b) > 0;
     }
-    int cmp (int a, int b) const {
-        return memcmp (tab + a * code_size, tab + b * code_size,
-                       code_size);
+    int cmp(int a, int b) const {
+        return memcmp(tab + a * code_size, tab + b * code_size, code_size);
     }
 };
-size_t IndexIVFPQ::find_duplicates (idx_t *dup_ids, size_t *lims) const
-{
+size_t IndexIVFPQ::find_duplicates(idx_t* dup_ids, size_t* lims) const {
     size_t ngroup = 0;
     lims[0] = 0;
     for (size_t list_no = 0; list_no < nlist; list_no++) {
-        size_t n = invlists->list_size (list_no);
-        std::vector<int> ord (n);
-        for (int i = 0; i < n; i++) ord[i] = i;
-        InvertedLists::ScopedCodes codes (invlists, list_no);
-        CodeCmp cs = { codes.get(), code_size };
-        std::sort (ord.begin(), ord.end(), cs);
-        InvertedLists::ScopedIds list_ids (invlists, list_no);
-        int prev = -1;  // all elements from prev to i-1 are equal
+        size_t n = invlists->list_size(list_no);
+        std::vector<int> ord(n);
+        for (int i = 0; i < n; i++)
+            ord[i] = i;
+        InvertedLists::ScopedCodes codes(invlists, list_no);
+        CodeCmp cs = {codes.get(), code_size};
+        std::sort(ord.begin(), ord.end(), cs);
+        InvertedLists::ScopedIds list_ids(invlists, list_no);
+        int prev = -1; // all elements from prev to i-1 are equal
         for (int i = 0; i < n; i++) {
-            if (prev >= 0 && cs.cmp (ord [prev], ord [i]) == 0) {
+            if (prev >= 0 && cs.cmp(ord[prev], ord[i]) == 0) {
                 // same as previous => remember
                 if (prev + 1 == i) { // start new group
                     ngroup++;
                     lims[ngroup] = lims[ngroup - 1];
-                    dup_ids [lims [ngroup]++] = list_ids [ord [prev]];
+                    dup_ids[lims[ngroup]++] = list_ids[ord[prev]];
                 }
-                dup_ids [lims [ngroup]++] = list_ids [ord [i]];
+                dup_ids[lims[ngroup]++] = list_ids[ord[i]];
             } else { // not same as previous.
                 prev = i;
             }
@@ -1247,9 +1194,4 @@ size_t IndexIVFPQ::find_duplicates (idx_t *dup_ids, size_t *lims) const
     return ngroup;
 }
 } // namespace faiss