RubyGems - faiss - Versions diffs - 0.2.0 → 0.2.1 - Mend

faiss 0.2.0 → 0.2.1

Files changed (202) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +4 -0
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +292 -291
data/vendor/faiss/faiss/AutoTune.h +55 -56
data/vendor/faiss/faiss/Clustering.cpp +334 -195
data/vendor/faiss/faiss/Clustering.h +88 -35
data/vendor/faiss/faiss/IVFlib.cpp +171 -195
data/vendor/faiss/faiss/IVFlib.h +48 -51
data/vendor/faiss/faiss/Index.cpp +85 -103
data/vendor/faiss/faiss/Index.h +54 -48
data/vendor/faiss/faiss/Index2Layer.cpp +139 -164
data/vendor/faiss/faiss/Index2Layer.h +22 -22
data/vendor/faiss/faiss/IndexBinary.cpp +45 -37
data/vendor/faiss/faiss/IndexBinary.h +140 -132
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +73 -53
data/vendor/faiss/faiss/IndexBinaryFlat.h +29 -24
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +46 -43
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +16 -15
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +215 -232
data/vendor/faiss/faiss/IndexBinaryHNSW.h +25 -24
data/vendor/faiss/faiss/IndexBinaryHash.cpp +182 -177
data/vendor/faiss/faiss/IndexBinaryHash.h +41 -34
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +489 -461
data/vendor/faiss/faiss/IndexBinaryIVF.h +97 -68
data/vendor/faiss/faiss/IndexFlat.cpp +116 -147
data/vendor/faiss/faiss/IndexFlat.h +35 -46
data/vendor/faiss/faiss/IndexHNSW.cpp +372 -348
data/vendor/faiss/faiss/IndexHNSW.h +57 -41
data/vendor/faiss/faiss/IndexIVF.cpp +474 -454
data/vendor/faiss/faiss/IndexIVF.h +146 -113
data/vendor/faiss/faiss/IndexIVFFlat.cpp +248 -250
data/vendor/faiss/faiss/IndexIVFFlat.h +48 -51
data/vendor/faiss/faiss/IndexIVFPQ.cpp +457 -516
data/vendor/faiss/faiss/IndexIVFPQ.h +74 -66
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +406 -372
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +82 -57
data/vendor/faiss/faiss/IndexIVFPQR.cpp +104 -102
data/vendor/faiss/faiss/IndexIVFPQR.h +33 -28
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +125 -133
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +19 -21
data/vendor/faiss/faiss/IndexLSH.cpp +75 -96
data/vendor/faiss/faiss/IndexLSH.h +21 -26
data/vendor/faiss/faiss/IndexLattice.cpp +42 -56
data/vendor/faiss/faiss/IndexLattice.h +11 -16
data/vendor/faiss/faiss/IndexNNDescent.cpp +231 -0
data/vendor/faiss/faiss/IndexNNDescent.h +72 -0
data/vendor/faiss/faiss/IndexNSG.cpp +303 -0
data/vendor/faiss/faiss/IndexNSG.h +85 -0
data/vendor/faiss/faiss/IndexPQ.cpp +405 -464
data/vendor/faiss/faiss/IndexPQ.h +64 -67
data/vendor/faiss/faiss/IndexPQFastScan.cpp +143 -170
data/vendor/faiss/faiss/IndexPQFastScan.h +46 -32
data/vendor/faiss/faiss/IndexPreTransform.cpp +120 -150
data/vendor/faiss/faiss/IndexPreTransform.h +33 -36
data/vendor/faiss/faiss/IndexRefine.cpp +115 -131
data/vendor/faiss/faiss/IndexRefine.h +22 -23
data/vendor/faiss/faiss/IndexReplicas.cpp +147 -153
data/vendor/faiss/faiss/IndexReplicas.h +62 -56
data/vendor/faiss/faiss/IndexResidual.cpp +291 -0
data/vendor/faiss/faiss/IndexResidual.h +152 -0
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +120 -155
data/vendor/faiss/faiss/IndexScalarQuantizer.h +41 -45
data/vendor/faiss/faiss/IndexShards.cpp +256 -240
data/vendor/faiss/faiss/IndexShards.h +85 -73
data/vendor/faiss/faiss/MatrixStats.cpp +112 -97
data/vendor/faiss/faiss/MatrixStats.h +7 -10
data/vendor/faiss/faiss/MetaIndexes.cpp +135 -157
data/vendor/faiss/faiss/MetaIndexes.h +40 -34
data/vendor/faiss/faiss/MetricType.h +7 -7
data/vendor/faiss/faiss/VectorTransform.cpp +652 -474
data/vendor/faiss/faiss/VectorTransform.h +61 -89
data/vendor/faiss/faiss/clone_index.cpp +77 -73
data/vendor/faiss/faiss/clone_index.h +4 -9
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +33 -38
data/vendor/faiss/faiss/gpu/GpuAutoTune.h +11 -9
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +197 -170
data/vendor/faiss/faiss/gpu/GpuCloner.h +53 -35
data/vendor/faiss/faiss/gpu/GpuClonerOptions.cpp +12 -14
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +27 -25
data/vendor/faiss/faiss/gpu/GpuDistance.h +116 -112
data/vendor/faiss/faiss/gpu/GpuFaissAssert.h +1 -2
data/vendor/faiss/faiss/gpu/GpuIndex.h +134 -137
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +76 -73
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +173 -162
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +67 -64
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +89 -86
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +150 -141
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +101 -103
data/vendor/faiss/faiss/gpu/GpuIndicesOptions.h +17 -16
data/vendor/faiss/faiss/gpu/GpuResources.cpp +116 -128
data/vendor/faiss/faiss/gpu/GpuResources.h +182 -186
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +433 -422
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +131 -130
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.cpp +468 -456
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.h +25 -19
data/vendor/faiss/faiss/gpu/impl/RemapIndices.cpp +22 -20
data/vendor/faiss/faiss/gpu/impl/RemapIndices.h +9 -8
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +39 -44
data/vendor/faiss/faiss/gpu/perf/IndexWrapper.h +16 -14
data/vendor/faiss/faiss/gpu/perf/PerfClustering.cpp +77 -71
data/vendor/faiss/faiss/gpu/perf/PerfIVFPQAdd.cpp +109 -88
data/vendor/faiss/faiss/gpu/perf/WriteIndex.cpp +75 -64
data/vendor/faiss/faiss/gpu/test/TestCodePacking.cpp +230 -215
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +80 -86
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +284 -277
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +416 -416
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFPQ.cpp +611 -517
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFScalarQuantizer.cpp +166 -164
data/vendor/faiss/faiss/gpu/test/TestGpuMemoryException.cpp +61 -53
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +274 -238
data/vendor/faiss/faiss/gpu/test/TestUtils.h +73 -57
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +47 -50
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +79 -72
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.cpp +140 -146
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.h +69 -71
data/vendor/faiss/faiss/gpu/utils/StaticUtils.h +21 -16
data/vendor/faiss/faiss/gpu/utils/Timer.cpp +25 -29
data/vendor/faiss/faiss/gpu/utils/Timer.h +30 -29
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +270 -0
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +115 -0
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +90 -120
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +81 -65
data/vendor/faiss/faiss/impl/FaissAssert.h +73 -58
data/vendor/faiss/faiss/impl/FaissException.cpp +56 -48
data/vendor/faiss/faiss/impl/FaissException.h +41 -29
data/vendor/faiss/faiss/impl/HNSW.cpp +595 -611
data/vendor/faiss/faiss/impl/HNSW.h +179 -200
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +672 -0
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +172 -0
data/vendor/faiss/faiss/impl/NNDescent.cpp +487 -0
data/vendor/faiss/faiss/impl/NNDescent.h +154 -0
data/vendor/faiss/faiss/impl/NSG.cpp +682 -0
data/vendor/faiss/faiss/impl/NSG.h +199 -0
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +484 -454
data/vendor/faiss/faiss/impl/PolysemousTraining.h +52 -55
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +26 -47
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +469 -459
data/vendor/faiss/faiss/impl/ProductQuantizer.h +76 -87
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +448 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +130 -0
data/vendor/faiss/faiss/impl/ResultHandler.h +96 -132
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +648 -701
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +48 -46
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +129 -131
data/vendor/faiss/faiss/impl/ThreadedIndex.h +61 -55
data/vendor/faiss/faiss/impl/index_read.cpp +547 -479
data/vendor/faiss/faiss/impl/index_write.cpp +497 -407
data/vendor/faiss/faiss/impl/io.cpp +75 -94
data/vendor/faiss/faiss/impl/io.h +31 -41
data/vendor/faiss/faiss/impl/io_macros.h +40 -29
data/vendor/faiss/faiss/impl/lattice_Zn.cpp +137 -186
data/vendor/faiss/faiss/impl/lattice_Zn.h +40 -51
data/vendor/faiss/faiss/impl/platform_macros.h +29 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +77 -124
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +39 -48
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +41 -52
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +80 -117
data/vendor/faiss/faiss/impl/simd_result_handlers.h +109 -137
data/vendor/faiss/faiss/index_factory.cpp +269 -218
data/vendor/faiss/faiss/index_factory.h +6 -7
data/vendor/faiss/faiss/index_io.h +23 -26
data/vendor/faiss/faiss/invlists/BlockInvertedLists.cpp +67 -75
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +22 -24
data/vendor/faiss/faiss/invlists/DirectMap.cpp +96 -112
data/vendor/faiss/faiss/invlists/DirectMap.h +29 -33
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +307 -364
data/vendor/faiss/faiss/invlists/InvertedLists.h +151 -151
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +29 -34
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.h +17 -18
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +257 -293
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +50 -45
data/vendor/faiss/faiss/python/python_callbacks.cpp +23 -26
data/vendor/faiss/faiss/python/python_callbacks.h +9 -16
data/vendor/faiss/faiss/utils/AlignedTable.h +79 -44
data/vendor/faiss/faiss/utils/Heap.cpp +40 -48
data/vendor/faiss/faiss/utils/Heap.h +186 -209
data/vendor/faiss/faiss/utils/WorkerThread.cpp +67 -76
data/vendor/faiss/faiss/utils/WorkerThread.h +32 -33
data/vendor/faiss/faiss/utils/distances.cpp +301 -310
data/vendor/faiss/faiss/utils/distances.h +133 -118
data/vendor/faiss/faiss/utils/distances_simd.cpp +456 -516
data/vendor/faiss/faiss/utils/extra_distances-inl.h +117 -0
data/vendor/faiss/faiss/utils/extra_distances.cpp +113 -232
data/vendor/faiss/faiss/utils/extra_distances.h +30 -29
data/vendor/faiss/faiss/utils/hamming-inl.h +260 -209
data/vendor/faiss/faiss/utils/hamming.cpp +375 -469
data/vendor/faiss/faiss/utils/hamming.h +62 -85
data/vendor/faiss/faiss/utils/ordered_key_value.h +16 -18
data/vendor/faiss/faiss/utils/partitioning.cpp +393 -318
data/vendor/faiss/faiss/utils/partitioning.h +26 -21
data/vendor/faiss/faiss/utils/quantize_lut.cpp +78 -66
data/vendor/faiss/faiss/utils/quantize_lut.h +22 -20
data/vendor/faiss/faiss/utils/random.cpp +39 -63
data/vendor/faiss/faiss/utils/random.h +13 -16
data/vendor/faiss/faiss/utils/simdlib.h +4 -2
data/vendor/faiss/faiss/utils/simdlib_avx2.h +88 -85
data/vendor/faiss/faiss/utils/simdlib_emulated.h +226 -165
data/vendor/faiss/faiss/utils/simdlib_neon.h +832 -0
data/vendor/faiss/faiss/utils/utils.cpp +304 -287
data/vendor/faiss/faiss/utils/utils.h +53 -48
metadata +20 -2

data/vendor/faiss/faiss/IndexPQ.h CHANGED Viewed

@@ -5,8 +5,6 @@
  * LICENSE file in the root directory of this source tree.
  */
-// -*- c++ -*-
 #ifndef FAISS_INDEX_PQ_H
 #define FAISS_INDEX_PQ_H
@@ -15,18 +13,15 @@
 #include <vector>
 #include <faiss/Index.h>
-#include <faiss/impl/ProductQuantizer.h>
 #include <faiss/impl/PolysemousTraining.h>
+#include <faiss/impl/ProductQuantizer.h>
 #include <faiss/impl/platform_macros.h>
 namespace faiss {
 /** Index based on a product quantizer. Stored vectors are
  * approximated by PQ codes. */
-struct IndexPQ: Index {
+struct IndexPQ : Index {
     /// The product quantizer used to encode the vectors
     ProductQuantizer pq;
@@ -39,23 +34,23 @@ struct IndexPQ: Index {
      * @param M      number of subquantizers
      * @param nbits  number of bit per subvector index
      */
-    IndexPQ (int d,                    ///< dimensionality of the input vectors
-             size_t M,                 ///< number of subquantizers
-             size_t nbits,             ///< number of bit per subvector index
-             MetricType metric = METRIC_L2);
+    IndexPQ(int d,        ///< dimensionality of the input vectors
+            size_t M,     ///< number of subquantizers
+            size_t nbits, ///< number of bit per subvector index
+            MetricType metric = METRIC_L2);
-    IndexPQ ();
+    IndexPQ();
     void train(idx_t n, const float* x) override;
     void add(idx_t n, const float* x) override;
     void search(
-        idx_t n,
-        const float* x,
-        idx_t k,
-        float* distances,
-        idx_t* labels) const override;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const override;
     void reset() override;
@@ -66,16 +61,13 @@ struct IndexPQ: Index {
     size_t remove_ids(const IDSelector& sel) override;
     /* The standalone codec interface */
-    size_t sa_code_size () const override;
+    size_t sa_code_size() const override;
-    void sa_encode (idx_t n, const float *x,
-                          uint8_t *bytes) const override;
+    void sa_encode(idx_t n, const float* x, uint8_t* bytes) const override;
-    void sa_decode (idx_t n, const uint8_t *bytes,
-                            float *x) const override;
+    void sa_decode(idx_t n, const uint8_t* bytes, float* x) const override;
-    DistanceComputer * get_distance_computer() const override;
+    DistanceComputer* get_distance_computer() const override;
     /******************************************************
      * Polysemous codes implementation
@@ -87,12 +79,12 @@ struct IndexPQ: Index {
     /// how to perform the search in search_core
     enum Search_type_t {
-        ST_PQ,             ///< asymmetric product quantizer (default)
-        ST_HE,             ///< Hamming distance on codes
-        ST_generalized_HE, ///< nb of same codes
-        ST_SDC,            ///< symmetric product quantizer (SDC)
-        ST_polysemous,     ///< HE filter (using ht) + PQ combination
-        ST_polysemous_generalize,  ///< Filter on generalized Hamming
+        ST_PQ,                    ///< asymmetric product quantizer (default)
+        ST_HE,                    ///< Hamming distance on codes
+        ST_generalized_HE,        ///< nb of same codes
+        ST_SDC,                   ///< symmetric product quantizer (SDC)
+        ST_polysemous,            ///< HE filter (using ht) + PQ combination
+        ST_polysemous_generalize, ///< Filter on generalized Hamming
     };
     Search_type_t search_type;
@@ -105,16 +97,23 @@ struct IndexPQ: Index {
     int polysemous_ht;
     // actual polysemous search
-    void search_core_polysemous (idx_t n, const float *x, idx_t k,
-                               float *distances, idx_t *labels) const;
+    void search_core_polysemous(
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const;
     /// prepare query for a polysemous search, but instead of
     /// computing the result, just get the histogram of Hamming
     /// distances. May be computed on a provided dataset if xb != NULL
     /// @param dist_histogram (M * nbits + 1)
-    void hamming_distance_histogram (idx_t n, const float *x,
-                                     idx_t nb, const float *xb,
-                                     int64_t *dist_histogram);
+    void hamming_distance_histogram(
+            idx_t n,
+            const float* x,
+            idx_t nb,
+            const float* xb,
+            int64_t* dist_histogram);
     /** compute pairwise distances between queries and database
      *
@@ -122,80 +121,78 @@ struct IndexPQ: Index {
      * @param x    query vector, size n * d
      * @param dis  output distances, size n * ntotal
      */
-    void hamming_distance_table (idx_t n, const float *x,
-                                 int32_t *dis) const;
+    void hamming_distance_table(idx_t n, const float* x, int32_t* dis) const;
 };
 /// statistics are robust to internal threading, but not if
 /// IndexPQ::search is called by multiple threads
 struct IndexPQStats {
-    size_t nq;       // nb of queries run
-    size_t ncode;    // nb of codes visited
+    size_t nq;    // nb of queries run
+    size_t ncode; // nb of codes visited
     size_t n_hamming_pass; // nb of passed Hamming distance tests (for polysemy)
-    IndexPQStats () {reset (); }
-    void reset ();
+    IndexPQStats() {
+        reset();
+    }
+    void reset();
 };
 FAISS_API extern IndexPQStats indexPQ_stats;
 /** Quantizer where centroids are virtual: they are the Cartesian
  *  product of sub-centroids. */
-struct MultiIndexQuantizer: Index  {
+struct MultiIndexQuantizer : Index {
     ProductQuantizer pq;
-    MultiIndexQuantizer (int d,         ///< dimension of the input vectors
-                         size_t M,      ///< number of subquantizers
-                         size_t nbits); ///< number of bit per subvector index
+    MultiIndexQuantizer(
+            int d,         ///< dimension of the input vectors
+            size_t M,      ///< number of subquantizers
+            size_t nbits); ///< number of bit per subvector index
     void train(idx_t n, const float* x) override;
     void search(
-        idx_t n, const float* x, idx_t k,
-        float* distances, idx_t* labels) const override;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const override;
     /// add and reset will crash at runtime
     void add(idx_t n, const float* x) override;
     void reset() override;
-    MultiIndexQuantizer () {}
+    MultiIndexQuantizer() {}
     void reconstruct(idx_t key, float* recons) const override;
 };
 /** MultiIndexQuantizer where the PQ assignment is performed by sub-indexes
  */
-struct MultiIndexQuantizer2: MultiIndexQuantizer {
+struct MultiIndexQuantizer2 : MultiIndexQuantizer {
     /// M Indexes on d / M dimensions
     std::vector<Index*> assign_indexes;
     bool own_fields;
-    MultiIndexQuantizer2 (
-        int d, size_t M, size_t nbits,
-        Index **indexes);
+    MultiIndexQuantizer2(int d, size_t M, size_t nbits, Index** indexes);
-    MultiIndexQuantizer2 (
-        int d, size_t nbits,
-        Index *assign_index_0,
-        Index *assign_index_1);
+    MultiIndexQuantizer2(
+            int d,
+            size_t nbits,
+            Index* assign_index_0,
+            Index* assign_index_1);
     void train(idx_t n, const float* x) override;
     void search(
-        idx_t n, const float* x, idx_t k,
-        float* distances, idx_t* labels) const override;
+            idx_t n,
+            const float* x,
+            idx_t k,
+            float* distances,
+            idx_t* labels) const override;
 };
 } // namespace faiss
 #endif

data/vendor/faiss/faiss/IndexPQFastScan.cpp CHANGED Viewed

@@ -5,24 +5,21 @@
  * LICENSE file in the root directory of this source tree.
  */
 #include <faiss/IndexPQFastScan.h>
+#include <limits.h>
 #include <cassert>
 #include <memory>
-#include <limits.h>
 #include <omp.h>
 #include <faiss/impl/FaissAssert.h>
-#include <faiss/utils/utils.h>
 #include <faiss/utils/random.h>
+#include <faiss/utils/utils.h>
+#include <faiss/impl/pq4_fast_scan.h>
 #include <faiss/impl/simd_result_handlers.h>
 #include <faiss/utils/quantize_lut.h>
-#include <faiss/impl/pq4_fast_scan.h>
 namespace faiss {
@@ -33,25 +30,24 @@ inline size_t roundup(size_t a, size_t b) {
 }
 IndexPQFastScan::IndexPQFastScan(
-        int d, size_t M, size_t nbits,
+        int d,
+        size_t M,
+        size_t nbits,
         MetricType metric,
-        int bbs):
-    Index(d, metric), pq(d, M, nbits),
-    bbs(bbs), ntotal2(0), M2(roundup(M, 2))
-{
+        int bbs)
+        : Index(d, metric),
+          pq(d, M, nbits),
+          bbs(bbs),
+          ntotal2(0),
+          M2(roundup(M, 2)) {
     FAISS_THROW_IF_NOT(nbits == 4);
     is_trained = false;
 }
-IndexPQFastScan::IndexPQFastScan():
-    bbs(0), ntotal2(0), M2(0)
-{}
+IndexPQFastScan::IndexPQFastScan() : bbs(0), ntotal2(0), M2(0) {}
-IndexPQFastScan::IndexPQFastScan(const IndexPQ & orig, int bbs):
-    Index(orig.d, orig.metric_type),
-    pq(orig.pq),
-    bbs(bbs)
-{
+IndexPQFastScan::IndexPQFastScan(const IndexPQ& orig, int bbs)
+        : Index(orig.d, orig.metric_type), pq(orig.pq), bbs(bbs) {
     FAISS_THROW_IF_NOT(orig.pq.nbits == 4);
     ntotal = orig.ntotal;
     is_trained = orig.is_trained;
@@ -70,16 +66,10 @@ IndexPQFastScan::IndexPQFastScan(const IndexPQ & orig, int bbs):
     codes.resize(ntotal2 * M2 / 2);
     // printf("M=%d M2=%d code_size=%d\n", M, M2, pq.code_size);
-    pq4_pack_codes(
-            orig.codes.data(),
-            ntotal, M,
-            ntotal2, bbs, M2,
-            codes.get()
-    );
+    pq4_pack_codes(orig.codes.data(), ntotal, M, ntotal2, bbs, M2, codes.get());
 }
-void IndexPQFastScan::train (idx_t n, const float *x)
-{
+void IndexPQFastScan::train(idx_t n, const float* x) {
     if (is_trained) {
         return;
     }
@@ -87,11 +77,10 @@ void IndexPQFastScan::train (idx_t n, const float *x)
     is_trained = true;
 }
-void IndexPQFastScan::add (idx_t n, const float *x) {
-    FAISS_THROW_IF_NOT (is_trained);
+void IndexPQFastScan::add(idx_t n, const float* x) {
+    FAISS_THROW_IF_NOT(is_trained);
     AlignedTable<uint8_t> tmp_codes(n * pq.code_size);
-    pq.compute_codes (x, tmp_codes.get(), n);
+    pq.compute_codes(x, tmp_codes.get(), n);
     ntotal2 = roundup(ntotal + n, bbs);
     size_t new_size = ntotal2 * M2 / 2;
     size_t old_size = codes.size();
@@ -100,39 +89,35 @@ void IndexPQFastScan::add (idx_t n, const float *x) {
         memset(codes.get() + old_size, 0, new_size - old_size);
     }
     pq4_pack_codes_range(
-        tmp_codes.get(), pq.M, ntotal, ntotal + n,
-        bbs, M2, codes.get()
-    );
+            tmp_codes.get(), pq.M, ntotal, ntotal + n, bbs, M2, codes.get());
     ntotal += n;
 }
-void IndexPQFastScan::reset()
-{
+void IndexPQFastScan::reset() {
     codes.resize(0);
     ntotal = 0;
- }
+}
 namespace {
 // from impl/ProductQuantizer.cpp
 template <class C, typename dis_t>
 void pq_estimators_from_tables_generic(
-        const ProductQuantizer& pq, size_t nbits,
-        const uint8_t *codes, size_t ncodes,
-        const dis_t *dis_table, size_t k,
-        typename C::T *heap_dis, int64_t *heap_ids)
-{
+        const ProductQuantizer& pq,
+        size_t nbits,
+        const uint8_t* codes,
+        size_t ncodes,
+        const dis_t* dis_table,
+        size_t k,
+        typename C::T* heap_dis,
+        int64_t* heap_ids) {
     using accu_t = typename C::T;
     const size_t M = pq.M;
     const size_t ksub = pq.ksub;
     for (size_t j = 0; j < ncodes; ++j) {
-        PQDecoderGeneric decoder(
-                codes + j * pq.code_size, nbits
-        );
+        PQDecoderGeneric decoder(codes + j * pq.code_size, nbits);
         accu_t dis = 0;
-        const dis_t * __restrict dt = dis_table;
+        const dis_t* __restrict dt = dis_table;
         for (size_t m = 0; m < M; m++) {
             uint64_t c = decoder.decode();
             dis += dt[c];
@@ -146,53 +131,55 @@ void pq_estimators_from_tables_generic(
     }
 }
 } // anonymous namespace
 using namespace quantize_lut;
 void IndexPQFastScan::compute_quantized_LUT(
-        idx_t n, const float* x,
-        uint8_t *lut, float *normalizers) const
-{
+        idx_t n,
+        const float* x,
+        uint8_t* lut,
+        float* normalizers) const {
     size_t dim12 = pq.ksub * pq.M;
-    std::unique_ptr<float[]> dis_tables(new float [n * dim12]);
+    std::unique_ptr<float[]> dis_tables(new float[n * dim12]);
     if (metric_type == METRIC_L2) {
-        pq.compute_distance_tables (n, x, dis_tables.get());
+        pq.compute_distance_tables(n, x, dis_tables.get());
     } else {
-        pq.compute_inner_prod_tables (n, x, dis_tables.get());
+        pq.compute_inner_prod_tables(n, x, dis_tables.get());
     }
-    for(uint64_t i = 0; i < n; i++) {
+    for (uint64_t i = 0; i < n; i++) {
         round_uint8_per_column(
-                dis_tables.get() + i * dim12, pq.M, pq.ksub,
-                &normalizers[2 * i], &normalizers[2 * i + 1]
-        );
+                dis_tables.get() + i * dim12,
+                pq.M,
+                pq.ksub,
+                &normalizers[2 * i],
+                &normalizers[2 * i + 1]);
     }
-    for(uint64_t i = 0; i < n; i++) {
-        const float *t_in = dis_tables.get() + i * dim12;
-        uint8_t *t_out = lut + i * M2 * pq.ksub;
+    for (uint64_t i = 0; i < n; i++) {
+        const float* t_in = dis_tables.get() + i * dim12;
+        uint8_t* t_out = lut + i * M2 * pq.ksub;
-        for(int j = 0; j < dim12; j++) {
+        for (int j = 0; j < dim12; j++) {
             t_out[j] = int(t_in[j]);
         }
         memset(t_out + dim12, 0, (M2 - pq.M) * pq.ksub);
     }
 }
 /******************************************************************************
  * Search driver routine
  ******************************************************************************/
 void IndexPQFastScan::search(
-                idx_t n, const float* x, idx_t k,
-                float* distances, idx_t* labels) const
-{
+        idx_t n,
+        const float* x,
+        idx_t k,
+        float* distances,
+        idx_t* labels) const {
+    FAISS_THROW_IF_NOT(k > 0);
     if (metric_type == METRIC_L2) {
         search_dispatch_implem<true>(n, x, k, distances, labels);
     } else {
@@ -200,20 +187,20 @@ void IndexPQFastScan::search(
     }
 }
-template<bool is_max>
+template <bool is_max>
 void IndexPQFastScan::search_dispatch_implem(
-                idx_t n,
-                const float* x,
-                idx_t k,
-                float* distances,
-                idx_t* labels) const
-{
-    using Cfloat = typename std::conditional<is_max,
-        CMax<float, int64_t>, CMin<float, int64_t> >::type;
-    using C = typename std::conditional<is_max,
-        CMax<uint16_t, int>, CMin<uint16_t, int> >::type;
+        idx_t n,
+        const float* x,
+        idx_t k,
+        float* distances,
+        idx_t* labels) const {
+    using Cfloat = typename std::conditional<
+            is_max,
+            CMax<float, int64_t>,
+            CMin<float, int64_t>>::type;
+    using C = typename std::
+            conditional<is_max, CMax<uint16_t, int>, CMin<uint16_t, int>>::type;
     if (n == 0) {
         return;
@@ -229,26 +216,24 @@ void IndexPQFastScan::search_dispatch_implem(
             impl = 14;
         }
         if (k > 20) {
-            impl ++;
+            impl++;
         }
     }
     if (implem == 1) {
         FAISS_THROW_IF_NOT(orig_codes);
         FAISS_THROW_IF_NOT(is_max);
-        float_maxheap_array_t res = {
-            size_t(n), size_t(k), labels, distances };
-        pq.search (x, n, orig_codes, ntotal, &res, true);
+        float_maxheap_array_t res = {size_t(n), size_t(k), labels, distances};
+        pq.search(x, n, orig_codes, ntotal, &res, true);
     } else if (implem == 2 || implem == 3 || implem == 4) {
         FAISS_THROW_IF_NOT(orig_codes);
         size_t dim12 = pq.ksub * pq.M;
-        std::unique_ptr<float[]> dis_tables(new float [n * dim12]);
+        std::unique_ptr<float[]> dis_tables(new float[n * dim12]);
         if (is_max) {
-            pq.compute_distance_tables (n, x, dis_tables.get());
+            pq.compute_distance_tables(n, x, dis_tables.get());
         } else {
-            pq.compute_inner_prod_tables (n, x, dis_tables.get());
+            pq.compute_inner_prod_tables(n, x, dis_tables.get());
         }
         std::vector<float> normalizers(n * 2);
@@ -256,34 +241,39 @@ void IndexPQFastScan::search_dispatch_implem(
         if (implem == 2) {
             // default float
         } else if (implem == 3 || implem == 4) {
-            for(uint64_t i = 0; i < n; i++) {
+            for (uint64_t i = 0; i < n; i++) {
                 round_uint8_per_column(
-                        dis_tables.get() + i * dim12, pq.M,
+                        dis_tables.get() + i * dim12,
+                        pq.M,
                         pq.ksub,
-                        &normalizers[2 * i], &normalizers[2 * i + 1]
-                );
+                        &normalizers[2 * i],
+                        &normalizers[2 * i + 1]);
             }
         }
         for (int64_t i = 0; i < n; i++) {
-            int64_t *heap_ids = labels + i * k;
-            float *heap_dis = distances + i * k;
+            int64_t* heap_ids = labels + i * k;
+            float* heap_dis = distances + i * k;
-            heap_heapify<Cfloat> (k, heap_dis, heap_ids);
+            heap_heapify<Cfloat>(k, heap_dis, heap_ids);
             pq_estimators_from_tables_generic<Cfloat>(
-                pq, pq.nbits, orig_codes, ntotal,
-                dis_tables.get() + i * dim12,
-                k, heap_dis, heap_ids
-            );
+                    pq,
+                    pq.nbits,
+                    orig_codes,
+                    ntotal,
+                    dis_tables.get() + i * dim12,
+                    k,
+                    heap_dis,
+                    heap_ids);
-            heap_reorder<Cfloat> (k, heap_dis, heap_ids);
+            heap_reorder<Cfloat>(k, heap_dis, heap_ids);
             if (implem == 4) {
                 float a = normalizers[2 * i];
                 float b = normalizers[2 * i + 1];
-                for(int j = 0; j < k; j++) {
+                for (int j = 0; j < k; j++) {
                     heap_dis[j] = heap_dis[j] / a + b;
                 }
             }
@@ -303,30 +293,30 @@ void IndexPQFastScan::search_dispatch_implem(
             for (int slice = 0; slice < nt; slice++) {
                 idx_t i0 = n * slice / nt;
                 idx_t i1 = n * (slice + 1) / nt;
-                float *dis_i = distances + i0 * k;
-                idx_t *lab_i = labels + i0 * k;
+                float* dis_i = distances + i0 * k;
+                idx_t* lab_i = labels + i0 * k;
                 if (impl == 12 || impl == 13) {
                     search_implem_12<C>(
-                        i1 - i0, x + i0 * d, k, dis_i, lab_i, impl);
+                            i1 - i0, x + i0 * d, k, dis_i, lab_i, impl);
                 } else {
                     search_implem_14<C>(
-                        i1 - i0, x + i0 * d, k, dis_i, lab_i, impl);
+                            i1 - i0, x + i0 * d, k, dis_i, lab_i, impl);
                 }
             }
         }
     } else {
         FAISS_THROW_FMT("invalid implem %d impl=%d", implem, impl);
     }
 }
-template<class C>
+template <class C>
 void IndexPQFastScan::search_implem_12(
-                idx_t n, const float* x, idx_t k,
-                float* distances, idx_t* labels,
-                int impl) const
-{
+        idx_t n,
+        const float* x,
+        idx_t k,
+        float* distances,
+        idx_t* labels,
+        int impl) const {
     FAISS_THROW_IF_NOT(bbs == 32);
     // handle qbs2 blocking by recursive call
@@ -335,23 +325,25 @@ void IndexPQFastScan::search_implem_12(
         for (int64_t i0 = 0; i0 < n; i0 += qbs2) {
             int64_t i1 = std::min(i0 + qbs2, n);
             search_implem_12<C>(
-                    i1 - i0, x + d * i0, k,
-                    distances + i0 * k, labels + i0 * k, impl
-            );
+                    i1 - i0,
+                    x + d * i0,
+                    k,
+                    distances + i0 * k,
+                    labels + i0 * k,
+                    impl);
         }
         return;
     }
     size_t dim12 = pq.ksub * M2;
     AlignedTable<uint8_t> quantized_dis_tables(n * dim12);
-    std::unique_ptr<float []> normalizers(new float[2 * n]);
+    std::unique_ptr<float[]> normalizers(new float[2 * n]);
     if (skip & 1) {
         quantized_dis_tables.clear();
     } else {
         compute_quantized_LUT(
-            n, x, quantized_dis_tables.get(), normalizers.get()
-        );
+                n, x, quantized_dis_tables.get(), normalizers.get());
     }
     AlignedTable<uint8_t> LUT(n * dim12);
@@ -365,9 +357,8 @@ void IndexPQFastScan::search_implem_12(
         qbs = pq4_preferred_qbs(n);
     }
-    int LUT_nq = pq4_pack_LUT_qbs(
-        qbs, M2, quantized_dis_tables.get(), LUT.get()
-    );
+    int LUT_nq =
+            pq4_pack_LUT_qbs(qbs, M2, quantized_dis_tables.get(), LUT.get());
     FAISS_THROW_IF_NOT(LUT_nq == n);
     if (k == 1) {
@@ -377,37 +368,30 @@ void IndexPQFastScan::search_implem_12(
         } else {
             handler.disable = bool(skip & 2);
             pq4_accumulate_loop_qbs(
-                qbs, ntotal2, M2,
-                codes.get(), LUT.get(),
-                handler
-            );
+                    qbs, ntotal2, M2, codes.get(), LUT.get(), handler);
         }
         handler.to_flat_arrays(distances, labels, normalizers.get());
     } else if (impl == 12) {
         std::vector<uint16_t> tmp_dis(n * k);
         std::vector<int32_t> tmp_ids(n * k);
         if (skip & 4) {
             // skip
         } else {
-            HeapHandler<C> handler(n, tmp_dis.data(), tmp_ids.data(), k, ntotal);
+            HeapHandler<C> handler(
+                    n, tmp_dis.data(), tmp_ids.data(), k, ntotal);
             handler.disable = bool(skip & 2);
             pq4_accumulate_loop_qbs(
-                qbs, ntotal2, M2,
-                codes.get(), LUT.get(),
-                handler
-            );
+                    qbs, ntotal2, M2, codes.get(), LUT.get(), handler);
             if (!(skip & 8)) {
                 handler.to_flat_arrays(distances, labels, normalizers.get());
             }
         }
     } else { // impl == 13
         ReservoirHandler<C> handler(n, ntotal, k, 2 * k);
@@ -417,10 +401,7 @@ void IndexPQFastScan::search_implem_12(
             // skip
         } else {
             pq4_accumulate_loop_qbs(
-                qbs, ntotal2, M2,
-                codes.get(), LUT.get(),
-                handler
-            );
+                    qbs, ntotal2, M2, codes.get(), LUT.get(), handler);
         }
         if (!(skip & 8)) {
@@ -431,18 +412,19 @@ void IndexPQFastScan::search_implem_12(
         FastScan_stats.t1 += handler.times[1];
         FastScan_stats.t2 += handler.times[2];
         FastScan_stats.t3 += handler.times[3];
     }
 }
 FastScanStats FastScan_stats;
-template<class C>
+template <class C>
 void IndexPQFastScan::search_implem_14(
-                idx_t n, const float* x, idx_t k,
-                float* distances, idx_t* labels, int impl) const
-{
+        idx_t n,
+        const float* x,
+        idx_t k,
+        float* distances,
+        idx_t* labels,
+        int impl) const {
     FAISS_THROW_IF_NOT(bbs % 32 == 0);
     int qbs2 = qbs == 0 ? 4 : qbs;
@@ -452,23 +434,25 @@ void IndexPQFastScan::search_implem_14(
         for (int64_t i0 = 0; i0 < n; i0 += qbs2) {
             int64_t i1 = std::min(i0 + qbs2, n);
             search_implem_14<C>(
-                    i1 - i0, x + d * i0, k,
-                    distances + i0 * k, labels + i0 * k, impl
-            );
+                    i1 - i0,
+                    x + d * i0,
+                    k,
+                    distances + i0 * k,
+                    labels + i0 * k,
+                    impl);
         }
         return;
     }
     size_t dim12 = pq.ksub * M2;
     AlignedTable<uint8_t> quantized_dis_tables(n * dim12);
-    std::unique_ptr<float []> normalizers(new float[2 * n]);
+    std::unique_ptr<float[]> normalizers(new float[2 * n]);
     if (skip & 1) {
         quantized_dis_tables.clear();
     } else {
         compute_quantized_LUT(
-            n, x, quantized_dis_tables.get(), normalizers.get()
-        );
+                n, x, quantized_dis_tables.get(), normalizers.get());
     }
     AlignedTable<uint8_t> LUT(n * dim12);
@@ -480,37 +464,30 @@ void IndexPQFastScan::search_implem_14(
             // pass
         } else {
             handler.disable = bool(skip & 2);
-            pq4_accumulate_loop (
-                n, ntotal2, bbs, M2,
-                codes.get(), LUT.get(),
-                handler
-            );
+            pq4_accumulate_loop(
+                    n, ntotal2, bbs, M2, codes.get(), LUT.get(), handler);
         }
         handler.to_flat_arrays(distances, labels, normalizers.get());
     } else if (impl == 14) {
         std::vector<uint16_t> tmp_dis(n * k);
         std::vector<int32_t> tmp_ids(n * k);
         if (skip & 4) {
             // skip
         } else if (k > 1) {
-            HeapHandler<C> handler(n, tmp_dis.data(), tmp_ids.data(), k, ntotal);
+            HeapHandler<C> handler(
+                    n, tmp_dis.data(), tmp_ids.data(), k, ntotal);
             handler.disable = bool(skip & 2);
-            pq4_accumulate_loop (
-                n, ntotal2, bbs, M2,
-                codes.get(), LUT.get(),
-                handler
-            );
+            pq4_accumulate_loop(
+                    n, ntotal2, bbs, M2, codes.get(), LUT.get(), handler);
             if (!(skip & 8)) {
                 handler.to_flat_arrays(distances, labels, normalizers.get());
             }
         }
     } else { // impl == 15
         ReservoirHandler<C> handler(n, ntotal, k, 2 * k);
@@ -519,11 +496,8 @@ void IndexPQFastScan::search_implem_14(
         if (skip & 4) {
             // skip
         } else {
-            pq4_accumulate_loop (
-                n, ntotal2, bbs, M2,
-                codes.get(), LUT.get(),
-                handler
-            );
+            pq4_accumulate_loop(
+                    n, ntotal2, bbs, M2, codes.get(), LUT.get(), handler);
         }
         if (!(skip & 8)) {
@@ -532,5 +506,4 @@ void IndexPQFastScan::search_implem_14(
     }
 }
 } // namespace faiss