RubyGems - faiss - Versions diffs - 0.2.0 → 0.2.1 - Mend

faiss 0.2.0 → 0.2.1

Files changed (202) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +4 -0
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +292 -291
data/vendor/faiss/faiss/AutoTune.h +55 -56
data/vendor/faiss/faiss/Clustering.cpp +334 -195
data/vendor/faiss/faiss/Clustering.h +88 -35
data/vendor/faiss/faiss/IVFlib.cpp +171 -195
data/vendor/faiss/faiss/IVFlib.h +48 -51
data/vendor/faiss/faiss/Index.cpp +85 -103
data/vendor/faiss/faiss/Index.h +54 -48
data/vendor/faiss/faiss/Index2Layer.cpp +139 -164
data/vendor/faiss/faiss/Index2Layer.h +22 -22
data/vendor/faiss/faiss/IndexBinary.cpp +45 -37
data/vendor/faiss/faiss/IndexBinary.h +140 -132
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +73 -53
data/vendor/faiss/faiss/IndexBinaryFlat.h +29 -24
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +46 -43
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +16 -15
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +215 -232
data/vendor/faiss/faiss/IndexBinaryHNSW.h +25 -24
data/vendor/faiss/faiss/IndexBinaryHash.cpp +182 -177
data/vendor/faiss/faiss/IndexBinaryHash.h +41 -34
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +489 -461
data/vendor/faiss/faiss/IndexBinaryIVF.h +97 -68
data/vendor/faiss/faiss/IndexFlat.cpp +116 -147
data/vendor/faiss/faiss/IndexFlat.h +35 -46
data/vendor/faiss/faiss/IndexHNSW.cpp +372 -348
data/vendor/faiss/faiss/IndexHNSW.h +57 -41
data/vendor/faiss/faiss/IndexIVF.cpp +474 -454
data/vendor/faiss/faiss/IndexIVF.h +146 -113
data/vendor/faiss/faiss/IndexIVFFlat.cpp +248 -250
data/vendor/faiss/faiss/IndexIVFFlat.h +48 -51
data/vendor/faiss/faiss/IndexIVFPQ.cpp +457 -516
data/vendor/faiss/faiss/IndexIVFPQ.h +74 -66
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +406 -372
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +82 -57
data/vendor/faiss/faiss/IndexIVFPQR.cpp +104 -102
data/vendor/faiss/faiss/IndexIVFPQR.h +33 -28
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +125 -133
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +19 -21
data/vendor/faiss/faiss/IndexLSH.cpp +75 -96
data/vendor/faiss/faiss/IndexLSH.h +21 -26
data/vendor/faiss/faiss/IndexLattice.cpp +42 -56
data/vendor/faiss/faiss/IndexLattice.h +11 -16
data/vendor/faiss/faiss/IndexNNDescent.cpp +231 -0
data/vendor/faiss/faiss/IndexNNDescent.h +72 -0
data/vendor/faiss/faiss/IndexNSG.cpp +303 -0
data/vendor/faiss/faiss/IndexNSG.h +85 -0
data/vendor/faiss/faiss/IndexPQ.cpp +405 -464
data/vendor/faiss/faiss/IndexPQ.h +64 -67
data/vendor/faiss/faiss/IndexPQFastScan.cpp +143 -170
data/vendor/faiss/faiss/IndexPQFastScan.h +46 -32
data/vendor/faiss/faiss/IndexPreTransform.cpp +120 -150
data/vendor/faiss/faiss/IndexPreTransform.h +33 -36
data/vendor/faiss/faiss/IndexRefine.cpp +115 -131
data/vendor/faiss/faiss/IndexRefine.h +22 -23
data/vendor/faiss/faiss/IndexReplicas.cpp +147 -153
data/vendor/faiss/faiss/IndexReplicas.h +62 -56
data/vendor/faiss/faiss/IndexResidual.cpp +291 -0
data/vendor/faiss/faiss/IndexResidual.h +152 -0
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +120 -155
data/vendor/faiss/faiss/IndexScalarQuantizer.h +41 -45
data/vendor/faiss/faiss/IndexShards.cpp +256 -240
data/vendor/faiss/faiss/IndexShards.h +85 -73
data/vendor/faiss/faiss/MatrixStats.cpp +112 -97
data/vendor/faiss/faiss/MatrixStats.h +7 -10
data/vendor/faiss/faiss/MetaIndexes.cpp +135 -157
data/vendor/faiss/faiss/MetaIndexes.h +40 -34
data/vendor/faiss/faiss/MetricType.h +7 -7
data/vendor/faiss/faiss/VectorTransform.cpp +652 -474
data/vendor/faiss/faiss/VectorTransform.h +61 -89
data/vendor/faiss/faiss/clone_index.cpp +77 -73
data/vendor/faiss/faiss/clone_index.h +4 -9
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +33 -38
data/vendor/faiss/faiss/gpu/GpuAutoTune.h +11 -9
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +197 -170
data/vendor/faiss/faiss/gpu/GpuCloner.h +53 -35
data/vendor/faiss/faiss/gpu/GpuClonerOptions.cpp +12 -14
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +27 -25
data/vendor/faiss/faiss/gpu/GpuDistance.h +116 -112
data/vendor/faiss/faiss/gpu/GpuFaissAssert.h +1 -2
data/vendor/faiss/faiss/gpu/GpuIndex.h +134 -137
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +76 -73
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +173 -162
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +67 -64
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +89 -86
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +150 -141
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +101 -103
data/vendor/faiss/faiss/gpu/GpuIndicesOptions.h +17 -16
data/vendor/faiss/faiss/gpu/GpuResources.cpp +116 -128
data/vendor/faiss/faiss/gpu/GpuResources.h +182 -186
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +433 -422
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +131 -130
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.cpp +468 -456
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.h +25 -19
data/vendor/faiss/faiss/gpu/impl/RemapIndices.cpp +22 -20
data/vendor/faiss/faiss/gpu/impl/RemapIndices.h +9 -8
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +39 -44
data/vendor/faiss/faiss/gpu/perf/IndexWrapper.h +16 -14
data/vendor/faiss/faiss/gpu/perf/PerfClustering.cpp +77 -71
data/vendor/faiss/faiss/gpu/perf/PerfIVFPQAdd.cpp +109 -88
data/vendor/faiss/faiss/gpu/perf/WriteIndex.cpp +75 -64
data/vendor/faiss/faiss/gpu/test/TestCodePacking.cpp +230 -215
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +80 -86
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +284 -277
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +416 -416
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFPQ.cpp +611 -517
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFScalarQuantizer.cpp +166 -164
data/vendor/faiss/faiss/gpu/test/TestGpuMemoryException.cpp +61 -53
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +274 -238
data/vendor/faiss/faiss/gpu/test/TestUtils.h +73 -57
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +47 -50
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +79 -72
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.cpp +140 -146
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.h +69 -71
data/vendor/faiss/faiss/gpu/utils/StaticUtils.h +21 -16
data/vendor/faiss/faiss/gpu/utils/Timer.cpp +25 -29
data/vendor/faiss/faiss/gpu/utils/Timer.h +30 -29
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +270 -0
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +115 -0
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +90 -120
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +81 -65
data/vendor/faiss/faiss/impl/FaissAssert.h +73 -58
data/vendor/faiss/faiss/impl/FaissException.cpp +56 -48
data/vendor/faiss/faiss/impl/FaissException.h +41 -29
data/vendor/faiss/faiss/impl/HNSW.cpp +595 -611
data/vendor/faiss/faiss/impl/HNSW.h +179 -200
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +672 -0
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +172 -0
data/vendor/faiss/faiss/impl/NNDescent.cpp +487 -0
data/vendor/faiss/faiss/impl/NNDescent.h +154 -0
data/vendor/faiss/faiss/impl/NSG.cpp +682 -0
data/vendor/faiss/faiss/impl/NSG.h +199 -0
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +484 -454
data/vendor/faiss/faiss/impl/PolysemousTraining.h +52 -55
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +26 -47
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +469 -459
data/vendor/faiss/faiss/impl/ProductQuantizer.h +76 -87
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +448 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +130 -0
data/vendor/faiss/faiss/impl/ResultHandler.h +96 -132
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +648 -701
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +48 -46
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +129 -131
data/vendor/faiss/faiss/impl/ThreadedIndex.h +61 -55
data/vendor/faiss/faiss/impl/index_read.cpp +547 -479
data/vendor/faiss/faiss/impl/index_write.cpp +497 -407
data/vendor/faiss/faiss/impl/io.cpp +75 -94
data/vendor/faiss/faiss/impl/io.h +31 -41
data/vendor/faiss/faiss/impl/io_macros.h +40 -29
data/vendor/faiss/faiss/impl/lattice_Zn.cpp +137 -186
data/vendor/faiss/faiss/impl/lattice_Zn.h +40 -51
data/vendor/faiss/faiss/impl/platform_macros.h +29 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +77 -124
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +39 -48
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +41 -52
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +80 -117
data/vendor/faiss/faiss/impl/simd_result_handlers.h +109 -137
data/vendor/faiss/faiss/index_factory.cpp +269 -218
data/vendor/faiss/faiss/index_factory.h +6 -7
data/vendor/faiss/faiss/index_io.h +23 -26
data/vendor/faiss/faiss/invlists/BlockInvertedLists.cpp +67 -75
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +22 -24
data/vendor/faiss/faiss/invlists/DirectMap.cpp +96 -112
data/vendor/faiss/faiss/invlists/DirectMap.h +29 -33
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +307 -364
data/vendor/faiss/faiss/invlists/InvertedLists.h +151 -151
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +29 -34
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.h +17 -18
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +257 -293
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +50 -45
data/vendor/faiss/faiss/python/python_callbacks.cpp +23 -26
data/vendor/faiss/faiss/python/python_callbacks.h +9 -16
data/vendor/faiss/faiss/utils/AlignedTable.h +79 -44
data/vendor/faiss/faiss/utils/Heap.cpp +40 -48
data/vendor/faiss/faiss/utils/Heap.h +186 -209
data/vendor/faiss/faiss/utils/WorkerThread.cpp +67 -76
data/vendor/faiss/faiss/utils/WorkerThread.h +32 -33
data/vendor/faiss/faiss/utils/distances.cpp +301 -310
data/vendor/faiss/faiss/utils/distances.h +133 -118
data/vendor/faiss/faiss/utils/distances_simd.cpp +456 -516
data/vendor/faiss/faiss/utils/extra_distances-inl.h +117 -0
data/vendor/faiss/faiss/utils/extra_distances.cpp +113 -232
data/vendor/faiss/faiss/utils/extra_distances.h +30 -29
data/vendor/faiss/faiss/utils/hamming-inl.h +260 -209
data/vendor/faiss/faiss/utils/hamming.cpp +375 -469
data/vendor/faiss/faiss/utils/hamming.h +62 -85
data/vendor/faiss/faiss/utils/ordered_key_value.h +16 -18
data/vendor/faiss/faiss/utils/partitioning.cpp +393 -318
data/vendor/faiss/faiss/utils/partitioning.h +26 -21
data/vendor/faiss/faiss/utils/quantize_lut.cpp +78 -66
data/vendor/faiss/faiss/utils/quantize_lut.h +22 -20
data/vendor/faiss/faiss/utils/random.cpp +39 -63
data/vendor/faiss/faiss/utils/random.h +13 -16
data/vendor/faiss/faiss/utils/simdlib.h +4 -2
data/vendor/faiss/faiss/utils/simdlib_avx2.h +88 -85
data/vendor/faiss/faiss/utils/simdlib_emulated.h +226 -165
data/vendor/faiss/faiss/utils/simdlib_neon.h +832 -0
data/vendor/faiss/faiss/utils/utils.cpp +304 -287
data/vendor/faiss/faiss/utils/utils.h +53 -48
metadata +20 -2

data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h CHANGED Viewed

@@ -5,108 +5,111 @@
  * LICENSE file in the root directory of this source tree.
  */
 #pragma once
 #include <faiss/gpu/GpuIndexIVF.h>
 #include <memory>
-namespace faiss { struct IndexIVFFlat; }
+namespace faiss {
+struct IndexIVFFlat;
+}
-namespace faiss { namespace gpu {
+namespace faiss {
+namespace gpu {
 class IVFFlat;
 class GpuIndexFlat;
 struct GpuIndexIVFFlatConfig : public GpuIndexIVFConfig {
-  inline GpuIndexIVFFlatConfig()
-      : interleavedLayout(true) {
-  }
+    inline GpuIndexIVFFlatConfig() : interleavedLayout(true) {}
-  /// Use the alternative memory layout for the IVF lists
-  /// (currently the default)
-  bool interleavedLayout;
+    /// Use the alternative memory layout for the IVF lists
+    /// (currently the default)
+    bool interleavedLayout;
 };
 /// Wrapper around the GPU implementation that looks like
 /// faiss::IndexIVFFlat
 class GpuIndexIVFFlat : public GpuIndexIVF {
- public:
-  /// Construct from a pre-existing faiss::IndexIVFFlat instance, copying
-  /// data over to the given GPU, if the input index is trained.
-  GpuIndexIVFFlat(GpuResourcesProvider* provider,
-                  const faiss::IndexIVFFlat* index,
-                  GpuIndexIVFFlatConfig config = GpuIndexIVFFlatConfig());
-  /// Constructs a new instance with an empty flat quantizer; the user
-  /// provides the number of lists desired.
-  GpuIndexIVFFlat(GpuResourcesProvider* provider,
-                  int dims,
-                  int nlist,
-                  faiss::MetricType metric,
-                  GpuIndexIVFFlatConfig config = GpuIndexIVFFlatConfig());
-  ~GpuIndexIVFFlat() override;
-  /// Reserve GPU memory in our inverted lists for this number of vectors
-  void reserveMemory(size_t numVecs);
-  /// Initialize ourselves from the given CPU index; will overwrite
-  /// all data in ourselves
-  void copyFrom(const faiss::IndexIVFFlat* index);
-  /// Copy ourselves to the given CPU index; will overwrite all data
-  /// in the index instance
-  void copyTo(faiss::IndexIVFFlat* index) const;
-  /// After adding vectors, one can call this to reclaim device memory
-  /// to exactly the amount needed. Returns space reclaimed in bytes
-  size_t reclaimMemory();
-  /// Clears out all inverted lists, but retains the coarse centroid information
-  void reset() override;
-  /// Trains the coarse quantizer based on the given vector data
-  void train(Index::idx_t n, const float* x) override;
-  /// Returns the number of vectors present in a particular inverted list
-  int getListLength(int listId) const override;
-  /// Return the encoded vector data contained in a particular inverted list,
-  /// for debugging purposes.
-  /// If gpuFormat is true, the data is returned as it is encoded in the
-  /// GPU-side representation.
-  /// Otherwise, it is converted to the CPU format.
-  /// compliant format, while the native GPU format may differ.
-  std::vector<uint8_t>
-  getListVectorData(int listId, bool gpuFormat = false) const override;
-  /// Return the vector indices contained in a particular inverted list, for
-  /// debugging purposes.
-  std::vector<Index::idx_t> getListIndices(int listId) const override;
- protected:
-  /// Called from GpuIndex for add/add_with_ids
-  void addImpl_(int n,
-                const float* x,
-                const Index::idx_t* ids) override;
-  /// Called from GpuIndex for search
-  void searchImpl_(int n,
-                   const float* x,
-                   int k,
-                   float* distances,
-                   Index::idx_t* labels) const override;
- protected:
-  /// Our configuration options
-  const GpuIndexIVFFlatConfig ivfFlatConfig_;
-  /// Desired inverted list memory reservation
-  size_t reserveMemoryVecs_;
-  /// Instance that we own; contains the inverted list
-  std::unique_ptr<IVFFlat> index_;
+   public:
+    /// Construct from a pre-existing faiss::IndexIVFFlat instance, copying
+    /// data over to the given GPU, if the input index is trained.
+    GpuIndexIVFFlat(
+            GpuResourcesProvider* provider,
+            const faiss::IndexIVFFlat* index,
+            GpuIndexIVFFlatConfig config = GpuIndexIVFFlatConfig());
+    /// Constructs a new instance with an empty flat quantizer; the user
+    /// provides the number of lists desired.
+    GpuIndexIVFFlat(
+            GpuResourcesProvider* provider,
+            int dims,
+            int nlist,
+            faiss::MetricType metric,
+            GpuIndexIVFFlatConfig config = GpuIndexIVFFlatConfig());
+    ~GpuIndexIVFFlat() override;
+    /// Reserve GPU memory in our inverted lists for this number of vectors
+    void reserveMemory(size_t numVecs);
+    /// Initialize ourselves from the given CPU index; will overwrite
+    /// all data in ourselves
+    void copyFrom(const faiss::IndexIVFFlat* index);
+    /// Copy ourselves to the given CPU index; will overwrite all data
+    /// in the index instance
+    void copyTo(faiss::IndexIVFFlat* index) const;
+    /// After adding vectors, one can call this to reclaim device memory
+    /// to exactly the amount needed. Returns space reclaimed in bytes
+    size_t reclaimMemory();
+    /// Clears out all inverted lists, but retains the coarse centroid
+    /// information
+    void reset() override;
+    /// Trains the coarse quantizer based on the given vector data
+    void train(Index::idx_t n, const float* x) override;
+    /// Returns the number of vectors present in a particular inverted list
+    int getListLength(int listId) const override;
+    /// Return the encoded vector data contained in a particular inverted list,
+    /// for debugging purposes.
+    /// If gpuFormat is true, the data is returned as it is encoded in the
+    /// GPU-side representation.
+    /// Otherwise, it is converted to the CPU-compliant format, while the
+    /// native GPU format may differ.
+    std::vector<uint8_t> getListVectorData(int listId, bool gpuFormat = false)
+            const override;
+    /// Return the vector indices contained in a particular inverted list, for
+    /// debugging purposes.
+    std::vector<Index::idx_t> getListIndices(int listId) const override;
+   protected:
+    /// Called from GpuIndex for add/add_with_ids
+    void addImpl_(int n, const float* x, const Index::idx_t* ids) override;
+    /// Called from GpuIndex for search
+    void searchImpl_(
+            int n,
+            const float* x,
+            int k,
+            float* distances,
+            Index::idx_t* labels) const override;
+   protected:
+    /// Our configuration options
+    const GpuIndexIVFFlatConfig ivfFlatConfig_;
+    /// Desired inverted list memory reservation
+    size_t reserveMemoryVecs_;
+    /// Instance that we own; contains the inverted list
+    std::unique_ptr<IVFFlat> index_;
 };
-} } // namespace
+} // namespace gpu
+} // namespace faiss

data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h CHANGED Viewed

@@ -5,166 +5,175 @@
  * LICENSE file in the root directory of this source tree.
  */
 #pragma once
 #include <faiss/gpu/GpuIndexIVF.h>
+#include <faiss/impl/ProductQuantizer.h>
 #include <memory>
 #include <vector>
-namespace faiss { struct IndexIVFPQ; }
+namespace faiss {
+struct IndexIVFPQ;
+}
-namespace faiss { namespace gpu {
+namespace faiss {
+namespace gpu {
 class GpuIndexFlat;
 class IVFPQ;
 struct GpuIndexIVFPQConfig : public GpuIndexIVFConfig {
-  inline GpuIndexIVFPQConfig()
-      : useFloat16LookupTables(false),
-        usePrecomputedTables(false),
-        interleavedLayout(false),
-        useMMCodeDistance(false) {
-  }
-  /// Whether or not float16 residual distance tables are used in the
-  /// list scanning kernels. When subQuantizers * 2^bitsPerCode >
-  /// 16384, this is required.
-  bool useFloat16LookupTables;
-  /// Whether or not we enable the precomputed table option for
-  /// search, which can substantially increase the memory requirement.
-  bool usePrecomputedTables;
-  /// Use the alternative memory layout for the IVF lists
-  /// WARNING: this is a feature under development, do not use!
-  bool interleavedLayout;
-  /// Use GEMM-backed computation of PQ code distances for the no precomputed
-  /// table version of IVFPQ.
-  /// This is for debugging purposes, it should not substantially affect the
-  /// results one way for another.
-  ///
-  /// Note that MM code distance is enabled automatically if one uses a number
-  /// of dimensions per sub-quantizer that is not natively specialized (an odd
-  /// number like 7 or so).
-  bool useMMCodeDistance;
+    inline GpuIndexIVFPQConfig()
+            : useFloat16LookupTables(false),
+              usePrecomputedTables(false),
+              interleavedLayout(false),
+              useMMCodeDistance(false) {}
+    /// Whether or not float16 residual distance tables are used in the
+    /// list scanning kernels. When subQuantizers * 2^bitsPerCode >
+    /// 16384, this is required.
+    bool useFloat16LookupTables;
+    /// Whether or not we enable the precomputed table option for
+    /// search, which can substantially increase the memory requirement.
+    bool usePrecomputedTables;
+    /// Use the alternative memory layout for the IVF lists
+    /// WARNING: this is a feature under development, do not use!
+    bool interleavedLayout;
+    /// Use GEMM-backed computation of PQ code distances for the no precomputed
+    /// table version of IVFPQ.
+    /// This is for debugging purposes, it should not substantially affect the
+    /// results one way or another.
+    ///
+    /// Note that MM code distance is enabled automatically if one uses a number
+    /// of dimensions per sub-quantizer that is not natively specialized (an odd
+    /// number like 7 or so).
+    bool useMMCodeDistance;
 };
 /// IVFPQ index for the GPU
 class GpuIndexIVFPQ : public GpuIndexIVF {
- public:
-  /// Construct from a pre-existing faiss::IndexIVFPQ instance, copying
-  /// data over to the given GPU, if the input index is trained.
-  GpuIndexIVFPQ(GpuResourcesProvider* provider,
-                const faiss::IndexIVFPQ* index,
-                GpuIndexIVFPQConfig config = GpuIndexIVFPQConfig());
+   public:
+    /// Construct from a pre-existing faiss::IndexIVFPQ instance, copying
+    /// data over to the given GPU, if the input index is trained.
+    GpuIndexIVFPQ(
+            GpuResourcesProvider* provider,
+            const faiss::IndexIVFPQ* index,
+            GpuIndexIVFPQConfig config = GpuIndexIVFPQConfig());
+    /// Construct an empty index
+    GpuIndexIVFPQ(
+            GpuResourcesProvider* provider,
+            int dims,
+            int nlist,
+            int subQuantizers,
+            int bitsPerCode,
+            faiss::MetricType metric,
+            GpuIndexIVFPQConfig config = GpuIndexIVFPQConfig());
+    ~GpuIndexIVFPQ() override;
+    /// Reserve space on the GPU for the inverted lists for `num`
+    /// vectors, assumed equally distributed among
+    /// Initialize ourselves from the given CPU index; will overwrite
+    /// all data in ourselves
+    void copyFrom(const faiss::IndexIVFPQ* index);
+    /// Copy ourselves to the given CPU index; will overwrite all data
+    /// in the index instance
+    void copyTo(faiss::IndexIVFPQ* index) const;
+    /// Reserve GPU memory in our inverted lists for this number of vectors
+    void reserveMemory(size_t numVecs);
+    /// Enable or disable pre-computed codes
+    void setPrecomputedCodes(bool enable);
+    /// Are pre-computed codes enabled?
+    bool getPrecomputedCodes() const;
+    /// Return the number of sub-quantizers we are using
+    int getNumSubQuantizers() const;
+    /// Return the number of bits per PQ code
+    int getBitsPerCode() const;
+    /// Return the number of centroids per PQ code (2^bits per code)
+    int getCentroidsPerSubQuantizer() const;
+    /// After adding vectors, one can call this to reclaim device memory
+    /// to exactly the amount needed. Returns space reclaimed in bytes
+    size_t reclaimMemory();
+    /// Clears out all inverted lists, but retains the coarse and
+    /// product centroid information
+    void reset() override;
+    /// Trains the coarse and product quantizer based on the given vector data
+    void train(Index::idx_t n, const float* x) override;
+    /// Returns the number of vectors present in a particular inverted list
+    int getListLength(int listId) const override;
+    /// Return the encoded vector data contained in a particular inverted list,
+    /// for debugging purposes.
+    /// If gpuFormat is true, the data is returned as it is encoded in the
+    /// GPU-side representation.
+    /// Otherwise, it is converted to the CPU-compliant format, while the
+    /// native GPU format may differ.
+    std::vector<uint8_t> getListVectorData(int listId, bool gpuFormat = false)
+            const override;
+    /// Return the vector indices contained in a particular inverted list, for
+    /// debugging purposes.
+    std::vector<Index::idx_t> getListIndices(int listId) const override;
+   public:
+    /// Like the CPU version, we expose a publicly visible ProductQuantizer
+    /// for manipulation
+    ProductQuantizer pq;
+   protected:
+    /// Called from GpuIndex for add/add_with_ids
+    void addImpl_(int n, const float* x, const Index::idx_t* ids) override;
+    /// Called from GpuIndex for search
+    void searchImpl_(
+            int n,
+            const float* x,
+            int k,
+            float* distances,
+            Index::idx_t* labels) const override;
+    /// Throws errors if configuration settings are improper
+    void verifySettings_() const;
+    /// Trains the PQ quantizer based on the given vector data
+    void trainResidualQuantizer_(Index::idx_t n, const float* x);
+   protected:
+    /// Our configuration options that we were initialized with
+    const GpuIndexIVFPQConfig ivfpqConfig_;
+    /// Runtime override: whether or not we use precomputed tables
+    bool usePrecomputedTables_;
-  /// Construct an empty index
-  GpuIndexIVFPQ(GpuResourcesProvider* provider,
-                int dims,
-                int nlist,
-                int subQuantizers,
-                int bitsPerCode,
-                faiss::MetricType metric,
-                GpuIndexIVFPQConfig config = GpuIndexIVFPQConfig());
-  ~GpuIndexIVFPQ() override;
-  /// Reserve space on the GPU for the inverted lists for `num`
-  /// vectors, assumed equally distributed among
-  /// Initialize ourselves from the given CPU index; will overwrite
-  /// all data in ourselves
-  void copyFrom(const faiss::IndexIVFPQ* index);
-  /// Copy ourselves to the given CPU index; will overwrite all data
-  /// in the index instance
-  void copyTo(faiss::IndexIVFPQ* index) const;
-  /// Reserve GPU memory in our inverted lists for this number of vectors
-  void reserveMemory(size_t numVecs);
-  /// Enable or disable pre-computed codes
-  void setPrecomputedCodes(bool enable);
-  /// Are pre-computed codes enabled?
-  bool getPrecomputedCodes() const;
-  /// Return the number of sub-quantizers we are using
-  int getNumSubQuantizers() const;
-  /// Return the number of bits per PQ code
-  int getBitsPerCode() const;
-  /// Return the number of centroids per PQ code (2^bits per code)
-  int getCentroidsPerSubQuantizer() const;
-  /// After adding vectors, one can call this to reclaim device memory
-  /// to exactly the amount needed. Returns space reclaimed in bytes
-  size_t reclaimMemory();
-  /// Clears out all inverted lists, but retains the coarse and
-  /// product centroid information
-  void reset() override;
-  /// Trains the coarse and product quantizer based on the given vector data
-  void train(Index::idx_t n, const float* x) override;
-  /// Returns the number of vectors present in a particular inverted list
-  int getListLength(int listId) const override;
-  /// Return the encoded vector data contained in a particular inverted list,
-  /// for debugging purposes.
-  /// If gpuFormat is true, the data is returned as it is encoded in the
-  /// GPU-side representation.
-  /// Otherwise, it is converted to the CPU format.
-  /// compliant format, while the native GPU format may differ.
-  std::vector<uint8_t>
-  getListVectorData(int listId, bool gpuFormat = false) const override;
-  /// Return the vector indices contained in a particular inverted list, for
-  /// debugging purposes.
-  std::vector<Index::idx_t> getListIndices(int listId) const override;
- protected:
-  /// Called from GpuIndex for add/add_with_ids
-  void addImpl_(int n,
-                const float* x,
-                const Index::idx_t* ids) override;
-  /// Called from GpuIndex for search
-  void searchImpl_(int n,
-                   const float* x,
-                   int k,
-                   float* distances,
-                   Index::idx_t* labels) const override;
-  /// Throws errors if configuration settings are improper
-  void verifySettings_() const;
-  /// Trains the PQ quantizer based on the given vector data
-  void trainResidualQuantizer_(Index::idx_t n, const float* x);
- protected:
-  /// Our configuration options that we were initialized with
-  const GpuIndexIVFPQConfig ivfpqConfig_;
-  /// Runtime override: whether or not we use precomputed tables
-  bool usePrecomputedTables_;
-  /// Number of sub-quantizers per encoded vector
-  int subQuantizers_;
+    /// Number of sub-quantizers per encoded vector
+    int subQuantizers_;
-  /// Bits per sub-quantizer code
-  int bitsPerCode_;
+    /// Bits per sub-quantizer code
+    int bitsPerCode_;
-  /// Desired inverted list memory reservation
-  size_t reserveMemoryVecs_;
+    /// Desired inverted list memory reservation
+    size_t reserveMemoryVecs_;
-  /// The product quantizer instance that we own; contains the
-  /// inverted lists
-  std::unique_ptr<IVFPQ> index_;
+    /// The product quantizer instance that we own; contains the
+    /// inverted lists
+    std::unique_ptr<IVFPQ> index_;
 };
-} } // namespace
+} // namespace gpu
+} // namespace faiss