RubyGems - faiss - Versions diffs - 0.2.0 → 0.2.4 - Mend

faiss 0.2.0 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (215) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +16 -0
data/LICENSE.txt +1 -1
data/README.md +7 -7
data/ext/faiss/extconf.rb +6 -3
data/ext/faiss/numo.hpp +4 -4
data/ext/faiss/utils.cpp +1 -1
data/ext/faiss/utils.h +1 -1
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +292 -291
data/vendor/faiss/faiss/AutoTune.h +55 -56
data/vendor/faiss/faiss/Clustering.cpp +365 -194
data/vendor/faiss/faiss/Clustering.h +102 -35
data/vendor/faiss/faiss/IVFlib.cpp +171 -195
data/vendor/faiss/faiss/IVFlib.h +48 -51
data/vendor/faiss/faiss/Index.cpp +85 -103
data/vendor/faiss/faiss/Index.h +54 -48
data/vendor/faiss/faiss/Index2Layer.cpp +126 -224
data/vendor/faiss/faiss/Index2Layer.h +22 -36
data/vendor/faiss/faiss/IndexAdditiveQuantizer.cpp +407 -0
data/vendor/faiss/faiss/IndexAdditiveQuantizer.h +195 -0
data/vendor/faiss/faiss/IndexBinary.cpp +45 -37
data/vendor/faiss/faiss/IndexBinary.h +140 -132
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +73 -53
data/vendor/faiss/faiss/IndexBinaryFlat.h +29 -24
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +46 -43
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +16 -15
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +215 -232
data/vendor/faiss/faiss/IndexBinaryHNSW.h +25 -24
data/vendor/faiss/faiss/IndexBinaryHash.cpp +182 -177
data/vendor/faiss/faiss/IndexBinaryHash.h +41 -34
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +489 -461
data/vendor/faiss/faiss/IndexBinaryIVF.h +97 -68
data/vendor/faiss/faiss/IndexFlat.cpp +115 -176
data/vendor/faiss/faiss/IndexFlat.h +42 -59
data/vendor/faiss/faiss/IndexFlatCodes.cpp +67 -0
data/vendor/faiss/faiss/IndexFlatCodes.h +47 -0
data/vendor/faiss/faiss/IndexHNSW.cpp +372 -348
data/vendor/faiss/faiss/IndexHNSW.h +57 -41
data/vendor/faiss/faiss/IndexIVF.cpp +545 -453
data/vendor/faiss/faiss/IndexIVF.h +169 -118
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +316 -0
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.h +121 -0
data/vendor/faiss/faiss/IndexIVFFlat.cpp +247 -252
data/vendor/faiss/faiss/IndexIVFFlat.h +48 -51
data/vendor/faiss/faiss/IndexIVFPQ.cpp +459 -517
data/vendor/faiss/faiss/IndexIVFPQ.h +75 -67
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +406 -372
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +82 -57
data/vendor/faiss/faiss/IndexIVFPQR.cpp +104 -102
data/vendor/faiss/faiss/IndexIVFPQR.h +33 -28
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +163 -150
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +38 -25
data/vendor/faiss/faiss/IndexLSH.cpp +66 -113
data/vendor/faiss/faiss/IndexLSH.h +20 -38
data/vendor/faiss/faiss/IndexLattice.cpp +42 -56
data/vendor/faiss/faiss/IndexLattice.h +11 -16
data/vendor/faiss/faiss/IndexNNDescent.cpp +229 -0
data/vendor/faiss/faiss/IndexNNDescent.h +72 -0
data/vendor/faiss/faiss/IndexNSG.cpp +301 -0
data/vendor/faiss/faiss/IndexNSG.h +85 -0
data/vendor/faiss/faiss/IndexPQ.cpp +387 -495
data/vendor/faiss/faiss/IndexPQ.h +64 -82
data/vendor/faiss/faiss/IndexPQFastScan.cpp +143 -170
data/vendor/faiss/faiss/IndexPQFastScan.h +46 -32
data/vendor/faiss/faiss/IndexPreTransform.cpp +120 -150
data/vendor/faiss/faiss/IndexPreTransform.h +33 -36
data/vendor/faiss/faiss/IndexRefine.cpp +139 -127
data/vendor/faiss/faiss/IndexRefine.h +32 -23
data/vendor/faiss/faiss/IndexReplicas.cpp +147 -153
data/vendor/faiss/faiss/IndexReplicas.h +62 -56
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +111 -172
data/vendor/faiss/faiss/IndexScalarQuantizer.h +41 -59
data/vendor/faiss/faiss/IndexShards.cpp +256 -240
data/vendor/faiss/faiss/IndexShards.h +85 -73
data/vendor/faiss/faiss/MatrixStats.cpp +112 -97
data/vendor/faiss/faiss/MatrixStats.h +7 -10
data/vendor/faiss/faiss/MetaIndexes.cpp +135 -157
data/vendor/faiss/faiss/MetaIndexes.h +40 -34
data/vendor/faiss/faiss/MetricType.h +7 -7
data/vendor/faiss/faiss/VectorTransform.cpp +654 -475
data/vendor/faiss/faiss/VectorTransform.h +64 -89
data/vendor/faiss/faiss/clone_index.cpp +78 -73
data/vendor/faiss/faiss/clone_index.h +4 -9
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +33 -38
data/vendor/faiss/faiss/gpu/GpuAutoTune.h +11 -9
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +198 -171
data/vendor/faiss/faiss/gpu/GpuCloner.h +53 -35
data/vendor/faiss/faiss/gpu/GpuClonerOptions.cpp +12 -14
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +27 -25
data/vendor/faiss/faiss/gpu/GpuDistance.h +116 -112
data/vendor/faiss/faiss/gpu/GpuFaissAssert.h +1 -2
data/vendor/faiss/faiss/gpu/GpuIcmEncoder.h +60 -0
data/vendor/faiss/faiss/gpu/GpuIndex.h +134 -137
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +76 -73
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +173 -162
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +67 -64
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +89 -86
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +150 -141
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +101 -103
data/vendor/faiss/faiss/gpu/GpuIndicesOptions.h +17 -16
data/vendor/faiss/faiss/gpu/GpuResources.cpp +116 -128
data/vendor/faiss/faiss/gpu/GpuResources.h +182 -186
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +433 -422
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +131 -130
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.cpp +468 -456
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.h +25 -19
data/vendor/faiss/faiss/gpu/impl/RemapIndices.cpp +22 -20
data/vendor/faiss/faiss/gpu/impl/RemapIndices.h +9 -8
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +39 -44
data/vendor/faiss/faiss/gpu/perf/IndexWrapper.h +16 -14
data/vendor/faiss/faiss/gpu/perf/PerfClustering.cpp +77 -71
data/vendor/faiss/faiss/gpu/perf/PerfIVFPQAdd.cpp +109 -88
data/vendor/faiss/faiss/gpu/perf/WriteIndex.cpp +75 -64
data/vendor/faiss/faiss/gpu/test/TestCodePacking.cpp +230 -215
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +80 -86
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +284 -277
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +416 -416
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFPQ.cpp +611 -517
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFScalarQuantizer.cpp +166 -164
data/vendor/faiss/faiss/gpu/test/TestGpuMemoryException.cpp +61 -53
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +274 -238
data/vendor/faiss/faiss/gpu/test/TestUtils.h +73 -57
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +47 -50
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +79 -72
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.cpp +140 -146
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.h +69 -71
data/vendor/faiss/faiss/gpu/utils/StaticUtils.h +21 -16
data/vendor/faiss/faiss/gpu/utils/Timer.cpp +25 -29
data/vendor/faiss/faiss/gpu/utils/Timer.h +30 -29
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +503 -0
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +175 -0
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +90 -120
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +81 -65
data/vendor/faiss/faiss/impl/FaissAssert.h +73 -58
data/vendor/faiss/faiss/impl/FaissException.cpp +56 -48
data/vendor/faiss/faiss/impl/FaissException.h +41 -29
data/vendor/faiss/faiss/impl/HNSW.cpp +606 -617
data/vendor/faiss/faiss/impl/HNSW.h +179 -200
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +855 -0
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +244 -0
data/vendor/faiss/faiss/impl/NNDescent.cpp +487 -0
data/vendor/faiss/faiss/impl/NNDescent.h +154 -0
data/vendor/faiss/faiss/impl/NSG.cpp +679 -0
data/vendor/faiss/faiss/impl/NSG.h +199 -0
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +484 -454
data/vendor/faiss/faiss/impl/PolysemousTraining.h +52 -55
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +26 -47
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +469 -459
data/vendor/faiss/faiss/impl/ProductQuantizer.h +76 -87
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +758 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +188 -0
data/vendor/faiss/faiss/impl/ResultHandler.h +96 -132
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +647 -707
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +48 -46
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +129 -131
data/vendor/faiss/faiss/impl/ThreadedIndex.h +61 -55
data/vendor/faiss/faiss/impl/index_read.cpp +631 -480
data/vendor/faiss/faiss/impl/index_write.cpp +547 -407
data/vendor/faiss/faiss/impl/io.cpp +76 -95
data/vendor/faiss/faiss/impl/io.h +31 -41
data/vendor/faiss/faiss/impl/io_macros.h +60 -29
data/vendor/faiss/faiss/impl/kmeans1d.cpp +301 -0
data/vendor/faiss/faiss/impl/kmeans1d.h +48 -0
data/vendor/faiss/faiss/impl/lattice_Zn.cpp +137 -186
data/vendor/faiss/faiss/impl/lattice_Zn.h +40 -51
data/vendor/faiss/faiss/impl/platform_macros.h +29 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +77 -124
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +39 -48
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +41 -52
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +80 -117
data/vendor/faiss/faiss/impl/simd_result_handlers.h +109 -137
data/vendor/faiss/faiss/index_factory.cpp +619 -397
data/vendor/faiss/faiss/index_factory.h +8 -6
data/vendor/faiss/faiss/index_io.h +23 -26
data/vendor/faiss/faiss/invlists/BlockInvertedLists.cpp +67 -75
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +22 -24
data/vendor/faiss/faiss/invlists/DirectMap.cpp +96 -112
data/vendor/faiss/faiss/invlists/DirectMap.h +29 -33
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +307 -364
data/vendor/faiss/faiss/invlists/InvertedLists.h +151 -151
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +29 -34
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.h +17 -18
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +257 -293
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +50 -45
data/vendor/faiss/faiss/python/python_callbacks.cpp +23 -26
data/vendor/faiss/faiss/python/python_callbacks.h +9 -16
data/vendor/faiss/faiss/utils/AlignedTable.h +79 -44
data/vendor/faiss/faiss/utils/Heap.cpp +40 -48
data/vendor/faiss/faiss/utils/Heap.h +186 -209
data/vendor/faiss/faiss/utils/WorkerThread.cpp +67 -76
data/vendor/faiss/faiss/utils/WorkerThread.h +32 -33
data/vendor/faiss/faiss/utils/distances.cpp +305 -312
data/vendor/faiss/faiss/utils/distances.h +170 -122
data/vendor/faiss/faiss/utils/distances_simd.cpp +498 -508
data/vendor/faiss/faiss/utils/extra_distances-inl.h +117 -0
data/vendor/faiss/faiss/utils/extra_distances.cpp +113 -232
data/vendor/faiss/faiss/utils/extra_distances.h +30 -29
data/vendor/faiss/faiss/utils/hamming-inl.h +260 -209
data/vendor/faiss/faiss/utils/hamming.cpp +375 -469
data/vendor/faiss/faiss/utils/hamming.h +62 -85
data/vendor/faiss/faiss/utils/ordered_key_value.h +16 -18
data/vendor/faiss/faiss/utils/partitioning.cpp +393 -318
data/vendor/faiss/faiss/utils/partitioning.h +26 -21
data/vendor/faiss/faiss/utils/quantize_lut.cpp +78 -66
data/vendor/faiss/faiss/utils/quantize_lut.h +22 -20
data/vendor/faiss/faiss/utils/random.cpp +39 -63
data/vendor/faiss/faiss/utils/random.h +13 -16
data/vendor/faiss/faiss/utils/simdlib.h +4 -2
data/vendor/faiss/faiss/utils/simdlib_avx2.h +88 -85
data/vendor/faiss/faiss/utils/simdlib_emulated.h +226 -165
data/vendor/faiss/faiss/utils/simdlib_neon.h +832 -0
data/vendor/faiss/faiss/utils/utils.cpp +304 -287
data/vendor/faiss/faiss/utils/utils.h +54 -49
metadata +29 -4

data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp CHANGED Viewed

@@ -5,12 +5,11 @@
  * LICENSE file in the root directory of this source tree.
  */
 #include <faiss/IndexFlat.h>
 #include <faiss/gpu/GpuIndexFlat.h>
 #include <faiss/gpu/StandardGpuResources.h>
-#include <faiss/gpu/utils/DeviceUtils.h>
 #include <faiss/gpu/test/TestUtils.h>
+#include <faiss/gpu/utils/DeviceUtils.h>
 #include <gtest/gtest.h>
 #include <sstream>
 #include <vector>
@@ -20,93 +19,109 @@ constexpr float kF16MaxRelErr = 0.07f;
 constexpr float kF32MaxRelErr = 6e-3f;
 struct TestFlatOptions {
-  TestFlatOptions()
-      : metric(faiss::MetricType::METRIC_L2),
-        metricArg(0),
-        useFloat16(false),
-        useTransposed(false),
-        numVecsOverride(-1),
-        numQueriesOverride(-1),
-        kOverride(-1),
-        dimOverride(-1) {
-  }
-  faiss::MetricType metric;
-  float metricArg;
-  bool useFloat16;
-  bool useTransposed;
-  int numVecsOverride;
-  int numQueriesOverride;
-  int kOverride;
-  int dimOverride;
+    TestFlatOptions()
+            : metric(faiss::MetricType::METRIC_L2),
+              metricArg(0),
+              useFloat16(false),
+              useTransposed(false),
+              numVecsOverride(-1),
+              numQueriesOverride(-1),
+              kOverride(-1),
+              dimOverride(-1) {}
+    faiss::MetricType metric;
+    float metricArg;
+    bool useFloat16;
+    bool useTransposed;
+    int numVecsOverride;
+    int numQueriesOverride;
+    int kOverride;
+    int dimOverride;
 };
 void testFlat(const TestFlatOptions& opt) {
-  int numVecs = opt.numVecsOverride > 0 ?
-    opt.numVecsOverride : faiss::gpu::randVal(1000, 5000);
-  int dim = opt.dimOverride > 0 ?
-    opt.dimOverride : faiss::gpu::randVal(50, 800);
-  int numQuery = opt.numQueriesOverride > 0 ?
-    opt.numQueriesOverride : faiss::gpu::randVal(1, 512);
-  // Due to loss of precision in a float16 accumulator, for large k,
-  // the number of differences is pretty huge. Restrict ourselves to a
-  // fairly small `k` for float16
-  int k = opt.useFloat16 ?
-    std::min(faiss::gpu::randVal(1, 50), numVecs) :
-    std::min(faiss::gpu::randVal(1, faiss::gpu::getMaxKSelection()), numVecs);
-  if (opt.kOverride > 0) {
-    k = opt.kOverride;
-  }
-  faiss::IndexFlat cpuIndex(dim, opt.metric);
-  cpuIndex.metric_arg = opt.metricArg;
-  // Construct on a random device to test multi-device, if we have
-  // multiple devices
-  int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
-  faiss::gpu::StandardGpuResources res;
-  res.noTempMemory();
-  faiss::gpu::GpuIndexFlatConfig config;
-  config.device = device;
-  config.useFloat16 = opt.useFloat16;
-  config.storeTransposed = opt.useTransposed;
-  faiss::gpu::GpuIndexFlat gpuIndex(&res, dim, opt.metric, config);
-  gpuIndex.metric_arg = opt.metricArg;
-  std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
-  cpuIndex.add(numVecs, vecs.data());
-  gpuIndex.add(numVecs, vecs.data());
-  std::stringstream str;
-  str << "metric " << opt.metric
-      << " marg " << opt.metricArg
-      << " numVecs " << numVecs
-      << " dim " << dim
-      << " useFloat16 " << opt.useFloat16
-      << " transposed " << opt.useTransposed
-      << " numQuery " << numQuery
-      << " k " << k;
-  // To some extent, we depend upon the relative error for the test
-  // for float16
-  faiss::gpu::compareIndices(cpuIndex, gpuIndex, numQuery, dim, k, str.str(),
-                             opt.useFloat16 ? kF16MaxRelErr : kF32MaxRelErr,
-                             // FIXME: the fp16 bounds are
-                             // useless when math (the accumulator) is
-                             // in fp16. Figure out another way to test
-                             opt.useFloat16 ? 0.99f : 0.1f,
-                             opt.useFloat16 ? 0.65f : 0.015f);
+    int numVecs = opt.numVecsOverride > 0 ? opt.numVecsOverride
+                                          : faiss::gpu::randVal(1000, 5000);
+    int dim = opt.dimOverride > 0 ? opt.dimOverride
+                                  : faiss::gpu::randVal(50, 800);
+    int numQuery = opt.numQueriesOverride > 0 ? opt.numQueriesOverride
+                                              : faiss::gpu::randVal(1, 512);
+    // Due to loss of precision in a float16 accumulator, for large k,
+    // the number of differences is pretty huge. Restrict ourselves to a
+    // fairly small `k` for float16
+    int k = opt.useFloat16
+            ? std::min(faiss::gpu::randVal(1, 50), numVecs)
+            : std::min(
+                      faiss::gpu::randVal(1, faiss::gpu::getMaxKSelection()),
+                      numVecs);
+    if (opt.kOverride > 0) {
+        k = opt.kOverride;
+    }
+    faiss::IndexFlat cpuIndex(dim, opt.metric);
+    cpuIndex.metric_arg = opt.metricArg;
+    // Construct on a random device to test multi-device, if we have
+    // multiple devices
+    int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
+    faiss::gpu::StandardGpuResources res;
+    res.noTempMemory();
+    faiss::gpu::GpuIndexFlatConfig config;
+    config.device = device;
+    config.useFloat16 = opt.useFloat16;
+    config.storeTransposed = opt.useTransposed;
+    faiss::gpu::GpuIndexFlat gpuIndex(&res, dim, opt.metric, config);
+    gpuIndex.metric_arg = opt.metricArg;
+    std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
+    cpuIndex.add(numVecs, vecs.data());
+    gpuIndex.add(numVecs, vecs.data());
+    std::stringstream str;
+    str << "metric " << opt.metric << " marg " << opt.metricArg << " numVecs "
+        << numVecs << " dim " << dim << " useFloat16 " << opt.useFloat16
+        << " transposed " << opt.useTransposed << " numQuery " << numQuery
+        << " k " << k;
+    // To some extent, we depend upon the relative error for the test
+    // for float16
+    faiss::gpu::compareIndices(
+            cpuIndex,
+            gpuIndex,
+            numQuery,
+            dim,
+            k,
+            str.str(),
+            opt.useFloat16 ? kF16MaxRelErr : kF32MaxRelErr,
+            // FIXME: the fp16 bounds are
+            // useless when math (the accumulator) is
+            // in fp16. Figure out another way to test
+            opt.useFloat16 ? 0.99f : 0.1f,
+            opt.useFloat16 ? 0.65f : 0.015f);
 }
 TEST(TestGpuIndexFlat, IP_Float32) {
-  for (int tries = 0; tries < 3; ++tries) {
+    for (int tries = 0; tries < 3; ++tries) {
+        TestFlatOptions opt;
+        opt.metric = faiss::MetricType::METRIC_INNER_PRODUCT;
+        opt.useFloat16 = false;
+        opt.useTransposed = false;
+        testFlat(opt);
+        opt.useTransposed = true;
+        testFlat(opt);
+    }
+}
+TEST(TestGpuIndexFlat, L1_Float32) {
     TestFlatOptions opt;
-    opt.metric = faiss::MetricType::METRIC_INNER_PRODUCT;
+    opt.metric = faiss::MetricType::METRIC_L1;
     opt.useFloat16 = false;
     opt.useTransposed = false;
@@ -114,280 +129,272 @@ TEST(TestGpuIndexFlat, IP_Float32) {
     opt.useTransposed = true;
     testFlat(opt);
-  }
-}
-TEST(TestGpuIndexFlat, L1_Float32) {
-  TestFlatOptions opt;
-  opt.metric = faiss::MetricType::METRIC_L1;
-  opt.useFloat16 = false;
-  opt.useTransposed = false;
-  testFlat(opt);
-  opt.useTransposed = true;
-  testFlat(opt);
 }
 TEST(TestGpuIndexFlat, Lp_Float32) {
-  TestFlatOptions opt;
-  opt.metric = faiss::MetricType::METRIC_Lp;
-  opt.metricArg = 5;
-  opt.useFloat16 = false;
-  opt.useTransposed = false;
+    TestFlatOptions opt;
+    opt.metric = faiss::MetricType::METRIC_Lp;
+    opt.metricArg = 5;
+    opt.useFloat16 = false;
+    opt.useTransposed = false;
-  testFlat(opt);
+    testFlat(opt);
-  // Don't bother testing the transposed version, the L1 test should be good
-  // enough for that
+    // Don't bother testing the transposed version, the L1 test should be good
+    // enough for that
 }
 TEST(TestGpuIndexFlat, L2_Float32) {
-  for (int tries = 0; tries < 3; ++tries) {
-    TestFlatOptions opt;
-    opt.metric = faiss::MetricType::METRIC_L2;
+    for (int tries = 0; tries < 3; ++tries) {
+        TestFlatOptions opt;
+        opt.metric = faiss::MetricType::METRIC_L2;
-    opt.useFloat16 = false;
-    opt.useTransposed = false;
+        opt.useFloat16 = false;
+        opt.useTransposed = false;
-    testFlat(opt);
+        testFlat(opt);
-    opt.useTransposed = true;
-    testFlat(opt);
-  }
+        opt.useTransposed = true;
+        testFlat(opt);
+    }
 }
 // test specialized k == 1 codepath
 TEST(TestGpuIndexFlat, L2_Float32_K1) {
-  for (int tries = 0; tries < 3; ++tries) {
-    TestFlatOptions opt;
-    opt.metric = faiss::MetricType::METRIC_L2;
-    opt.useFloat16 = false;
-    opt.useTransposed = false;
-    opt.kOverride = 1;
-    testFlat(opt);
-  }
+    for (int tries = 0; tries < 3; ++tries) {
+        TestFlatOptions opt;
+        opt.metric = faiss::MetricType::METRIC_L2;
+        opt.useFloat16 = false;
+        opt.useTransposed = false;
+        opt.kOverride = 1;
+        testFlat(opt);
+    }
 }
 TEST(TestGpuIndexFlat, IP_Float16) {
-  for (int tries = 0; tries < 3; ++tries) {
-    TestFlatOptions opt;
-    opt.metric = faiss::MetricType::METRIC_INNER_PRODUCT;
-    opt.useFloat16 = true;
-    opt.useTransposed = false;
+    for (int tries = 0; tries < 3; ++tries) {
+        TestFlatOptions opt;
+        opt.metric = faiss::MetricType::METRIC_INNER_PRODUCT;
+        opt.useFloat16 = true;
+        opt.useTransposed = false;
-    testFlat(opt);
+        testFlat(opt);
-    opt.useTransposed = true;
-    testFlat(opt);
-  }
+        opt.useTransposed = true;
+        testFlat(opt);
+    }
 }
 TEST(TestGpuIndexFlat, L2_Float16) {
-  for (int tries = 0; tries < 3; ++tries) {
-    TestFlatOptions opt;
-    opt.metric = faiss::MetricType::METRIC_L2;
-    opt.useFloat16 = true;
-    opt.useTransposed = false;
+    for (int tries = 0; tries < 3; ++tries) {
+        TestFlatOptions opt;
+        opt.metric = faiss::MetricType::METRIC_L2;
+        opt.useFloat16 = true;
+        opt.useTransposed = false;
-    testFlat(opt);
+        testFlat(opt);
-    opt.useTransposed = true;
-    testFlat(opt);
-  }
+        opt.useTransposed = true;
+        testFlat(opt);
+    }
 }
 // test specialized k == 1 codepath
 TEST(TestGpuIndexFlat, L2_Float16_K1) {
-  for (int tries = 0; tries < 3; ++tries) {
-    TestFlatOptions opt;
-    opt.metric = faiss::MetricType::METRIC_L2;
-    opt.useFloat16 = true;
-    opt.useTransposed = false;
-    opt.kOverride = 1;
-    testFlat(opt);
-  }
+    for (int tries = 0; tries < 3; ++tries) {
+        TestFlatOptions opt;
+        opt.metric = faiss::MetricType::METRIC_L2;
+        opt.useFloat16 = true;
+        opt.useTransposed = false;
+        opt.kOverride = 1;
+        testFlat(opt);
+    }
 }
 // test tiling along a huge vector set
 TEST(TestGpuIndexFlat, L2_Tiling) {
-  for (int tries = 0; tries < 2; ++tries) {
-    TestFlatOptions opt;
-    opt.metric = faiss::MetricType::METRIC_L2;
-    opt.useFloat16 = false;
-    opt.useTransposed = false;
-    opt.numVecsOverride = 1000000;
-    // keep the rest of the problem reasonably small
-    opt.numQueriesOverride = 4;
-    opt.dimOverride = 64;
-    opt.kOverride = 64;
-    testFlat(opt);
-  }
+    for (int tries = 0; tries < 2; ++tries) {
+        TestFlatOptions opt;
+        opt.metric = faiss::MetricType::METRIC_L2;
+        opt.useFloat16 = false;
+        opt.useTransposed = false;
+        opt.numVecsOverride = 1000000;
+        // keep the rest of the problem reasonably small
+        opt.numQueriesOverride = 4;
+        opt.dimOverride = 64;
+        opt.kOverride = 64;
+        testFlat(opt);
+    }
 }
 TEST(TestGpuIndexFlat, QueryEmpty) {
-  faiss::gpu::StandardGpuResources res;
-  res.noTempMemory();
+    faiss::gpu::StandardGpuResources res;
+    res.noTempMemory();
-  faiss::gpu::GpuIndexFlatConfig config;
-  config.device = 0;
-  config.useFloat16 = false;
-  config.storeTransposed = false;
+    faiss::gpu::GpuIndexFlatConfig config;
+    config.device = 0;
+    config.useFloat16 = false;
+    config.storeTransposed = false;
-  int dim = 128;
-  faiss::gpu::GpuIndexFlatL2 gpuIndex(&res, dim, config);
+    int dim = 128;
+    faiss::gpu::GpuIndexFlatL2 gpuIndex(&res, dim, config);
-  // Querying an empty index should not blow up, and just return
-  // (FLT_MAX, -1)
-  int numQuery = 10;
-  int k = 50;
-  std::vector<float> queries(numQuery * dim, 1.0f);
+    // Querying an empty index should not blow up, and just return
+    // (FLT_MAX, -1)
+    int numQuery = 10;
+    int k = 50;
+    std::vector<float> queries(numQuery * dim, 1.0f);
-  std::vector<float> dist(numQuery * k, 0);
-  std::vector<faiss::Index::idx_t> ind(numQuery * k);
+    std::vector<float> dist(numQuery * k, 0);
+    std::vector<faiss::Index::idx_t> ind(numQuery * k);
-  gpuIndex.search(numQuery, queries.data(), k, dist.data(), ind.data());
+    gpuIndex.search(numQuery, queries.data(), k, dist.data(), ind.data());
-  for (auto d : dist) {
-    EXPECT_EQ(d, std::numeric_limits<float>::max());
-  }
+    for (auto d : dist) {
+        EXPECT_EQ(d, std::numeric_limits<float>::max());
+    }
-  for (auto i : ind) {
-    EXPECT_EQ(i, -1);
-  }
+    for (auto i : ind) {
+        EXPECT_EQ(i, -1);
+    }
 }
 TEST(TestGpuIndexFlat, CopyFrom) {
-  int numVecs = faiss::gpu::randVal(100, 200);
-  int dim = faiss::gpu::randVal(1, 1000);
+    int numVecs = faiss::gpu::randVal(100, 200);
+    int dim = faiss::gpu::randVal(1, 1000);
-  faiss::IndexFlatL2 cpuIndex(dim);
+    faiss::IndexFlatL2 cpuIndex(dim);
-  std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
-  cpuIndex.add(numVecs, vecs.data());
+    std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
+    cpuIndex.add(numVecs, vecs.data());
-  faiss::gpu::StandardGpuResources res;
-  res.noTempMemory();
+    faiss::gpu::StandardGpuResources res;
+    res.noTempMemory();
-  // Fill with garbage values
-  int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
+    // Fill with garbage values
+    int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
-  faiss::gpu::GpuIndexFlatConfig config;
-  config.device = device;
-  config.useFloat16 = false;
-  config.storeTransposed = false;
+    faiss::gpu::GpuIndexFlatConfig config;
+    config.device = device;
+    config.useFloat16 = false;
+    config.storeTransposed = false;
-  faiss::gpu::GpuIndexFlatL2 gpuIndex(&res, 2000, config);
-  gpuIndex.copyFrom(&cpuIndex);
+    faiss::gpu::GpuIndexFlatL2 gpuIndex(&res, 2000, config);
+    gpuIndex.copyFrom(&cpuIndex);
-  EXPECT_EQ(cpuIndex.ntotal, gpuIndex.ntotal);
-  EXPECT_EQ(gpuIndex.ntotal, numVecs);
+    EXPECT_EQ(cpuIndex.ntotal, gpuIndex.ntotal);
+    EXPECT_EQ(gpuIndex.ntotal, numVecs);
-  EXPECT_EQ(cpuIndex.d, gpuIndex.d);
-  EXPECT_EQ(cpuIndex.d, dim);
+    EXPECT_EQ(cpuIndex.d, gpuIndex.d);
+    EXPECT_EQ(cpuIndex.d, dim);
-  int idx = faiss::gpu::randVal(0, numVecs - 1);
+    int idx = faiss::gpu::randVal(0, numVecs - 1);
-  std::vector<float> gpuVals(dim);
-  gpuIndex.reconstruct(idx, gpuVals.data());
+    std::vector<float> gpuVals(dim);
+    gpuIndex.reconstruct(idx, gpuVals.data());
-  std::vector<float> cpuVals(dim);
-  cpuIndex.reconstruct(idx, cpuVals.data());
+    std::vector<float> cpuVals(dim);
+    cpuIndex.reconstruct(idx, cpuVals.data());
-  EXPECT_EQ(gpuVals, cpuVals);
+    EXPECT_EQ(gpuVals, cpuVals);
 }
 TEST(TestGpuIndexFlat, CopyTo) {
-  faiss::gpu::StandardGpuResources res;
-  res.noTempMemory();
+    faiss::gpu::StandardGpuResources res;
+    res.noTempMemory();
-  int numVecs = faiss::gpu::randVal(100, 200);
-  int dim = faiss::gpu::randVal(1, 1000);
+    int numVecs = faiss::gpu::randVal(100, 200);
+    int dim = faiss::gpu::randVal(1, 1000);
-  int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
+    int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
-  faiss::gpu::GpuIndexFlatConfig config;
-  config.device = device;
-  config.useFloat16 = false;
-  config.storeTransposed = false;
+    faiss::gpu::GpuIndexFlatConfig config;
+    config.device = device;
+    config.useFloat16 = false;
+    config.storeTransposed = false;
-  faiss::gpu::GpuIndexFlatL2 gpuIndex(&res, dim, config);
+    faiss::gpu::GpuIndexFlatL2 gpuIndex(&res, dim, config);
-  std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
-  gpuIndex.add(numVecs, vecs.data());
+    std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
+    gpuIndex.add(numVecs, vecs.data());
-  // Fill with garbage values
-  faiss::IndexFlatL2 cpuIndex(2000);
-  gpuIndex.copyTo(&cpuIndex);
+    // Fill with garbage values
+    faiss::IndexFlatL2 cpuIndex(2000);
+    gpuIndex.copyTo(&cpuIndex);
-  EXPECT_EQ(cpuIndex.ntotal, gpuIndex.ntotal);
-  EXPECT_EQ(gpuIndex.ntotal, numVecs);
+    EXPECT_EQ(cpuIndex.ntotal, gpuIndex.ntotal);
+    EXPECT_EQ(gpuIndex.ntotal, numVecs);
-  EXPECT_EQ(cpuIndex.d, gpuIndex.d);
-  EXPECT_EQ(cpuIndex.d, dim);
+    EXPECT_EQ(cpuIndex.d, gpuIndex.d);
+    EXPECT_EQ(cpuIndex.d, dim);
-  int idx = faiss::gpu::randVal(0, numVecs - 1);
+    int idx = faiss::gpu::randVal(0, numVecs - 1);
-  std::vector<float> gpuVals(dim);
-  gpuIndex.reconstruct(idx, gpuVals.data());
+    std::vector<float> gpuVals(dim);
+    gpuIndex.reconstruct(idx, gpuVals.data());
-  std::vector<float> cpuVals(dim);
-  cpuIndex.reconstruct(idx, cpuVals.data());
+    std::vector<float> cpuVals(dim);
+    cpuIndex.reconstruct(idx, cpuVals.data());
-  EXPECT_EQ(gpuVals, cpuVals);
+    EXPECT_EQ(gpuVals, cpuVals);
 }
 TEST(TestGpuIndexFlat, UnifiedMemory) {
-  // Construct on a random device to test multi-device, if we have
-  // multiple devices
-  int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
-  if (!faiss::gpu::getFullUnifiedMemSupport(device)) {
-    return;
-  }
-  int dim = 256;
-  // FIXME: GpuIndexFlat doesn't support > 2^31 (vecs * dims) due to
-  // kernel indexing, so we can't test unified memory for memory
-  // oversubscription.
-  size_t numVecs = 50000;
-  int numQuery = 10;
-  int k = 10;
-  faiss::IndexFlatL2 cpuIndexL2(dim);
-  faiss::gpu::StandardGpuResources res;
-  res.noTempMemory();
-  faiss::gpu::GpuIndexFlatConfig config;
-  config.device = device;
-  config.memorySpace = faiss::gpu::MemorySpace::Unified;
-  faiss::gpu::GpuIndexFlatL2 gpuIndexL2(&res, dim, config);
-  std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
-  cpuIndexL2.add(numVecs, vecs.data());
-  gpuIndexL2.add(numVecs, vecs.data());
-  // To some extent, we depend upon the relative error for the test
-  // for float16
-  faiss::gpu::compareIndices(cpuIndexL2, gpuIndexL2,
-                             numQuery, dim, k, "Unified Memory",
-                             kF32MaxRelErr,
-                             0.1f,
-                             0.015f);
+    // Construct on a random device to test multi-device, if we have
+    // multiple devices
+    int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
+    if (!faiss::gpu::getFullUnifiedMemSupport(device)) {
+        return;
+    }
+    int dim = 256;
+    // FIXME: GpuIndexFlat doesn't support > 2^31 (vecs * dims) due to
+    // kernel indexing, so we can't test unified memory for memory
+    // oversubscription.
+    size_t numVecs = 50000;
+    int numQuery = 10;
+    int k = 10;
+    faiss::IndexFlatL2 cpuIndexL2(dim);
+    faiss::gpu::StandardGpuResources res;
+    res.noTempMemory();
+    faiss::gpu::GpuIndexFlatConfig config;
+    config.device = device;
+    config.memorySpace = faiss::gpu::MemorySpace::Unified;
+    faiss::gpu::GpuIndexFlatL2 gpuIndexL2(&res, dim, config);
+    std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
+    cpuIndexL2.add(numVecs, vecs.data());
+    gpuIndexL2.add(numVecs, vecs.data());
+    // To some extent, we depend upon the relative error for the test
+    // for float16
+    faiss::gpu::compareIndices(
+            cpuIndexL2,
+            gpuIndexL2,
+            numQuery,
+            dim,
+            k,
+            "Unified Memory",
+            kF32MaxRelErr,
+            0.1f,
+            0.015f);
 }
 int main(int argc, char** argv) {
-  testing::InitGoogleTest(&argc, argv);
+    testing::InitGoogleTest(&argc, argv);
-  // just run with a fixed test seed
-  faiss::gpu::setTestSeed(100);
+    // just run with a fixed test seed
+    faiss::gpu::setTestSeed(100);
-  return RUN_ALL_TESTS();
+    return RUN_ALL_TESTS();
 }