RubyGems - faiss - Versions diffs - 0.2.0 → 0.2.4 - Mend

faiss 0.2.0 → 0.2.4

Files changed (215) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +16 -0
data/LICENSE.txt +1 -1
data/README.md +7 -7
data/ext/faiss/extconf.rb +6 -3
data/ext/faiss/numo.hpp +4 -4
data/ext/faiss/utils.cpp +1 -1
data/ext/faiss/utils.h +1 -1
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +292 -291
data/vendor/faiss/faiss/AutoTune.h +55 -56
data/vendor/faiss/faiss/Clustering.cpp +365 -194
data/vendor/faiss/faiss/Clustering.h +102 -35
data/vendor/faiss/faiss/IVFlib.cpp +171 -195
data/vendor/faiss/faiss/IVFlib.h +48 -51
data/vendor/faiss/faiss/Index.cpp +85 -103
data/vendor/faiss/faiss/Index.h +54 -48
data/vendor/faiss/faiss/Index2Layer.cpp +126 -224
data/vendor/faiss/faiss/Index2Layer.h +22 -36
data/vendor/faiss/faiss/IndexAdditiveQuantizer.cpp +407 -0
data/vendor/faiss/faiss/IndexAdditiveQuantizer.h +195 -0
data/vendor/faiss/faiss/IndexBinary.cpp +45 -37
data/vendor/faiss/faiss/IndexBinary.h +140 -132
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +73 -53
data/vendor/faiss/faiss/IndexBinaryFlat.h +29 -24
data/vendor/faiss/faiss/IndexBinaryFromFloat.cpp +46 -43
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +16 -15
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +215 -232
data/vendor/faiss/faiss/IndexBinaryHNSW.h +25 -24
data/vendor/faiss/faiss/IndexBinaryHash.cpp +182 -177
data/vendor/faiss/faiss/IndexBinaryHash.h +41 -34
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +489 -461
data/vendor/faiss/faiss/IndexBinaryIVF.h +97 -68
data/vendor/faiss/faiss/IndexFlat.cpp +115 -176
data/vendor/faiss/faiss/IndexFlat.h +42 -59
data/vendor/faiss/faiss/IndexFlatCodes.cpp +67 -0
data/vendor/faiss/faiss/IndexFlatCodes.h +47 -0
data/vendor/faiss/faiss/IndexHNSW.cpp +372 -348
data/vendor/faiss/faiss/IndexHNSW.h +57 -41
data/vendor/faiss/faiss/IndexIVF.cpp +545 -453
data/vendor/faiss/faiss/IndexIVF.h +169 -118
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +316 -0
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.h +121 -0
data/vendor/faiss/faiss/IndexIVFFlat.cpp +247 -252
data/vendor/faiss/faiss/IndexIVFFlat.h +48 -51
data/vendor/faiss/faiss/IndexIVFPQ.cpp +459 -517
data/vendor/faiss/faiss/IndexIVFPQ.h +75 -67
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +406 -372
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +82 -57
data/vendor/faiss/faiss/IndexIVFPQR.cpp +104 -102
data/vendor/faiss/faiss/IndexIVFPQR.h +33 -28
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +163 -150
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +38 -25
data/vendor/faiss/faiss/IndexLSH.cpp +66 -113
data/vendor/faiss/faiss/IndexLSH.h +20 -38
data/vendor/faiss/faiss/IndexLattice.cpp +42 -56
data/vendor/faiss/faiss/IndexLattice.h +11 -16
data/vendor/faiss/faiss/IndexNNDescent.cpp +229 -0
data/vendor/faiss/faiss/IndexNNDescent.h +72 -0
data/vendor/faiss/faiss/IndexNSG.cpp +301 -0
data/vendor/faiss/faiss/IndexNSG.h +85 -0
data/vendor/faiss/faiss/IndexPQ.cpp +387 -495
data/vendor/faiss/faiss/IndexPQ.h +64 -82
data/vendor/faiss/faiss/IndexPQFastScan.cpp +143 -170
data/vendor/faiss/faiss/IndexPQFastScan.h +46 -32
data/vendor/faiss/faiss/IndexPreTransform.cpp +120 -150
data/vendor/faiss/faiss/IndexPreTransform.h +33 -36
data/vendor/faiss/faiss/IndexRefine.cpp +139 -127
data/vendor/faiss/faiss/IndexRefine.h +32 -23
data/vendor/faiss/faiss/IndexReplicas.cpp +147 -153
data/vendor/faiss/faiss/IndexReplicas.h +62 -56
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +111 -172
data/vendor/faiss/faiss/IndexScalarQuantizer.h +41 -59
data/vendor/faiss/faiss/IndexShards.cpp +256 -240
data/vendor/faiss/faiss/IndexShards.h +85 -73
data/vendor/faiss/faiss/MatrixStats.cpp +112 -97
data/vendor/faiss/faiss/MatrixStats.h +7 -10
data/vendor/faiss/faiss/MetaIndexes.cpp +135 -157
data/vendor/faiss/faiss/MetaIndexes.h +40 -34
data/vendor/faiss/faiss/MetricType.h +7 -7
data/vendor/faiss/faiss/VectorTransform.cpp +654 -475
data/vendor/faiss/faiss/VectorTransform.h +64 -89
data/vendor/faiss/faiss/clone_index.cpp +78 -73
data/vendor/faiss/faiss/clone_index.h +4 -9
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +33 -38
data/vendor/faiss/faiss/gpu/GpuAutoTune.h +11 -9
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +198 -171
data/vendor/faiss/faiss/gpu/GpuCloner.h +53 -35
data/vendor/faiss/faiss/gpu/GpuClonerOptions.cpp +12 -14
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +27 -25
data/vendor/faiss/faiss/gpu/GpuDistance.h +116 -112
data/vendor/faiss/faiss/gpu/GpuFaissAssert.h +1 -2
data/vendor/faiss/faiss/gpu/GpuIcmEncoder.h +60 -0
data/vendor/faiss/faiss/gpu/GpuIndex.h +134 -137
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +76 -73
data/vendor/faiss/faiss/gpu/GpuIndexFlat.h +173 -162
data/vendor/faiss/faiss/gpu/GpuIndexIVF.h +67 -64
data/vendor/faiss/faiss/gpu/GpuIndexIVFFlat.h +89 -86
data/vendor/faiss/faiss/gpu/GpuIndexIVFPQ.h +150 -141
data/vendor/faiss/faiss/gpu/GpuIndexIVFScalarQuantizer.h +101 -103
data/vendor/faiss/faiss/gpu/GpuIndicesOptions.h +17 -16
data/vendor/faiss/faiss/gpu/GpuResources.cpp +116 -128
data/vendor/faiss/faiss/gpu/GpuResources.h +182 -186
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +433 -422
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +131 -130
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.cpp +468 -456
data/vendor/faiss/faiss/gpu/impl/InterleavedCodes.h +25 -19
data/vendor/faiss/faiss/gpu/impl/RemapIndices.cpp +22 -20
data/vendor/faiss/faiss/gpu/impl/RemapIndices.h +9 -8
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +39 -44
data/vendor/faiss/faiss/gpu/perf/IndexWrapper.h +16 -14
data/vendor/faiss/faiss/gpu/perf/PerfClustering.cpp +77 -71
data/vendor/faiss/faiss/gpu/perf/PerfIVFPQAdd.cpp +109 -88
data/vendor/faiss/faiss/gpu/perf/WriteIndex.cpp +75 -64
data/vendor/faiss/faiss/gpu/test/TestCodePacking.cpp +230 -215
data/vendor/faiss/faiss/gpu/test/TestGpuIndexBinaryFlat.cpp +80 -86
data/vendor/faiss/faiss/gpu/test/TestGpuIndexFlat.cpp +284 -277
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +416 -416
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFPQ.cpp +611 -517
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFScalarQuantizer.cpp +166 -164
data/vendor/faiss/faiss/gpu/test/TestGpuMemoryException.cpp +61 -53
data/vendor/faiss/faiss/gpu/test/TestUtils.cpp +274 -238
data/vendor/faiss/faiss/gpu/test/TestUtils.h +73 -57
data/vendor/faiss/faiss/gpu/test/demo_ivfpq_indexing_gpu.cpp +47 -50
data/vendor/faiss/faiss/gpu/utils/DeviceUtils.h +79 -72
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.cpp +140 -146
data/vendor/faiss/faiss/gpu/utils/StackDeviceMemory.h +69 -71
data/vendor/faiss/faiss/gpu/utils/StaticUtils.h +21 -16
data/vendor/faiss/faiss/gpu/utils/Timer.cpp +25 -29
data/vendor/faiss/faiss/gpu/utils/Timer.h +30 -29
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +503 -0
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +175 -0
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +90 -120
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +81 -65
data/vendor/faiss/faiss/impl/FaissAssert.h +73 -58
data/vendor/faiss/faiss/impl/FaissException.cpp +56 -48
data/vendor/faiss/faiss/impl/FaissException.h +41 -29
data/vendor/faiss/faiss/impl/HNSW.cpp +606 -617
data/vendor/faiss/faiss/impl/HNSW.h +179 -200
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +855 -0
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +244 -0
data/vendor/faiss/faiss/impl/NNDescent.cpp +487 -0
data/vendor/faiss/faiss/impl/NNDescent.h +154 -0
data/vendor/faiss/faiss/impl/NSG.cpp +679 -0
data/vendor/faiss/faiss/impl/NSG.h +199 -0
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +484 -454
data/vendor/faiss/faiss/impl/PolysemousTraining.h +52 -55
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +26 -47
data/vendor/faiss/faiss/impl/ProductQuantizer.cpp +469 -459
data/vendor/faiss/faiss/impl/ProductQuantizer.h +76 -87
data/vendor/faiss/faiss/impl/ResidualQuantizer.cpp +758 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +188 -0
data/vendor/faiss/faiss/impl/ResultHandler.h +96 -132
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +647 -707
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +48 -46
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +129 -131
data/vendor/faiss/faiss/impl/ThreadedIndex.h +61 -55
data/vendor/faiss/faiss/impl/index_read.cpp +631 -480
data/vendor/faiss/faiss/impl/index_write.cpp +547 -407
data/vendor/faiss/faiss/impl/io.cpp +76 -95
data/vendor/faiss/faiss/impl/io.h +31 -41
data/vendor/faiss/faiss/impl/io_macros.h +60 -29
data/vendor/faiss/faiss/impl/kmeans1d.cpp +301 -0
data/vendor/faiss/faiss/impl/kmeans1d.h +48 -0
data/vendor/faiss/faiss/impl/lattice_Zn.cpp +137 -186
data/vendor/faiss/faiss/impl/lattice_Zn.h +40 -51
data/vendor/faiss/faiss/impl/platform_macros.h +29 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +77 -124
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +39 -48
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_1.cpp +41 -52
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +80 -117
data/vendor/faiss/faiss/impl/simd_result_handlers.h +109 -137
data/vendor/faiss/faiss/index_factory.cpp +619 -397
data/vendor/faiss/faiss/index_factory.h +8 -6
data/vendor/faiss/faiss/index_io.h +23 -26
data/vendor/faiss/faiss/invlists/BlockInvertedLists.cpp +67 -75
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +22 -24
data/vendor/faiss/faiss/invlists/DirectMap.cpp +96 -112
data/vendor/faiss/faiss/invlists/DirectMap.h +29 -33
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +307 -364
data/vendor/faiss/faiss/invlists/InvertedLists.h +151 -151
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +29 -34
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.h +17 -18
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +257 -293
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +50 -45
data/vendor/faiss/faiss/python/python_callbacks.cpp +23 -26
data/vendor/faiss/faiss/python/python_callbacks.h +9 -16
data/vendor/faiss/faiss/utils/AlignedTable.h +79 -44
data/vendor/faiss/faiss/utils/Heap.cpp +40 -48
data/vendor/faiss/faiss/utils/Heap.h +186 -209
data/vendor/faiss/faiss/utils/WorkerThread.cpp +67 -76
data/vendor/faiss/faiss/utils/WorkerThread.h +32 -33
data/vendor/faiss/faiss/utils/distances.cpp +305 -312
data/vendor/faiss/faiss/utils/distances.h +170 -122
data/vendor/faiss/faiss/utils/distances_simd.cpp +498 -508
data/vendor/faiss/faiss/utils/extra_distances-inl.h +117 -0
data/vendor/faiss/faiss/utils/extra_distances.cpp +113 -232
data/vendor/faiss/faiss/utils/extra_distances.h +30 -29
data/vendor/faiss/faiss/utils/hamming-inl.h +260 -209
data/vendor/faiss/faiss/utils/hamming.cpp +375 -469
data/vendor/faiss/faiss/utils/hamming.h +62 -85
data/vendor/faiss/faiss/utils/ordered_key_value.h +16 -18
data/vendor/faiss/faiss/utils/partitioning.cpp +393 -318
data/vendor/faiss/faiss/utils/partitioning.h +26 -21
data/vendor/faiss/faiss/utils/quantize_lut.cpp +78 -66
data/vendor/faiss/faiss/utils/quantize_lut.h +22 -20
data/vendor/faiss/faiss/utils/random.cpp +39 -63
data/vendor/faiss/faiss/utils/random.h +13 -16
data/vendor/faiss/faiss/utils/simdlib.h +4 -2
data/vendor/faiss/faiss/utils/simdlib_avx2.h +88 -85
data/vendor/faiss/faiss/utils/simdlib_emulated.h +226 -165
data/vendor/faiss/faiss/utils/simdlib_neon.h +832 -0
data/vendor/faiss/faiss/utils/utils.cpp +304 -287
data/vendor/faiss/faiss/utils/utils.h +54 -49
metadata +29 -4

data/vendor/faiss/faiss/VectorTransform.cpp CHANGED Viewed

@@ -10,20 +10,19 @@
 #include <faiss/VectorTransform.h>
 #include <cinttypes>
-#include <cstdio>
 #include <cmath>
+#include <cstdio>
 #include <cstring>
 #include <memory>
+#include <faiss/IndexPQ.h>
+#include <faiss/impl/FaissAssert.h>
 #include <faiss/utils/distances.h>
 #include <faiss/utils/random.h>
 #include <faiss/utils/utils.h>
-#include <faiss/impl/FaissAssert.h>
-#include <faiss/IndexPQ.h>
 using namespace faiss;
 extern "C" {
 // this is to keep the clang syntax checker happy
@@ -31,134 +30,183 @@ extern "C" {
 #define FINTEGER int
 #endif
 /* declare BLAS functions, see http://www.netlib.org/clapack/cblas/ */
-int sgemm_ (
-        const char *transa, const char *transb, FINTEGER *m, FINTEGER *
-        n, FINTEGER *k, const float *alpha, const float *a,
-        FINTEGER *lda, const float *b,
-        FINTEGER *ldb, float *beta,
-        float *c, FINTEGER *ldc);
-int dgemm_ (
-        const char *transa, const char *transb, FINTEGER *m, FINTEGER *
-        n, FINTEGER *k, const double *alpha, const double *a,
-        FINTEGER *lda, const double *b,
-        FINTEGER *ldb, double *beta,
-        double *c, FINTEGER *ldc);
-int ssyrk_ (
-        const char *uplo, const char *trans, FINTEGER *n, FINTEGER *k,
-        float *alpha, float *a, FINTEGER *lda,
-        float *beta, float *c, FINTEGER *ldc);
+int sgemm_(
+        const char* transa,
+        const char* transb,
+        FINTEGER* m,
+        FINTEGER* n,
+        FINTEGER* k,
+        const float* alpha,
+        const float* a,
+        FINTEGER* lda,
+        const float* b,
+        FINTEGER* ldb,
+        float* beta,
+        float* c,
+        FINTEGER* ldc);
+int dgemm_(
+        const char* transa,
+        const char* transb,
+        FINTEGER* m,
+        FINTEGER* n,
+        FINTEGER* k,
+        const double* alpha,
+        const double* a,
+        FINTEGER* lda,
+        const double* b,
+        FINTEGER* ldb,
+        double* beta,
+        double* c,
+        FINTEGER* ldc);
+int ssyrk_(
+        const char* uplo,
+        const char* trans,
+        FINTEGER* n,
+        FINTEGER* k,
+        float* alpha,
+        float* a,
+        FINTEGER* lda,
+        float* beta,
+        float* c,
+        FINTEGER* ldc);
 /* Lapack functions from http://www.netlib.org/clapack/old/single/ */
-int ssyev_ (
-        const char *jobz, const char *uplo, FINTEGER *n, float *a,
-        FINTEGER *lda, float *w, float *work, FINTEGER *lwork,
-        FINTEGER *info);
-int dsyev_ (
-        const char *jobz, const char *uplo, FINTEGER *n, double *a,
-        FINTEGER *lda, double *w, double *work, FINTEGER *lwork,
-        FINTEGER *info);
+int ssyev_(
+        const char* jobz,
+        const char* uplo,
+        FINTEGER* n,
+        float* a,
+        FINTEGER* lda,
+        float* w,
+        float* work,
+        FINTEGER* lwork,
+        FINTEGER* info);
+int dsyev_(
+        const char* jobz,
+        const char* uplo,
+        FINTEGER* n,
+        double* a,
+        FINTEGER* lda,
+        double* w,
+        double* work,
+        FINTEGER* lwork,
+        FINTEGER* info);
 int sgesvd_(
-        const char *jobu, const char *jobvt, FINTEGER *m, FINTEGER *n,
-        float *a, FINTEGER *lda, float *s, float *u, FINTEGER *ldu, float *vt,
-        FINTEGER *ldvt, float *work, FINTEGER *lwork, FINTEGER *info);
+        const char* jobu,
+        const char* jobvt,
+        FINTEGER* m,
+        FINTEGER* n,
+        float* a,
+        FINTEGER* lda,
+        float* s,
+        float* u,
+        FINTEGER* ldu,
+        float* vt,
+        FINTEGER* ldvt,
+        float* work,
+        FINTEGER* lwork,
+        FINTEGER* info);
 int dgesvd_(
-     const char *jobu, const char *jobvt, FINTEGER *m, FINTEGER *n,
-     double *a, FINTEGER *lda, double *s, double *u, FINTEGER *ldu, double *vt,
-     FINTEGER *ldvt, double *work, FINTEGER *lwork, FINTEGER *info);
+        const char* jobu,
+        const char* jobvt,
+        FINTEGER* m,
+        FINTEGER* n,
+        double* a,
+        FINTEGER* lda,
+        double* s,
+        double* u,
+        FINTEGER* ldu,
+        double* vt,
+        FINTEGER* ldvt,
+        double* work,
+        FINTEGER* lwork,
+        FINTEGER* info);
 }
 /*********************************************
  * VectorTransform
  *********************************************/
-float * VectorTransform::apply (Index::idx_t n, const float * x) const
-{
-    float * xt = new float[n * d_out];
-    apply_noalloc (n, x, xt);
+float* VectorTransform::apply(Index::idx_t n, const float* x) const {
+    float* xt = new float[n * d_out];
+    apply_noalloc(n, x, xt);
     return xt;
 }
-void VectorTransform::train (idx_t, const float *) {
+void VectorTransform::train(idx_t, const float*) {
     // does nothing by default
 }
-void VectorTransform::reverse_transform (
-             idx_t , const float *,
-             float *) const
-{
-    FAISS_THROW_MSG ("reverse transform not implemented");
+void VectorTransform::reverse_transform(idx_t, const float*, float*) const {
+    FAISS_THROW_MSG("reverse transform not implemented");
 }
 /*********************************************
  * LinearTransform
  *********************************************/
 /// both d_in > d_out and d_out < d_in are supported
-LinearTransform::LinearTransform (int d_in, int d_out,
-                                  bool have_bias):
-    VectorTransform (d_in, d_out), have_bias (have_bias),
-    is_orthonormal (false), verbose (false)
-{
+LinearTransform::LinearTransform(int d_in, int d_out, bool have_bias)
+        : VectorTransform(d_in, d_out),
+          have_bias(have_bias),
+          is_orthonormal(false),
+          verbose(false) {
     is_trained = false; // will be trained when A and b are initialized
 }
-void LinearTransform::apply_noalloc (Index::idx_t n, const float * x,
-                               float * xt) const
-{
+void LinearTransform::apply_noalloc(Index::idx_t n, const float* x, float* xt)
+        const {
     FAISS_THROW_IF_NOT_MSG(is_trained, "Transformation not trained yet");
     float c_factor;
     if (have_bias) {
-        FAISS_THROW_IF_NOT_MSG (b.size() == d_out, "Bias not initialized");
-        float * xi = xt;
+        FAISS_THROW_IF_NOT_MSG(b.size() == d_out, "Bias not initialized");
+        float* xi = xt;
         for (int i = 0; i < n; i++)
-            for(int j = 0; j < d_out; j++)
+            for (int j = 0; j < d_out; j++)
                 *xi++ = b[j];
         c_factor = 1.0;
     } else {
         c_factor = 0.0;
     }
-    FAISS_THROW_IF_NOT_MSG (A.size() == d_out * d_in,
-                      "Transformation matrix not initialized");
+    FAISS_THROW_IF_NOT_MSG(
+            A.size() == d_out * d_in, "Transformation matrix not initialized");
     float one = 1;
     FINTEGER nbiti = d_out, ni = n, di = d_in;
-    sgemm_ ("Transposed", "Not transposed",
-            &nbiti, &ni, &di,
-            &one, A.data(), &di, x, &di, &c_factor, xt, &nbiti);
+    sgemm_("Transposed",
+           "Not transposed",
+           &nbiti,
+           &ni,
+           &di,
+           &one,
+           A.data(),
+           &di,
+           x,
+           &di,
+           &c_factor,
+           xt,
+           &nbiti);
 }
-void LinearTransform::transform_transpose (idx_t n, const float * y,
-                                           float *x) const
-{
+void LinearTransform::transform_transpose(idx_t n, const float* y, float* x)
+        const {
     if (have_bias) { // allocate buffer to store bias-corrected data
-        float *y_new = new float [n * d_out];
-        const float *yr = y;
-        float *yw = y_new;
+        float* y_new = new float[n * d_out];
+        const float* yr = y;
+        float* yw = y_new;
         for (idx_t i = 0; i < n; i++) {
             for (int j = 0; j < d_out; j++) {
-                *yw++ = *yr++ - b [j];
+                *yw++ = *yr++ - b[j];
             }
         }
         y = y_new;
@@ -167,15 +215,26 @@ void LinearTransform::transform_transpose (idx_t n, const float * y,
     {
         FINTEGER dii = d_in, doi = d_out, ni = n;
         float one = 1.0, zero = 0.0;
-        sgemm_ ("Not", "Not", &dii, &ni, &doi,
-                &one, A.data (), &dii, y, &doi, &zero, x, &dii);
+        sgemm_("Not",
+               "Not",
+               &dii,
+               &ni,
+               &doi,
+               &one,
+               A.data(),
+               &dii,
+               y,
+               &doi,
+               &zero,
+               x,
+               &dii);
     }
-    if (have_bias) delete [] y;
+    if (have_bias)
+        delete[] y;
 }
-void LinearTransform::set_is_orthonormal ()
-{
+void LinearTransform::set_is_orthonormal() {
     if (d_out > d_in) {
         // not clear what we should do in this case
         is_orthonormal = false;
@@ -193,44 +252,53 @@ void LinearTransform::set_is_orthonormal ()
         FINTEGER dii = d_in, doi = d_out;
         float one = 1.0, zero = 0.0;
-        sgemm_ ("Transposed", "Not", &doi, &doi, &dii,
-                &one, A.data (), &dii,
-                A.data(), &dii,
-                &zero, ATA.data(), &doi);
+        sgemm_("Transposed",
+               "Not",
+               &doi,
+               &doi,
+               &dii,
+               &one,
+               A.data(),
+               &dii,
+               A.data(),
+               &dii,
+               &zero,
+               ATA.data(),
+               &doi);
         is_orthonormal = true;
         for (long i = 0; i < d_out; i++) {
             for (long j = 0; j < d_out; j++) {
                 float v = ATA[i + j * d_out];
-                if (i == j) v-= 1;
+                if (i == j)
+                    v -= 1;
                 if (fabs(v) > eps) {
                     is_orthonormal = false;
                 }
             }
         }
     }
 }
-void LinearTransform::reverse_transform (idx_t n, const float * xt,
-                                         float *x) const
-{
+void LinearTransform::reverse_transform(idx_t n, const float* xt, float* x)
+        const {
     if (is_orthonormal) {
-        transform_transpose (n, xt, x);
+        transform_transpose(n, xt, x);
     } else {
-        FAISS_THROW_MSG ("reverse transform not implemented for non-orthonormal matrices");
+        FAISS_THROW_MSG(
+                "reverse transform not implemented for non-orthonormal matrices");
     }
 }
-void LinearTransform::print_if_verbose (
-         const char*name, const std::vector<double> &mat,
-         int n, int d) const
-{
-    if (!verbose) return;
+void LinearTransform::print_if_verbose(
+        const char* name,
+        const std::vector<double>& mat,
+        int n,
+        int d) const {
+    if (!verbose)
+        return;
     printf("matrix %s: %d*%d [\n", name, n, d);
-    FAISS_THROW_IF_NOT (mat.size() >= n * d);
+    FAISS_THROW_IF_NOT(mat.size() >= n * d);
     for (int i = 0; i < n; i++) {
         for (int j = 0; j < d; j++) {
             printf("%10.5g ", mat[i * d + j]);
@@ -244,24 +312,22 @@ void LinearTransform::print_if_verbose (
  * RandomRotationMatrix
  *********************************************/
-void RandomRotationMatrix::init (int seed)
-{
-    if(d_out <= d_in) {
-        A.resize (d_out * d_in);
-        float *q = A.data();
+void RandomRotationMatrix::init(int seed) {
+    if (d_out <= d_in) {
+        A.resize(d_out * d_in);
+        float* q = A.data();
         float_randn(q, d_out * d_in, seed);
         matrix_qr(d_in, d_out, q);
     } else {
         // use tight-frame transformation
-        A.resize (d_out * d_out);
-        float *q = A.data();
+        A.resize(d_out * d_out);
+        float* q = A.data();
         float_randn(q, d_out * d_out, seed);
         matrix_qr(d_out, d_out, q);
         // remove columns
         int i, j;
         for (i = 0; i < d_out; i++) {
-            for(j = 0; j < d_in; j++) {
+            for (j = 0; j < d_in; j++) {
                 q[i * d_in + j] = q[i * d_out + j];
             }
         }
@@ -271,247 +337,281 @@ void RandomRotationMatrix::init (int seed)
     is_trained = true;
 }
-void RandomRotationMatrix::train (Index::idx_t /*n*/, const float * /*x*/)
-{
+void RandomRotationMatrix::train(Index::idx_t /*n*/, const float* /*x*/) {
     // initialize with some arbitrary seed
-    init (12345);
+    init(12345);
 }
 /*********************************************
  * PCAMatrix
  *********************************************/
-PCAMatrix::PCAMatrix (int d_in, int d_out,
-                      float eigen_power, bool random_rotation):
-    LinearTransform(d_in, d_out, true),
-    eigen_power(eigen_power), random_rotation(random_rotation)
-{
+PCAMatrix::PCAMatrix(
+        int d_in,
+        int d_out,
+        float eigen_power,
+        bool random_rotation)
+        : LinearTransform(d_in, d_out, true),
+          eigen_power(eigen_power),
+          random_rotation(random_rotation) {
     is_trained = false;
     max_points_per_d = 1000;
     balanced_bins = 0;
+    epsilon = 0;
 }
 namespace {
 /// Compute the eigenvalue decomposition of symmetric matrix cov,
 /// dimensions d_in-by-d_in. Output eigenvectors in cov.
-void eig(size_t d_in, double *cov, double *eigenvalues, int verbose)
-{
+void eig(size_t d_in, double* cov, double* eigenvalues, int verbose) {
     { // compute eigenvalues and vectors
         FINTEGER info = 0, lwork = -1, di = d_in;
         double workq;
-        dsyev_ ("Vectors as well", "Upper",
-                &di, cov, &di, eigenvalues, &workq, &lwork, &info);
+        dsyev_("Vectors as well",
+               "Upper",
+               &di,
+               cov,
+               &di,
+               eigenvalues,
+               &workq,
+               &lwork,
+               &info);
         lwork = FINTEGER(workq);
-        double *work = new double[lwork];
+        double* work = new double[lwork];
-        dsyev_ ("Vectors as well", "Upper",
-                &di, cov, &di, eigenvalues, work, &lwork, &info);
+        dsyev_("Vectors as well",
+               "Upper",
+               &di,
+               cov,
+               &di,
+               eigenvalues,
+               work,
+               &lwork,
+               &info);
-        delete [] work;
+        delete[] work;
         if (info != 0) {
-            fprintf (stderr, "WARN ssyev info returns %d, "
-                     "a very bad PCA matrix is learnt\n",
-                     int(info));
+            fprintf(stderr,
+                    "WARN ssyev info returns %d, "
+                    "a very bad PCA matrix is learnt\n",
+                    int(info));
             // do not throw exception, as the matrix could still be useful
         }
-        if(verbose && d_in <= 10) {
+        if (verbose && d_in <= 10) {
             printf("info=%ld new eigvals=[", long(info));
-            for(int j = 0; j < d_in; j++) printf("%g ", eigenvalues[j]);
+            for (int j = 0; j < d_in; j++)
+                printf("%g ", eigenvalues[j]);
             printf("]\n");
-            double *ci = cov;
+            double* ci = cov;
             printf("eigenvecs=\n");
-            for(int i = 0; i < d_in; i++) {
-                for(int j = 0; j < d_in; j++)
+            for (int i = 0; i < d_in; i++) {
+                for (int j = 0; j < d_in; j++)
                     printf("%10.4g ", *ci++);
                 printf("\n");
             }
         }
     }
     // revert order of eigenvectors & values
-    for(int i = 0; i < d_in / 2; i++) {
+    for (int i = 0; i < d_in / 2; i++) {
         std::swap(eigenvalues[i], eigenvalues[d_in - 1 - i]);
-        double *v1 = cov + i * d_in;
-        double *v2 = cov + (d_in - 1 - i) * d_in;
-        for(int j = 0; j < d_in; j++)
+        double* v1 = cov + i * d_in;
+        double* v2 = cov + (d_in - 1 - i) * d_in;
+        for (int j = 0; j < d_in; j++)
             std::swap(v1[j], v2[j]);
     }
 }
+} // namespace
-}
-void PCAMatrix::train (Index::idx_t n, const float *x)
-{
-    const float * x_in = x;
+void PCAMatrix::train(Index::idx_t n, const float* x) {
+    const float* x_in = x;
-    x = fvecs_maybe_subsample (d_in, (size_t*)&n,
-                               max_points_per_d * d_in, x, verbose);
+    x = fvecs_maybe_subsample(
+            d_in, (size_t*)&n, max_points_per_d * d_in, x, verbose);
-    ScopeDeleter<float> del_x (x != x_in ? x : nullptr);
+    ScopeDeleter<float> del_x(x != x_in ? x : nullptr);
     // compute mean
-    mean.clear(); mean.resize(d_in, 0.0);
+    mean.clear();
+    mean.resize(d_in, 0.0);
     if (have_bias) { // we may want to skip the bias
-        const float *xi = x;
+        const float* xi = x;
         for (int i = 0; i < n; i++) {
-            for(int j = 0; j < d_in; j++)
+            for (int j = 0; j < d_in; j++)
                 mean[j] += *xi++;
         }
-        for(int j = 0; j < d_in; j++)
+        for (int j = 0; j < d_in; j++)
             mean[j] /= n;
     }
-    if(verbose) {
+    if (verbose) {
         printf("mean=[");
-        for(int j = 0; j < d_in; j++) printf("%g ", mean[j]);
+        for (int j = 0; j < d_in; j++)
+            printf("%g ", mean[j]);
         printf("]\n");
     }
-    if(n >= d_in) {
+    if (n >= d_in) {
         // compute covariance matrix, store it in PCA matrix
         PCAMat.resize(d_in * d_in);
-        float * cov = PCAMat.data();
+        float* cov = PCAMat.data();
         { // initialize with  mean * mean^T term
-            float *ci = cov;
-            for(int i = 0; i < d_in; i++) {
-                for(int j = 0; j < d_in; j++)
-                    *ci++ = - n * mean[i] * mean[j];
+            float* ci = cov;
+            for (int i = 0; i < d_in; i++) {
+                for (int j = 0; j < d_in; j++)
+                    *ci++ = -n * mean[i] * mean[j];
             }
         }
         {
             FINTEGER di = d_in, ni = n;
             float one = 1.0;
-            ssyrk_ ("Up", "Non transposed",
-                    &di, &ni, &one, (float*)x, &di, &one, cov, &di);
+            ssyrk_("Up",
+                   "Non transposed",
+                   &di,
+                   &ni,
+                   &one,
+                   (float*)x,
+                   &di,
+                   &one,
+                   cov,
+                   &di);
         }
-        if(verbose && d_in <= 10) {
-            float *ci = cov;
+        if (verbose && d_in <= 10) {
+            float* ci = cov;
             printf("cov=\n");
-            for(int i = 0; i < d_in; i++) {
-                for(int j = 0; j < d_in; j++)
+            for (int i = 0; i < d_in; i++) {
+                for (int j = 0; j < d_in; j++)
                     printf("%10g ", *ci++);
                 printf("\n");
             }
         }
-        std::vector<double> covd (d_in * d_in);
-        for (size_t i = 0; i < d_in * d_in; i++) covd [i] = cov [i];
+        std::vector<double> covd(d_in * d_in);
+        for (size_t i = 0; i < d_in * d_in; i++)
+            covd[i] = cov[i];
-        std::vector<double> eigenvaluesd (d_in);
+        std::vector<double> eigenvaluesd(d_in);
-        eig (d_in, covd.data (), eigenvaluesd.data (), verbose);
+        eig(d_in, covd.data(), eigenvaluesd.data(), verbose);
-        for (size_t i = 0; i < d_in * d_in; i++) PCAMat [i] = covd [i];
-        eigenvalues.resize (d_in);
+        for (size_t i = 0; i < d_in * d_in; i++)
+            PCAMat[i] = covd[i];
+        eigenvalues.resize(d_in);
         for (size_t i = 0; i < d_in; i++)
-            eigenvalues [i] = eigenvaluesd [i];
+            eigenvalues[i] = eigenvaluesd[i];
     } else {
-        std::vector<float> xc (n * d_in);
+        std::vector<float> xc(n * d_in);
         for (size_t i = 0; i < n; i++)
-            for(size_t j = 0; j < d_in; j++)
-                xc [i * d_in + j] = x [i * d_in + j] - mean[j];
+            for (size_t j = 0; j < d_in; j++)
+                xc[i * d_in + j] = x[i * d_in + j] - mean[j];
         // compute Gram matrix
-        std::vector<float> gram (n * n);
+        std::vector<float> gram(n * n);
         {
             FINTEGER di = d_in, ni = n;
             float one = 1.0, zero = 0.0;
-            ssyrk_ ("Up", "Transposed",
-                    &ni, &di, &one, xc.data(), &di, &zero, gram.data(), &ni);
+            ssyrk_("Up",
+                   "Transposed",
+                   &ni,
+                   &di,
+                   &one,
+                   xc.data(),
+                   &di,
+                   &zero,
+                   gram.data(),
+                   &ni);
         }
-        if(verbose && d_in <= 10) {
-            float *ci = gram.data();
+        if (verbose && d_in <= 10) {
+            float* ci = gram.data();
             printf("gram=\n");
-            for(int i = 0; i < n; i++) {
-                for(int j = 0; j < n; j++)
+            for (int i = 0; i < n; i++) {
+                for (int j = 0; j < n; j++)
                     printf("%10g ", *ci++);
                 printf("\n");
             }
         }
-        std::vector<double> gramd (n * n);
+        std::vector<double> gramd(n * n);
         for (size_t i = 0; i < n * n; i++)
-            gramd [i] = gram [i];
+            gramd[i] = gram[i];
-        std::vector<double> eigenvaluesd (n);
+        std::vector<double> eigenvaluesd(n);
         // eig will fill in only the n first eigenvals
-        eig (n, gramd.data (), eigenvaluesd.data (), verbose);
+        eig(n, gramd.data(), eigenvaluesd.data(), verbose);
         PCAMat.resize(d_in * n);
         for (size_t i = 0; i < n * n; i++)
-            gram [i] = gramd [i];
+            gram[i] = gramd[i];
-        eigenvalues.resize (d_in);
+        eigenvalues.resize(d_in);
         // fill in only the n first ones
         for (size_t i = 0; i < n; i++)
-            eigenvalues [i] = eigenvaluesd [i];
+            eigenvalues[i] = eigenvaluesd[i];
         { // compute PCAMat = x' * v
             FINTEGER di = d_in, ni = n;
             float one = 1.0;
-            sgemm_ ("Non", "Non Trans",
-                    &di, &ni, &ni,
-                    &one, xc.data(), &di, gram.data(), &ni,
-                    &one, PCAMat.data(), &di);
+            sgemm_("Non",
+                   "Non Trans",
+                   &di,
+                   &ni,
+                   &ni,
+                   &one,
+                   xc.data(),
+                   &di,
+                   gram.data(),
+                   &ni,
+                   &one,
+                   PCAMat.data(),
+                   &di);
         }
-        if(verbose && d_in <= 10) {
-            float *ci = PCAMat.data();
+        if (verbose && d_in <= 10) {
+            float* ci = PCAMat.data();
             printf("PCAMat=\n");
-            for(int i = 0; i < n; i++) {
-                for(int j = 0; j < d_in; j++)
+            for (int i = 0; i < n; i++) {
+                for (int j = 0; j < d_in; j++)
                     printf("%10g ", *ci++);
                 printf("\n");
             }
         }
-        fvec_renorm_L2 (d_in, n, PCAMat.data());
+        fvec_renorm_L2(d_in, n, PCAMat.data());
     }
     prepare_Ab();
     is_trained = true;
 }
-void PCAMatrix::copy_from (const PCAMatrix & other)
-{
-    FAISS_THROW_IF_NOT (other.is_trained);
+void PCAMatrix::copy_from(const PCAMatrix& other) {
+    FAISS_THROW_IF_NOT(other.is_trained);
     mean = other.mean;
     eigenvalues = other.eigenvalues;
     PCAMat = other.PCAMat;
-    prepare_Ab ();
+    prepare_Ab();
     is_trained = true;
 }
-void PCAMatrix::prepare_Ab ()
-{
-    FAISS_THROW_IF_NOT_FMT (
+void PCAMatrix::prepare_Ab() {
     // Rebuilds the applied matrix A and the bias vector b from PCAMat.
     // Requires PCAMat to hold at least d_out * d_in entries.
     //  - Without random_rotation: A starts as a copy of PCAMat, is optionally
     //    scaled per output component by pow(eigenvalue + epsilon, eigen_power)
     //    and optionally regrouped into `balanced_bins` bins of equal size.
     //  - With random_rotation: a d_out x d_out RandomRotationMatrix is
     //    optionally scaled and then combined with PCAMat into A via sgemm_.
     // Some steps of this function sit in elided diff hunks and are not
     // described here.
+    FAISS_THROW_IF_NOT_FMT(
             d_out * d_in <= PCAMat.size(),
             "PCA matrix cannot output %d dimensions from %d ",
-            d_out, d_in);
+            d_out,
+            d_in);
     if (!random_rotation) {
         A = PCAMat;
@@ -519,23 +619,23 @@ void PCAMatrix::prepare_Ab ()
         // first scale the components
         if (eigen_power != 0) {
-            float *ai = A.data();
+            float* ai = A.data();
             for (int i = 0; i < d_out; i++) {
                 // One factor per output component i, applied to its d_in
                 // consecutive entries. The new version adds `epsilon` to the
                 // eigenvalue before raising it to eigen_power.
-                float factor = pow(eigenvalues[i], eigen_power);
-                for(int j = 0; j < d_in; j++)
+                float factor = pow(eigenvalues[i] + epsilon, eigen_power);
+                for (int j = 0; j < d_in; j++)
                     *ai++ *= factor;
             }
         }
         if (balanced_bins != 0) {
             // d_out must split evenly into balanced_bins bins of dsub rows.
-            FAISS_THROW_IF_NOT (d_out % balanced_bins == 0);
+            FAISS_THROW_IF_NOT(d_out % balanced_bins == 0);
             int dsub = d_out / balanced_bins;
             // Move the current A into Ain so its rows can be copied back
             // into a fresh A in bin order.
-            std::vector <float> Ain;
+            std::vector<float> Ain;
             std::swap(A, Ain);
             A.resize(d_out * d_in);
             // Per-bin running eigenvalue sum and number of rows placed so far.
-            std::vector <float> accu(balanced_bins);
-            std::vector <int> counter(balanced_bins);
+            std::vector<float> accu(balanced_bins);
+            std::vector<int> counter(balanced_bins);
             // greedy assignment
             for (int i = 0; i < d_out; i++) {
@@ -550,9 +650,8 @@ void PCAMatrix::prepare_Ab ()
                 }
                 // best_j is selected in lines not shown in this diff. Row i
                 // goes to the next free slot of that bin.
                 int row_dst = best_j * dsub + counter[best_j];
                 accu[best_j] += eigenvalues[i];
-                counter[best_j] ++;
-                memcpy (&A[row_dst * d_in], &Ain[i * d_in],
-                        d_in * sizeof (A[0]));
+                counter[best_j]++;
+                memcpy(&A[row_dst * d_in], &Ain[i * d_in], d_in * sizeof(A[0]));
             }
             if (verbose) {
@@ -563,11 +662,11 @@ void PCAMatrix::prepare_Ab ()
             }
         }
     } else {
-        FAISS_THROW_IF_NOT_MSG (balanced_bins == 0,
-             "both balancing bins and applying a random rotation "
-             "does not make sense");
+        FAISS_THROW_IF_NOT_MSG(
+                balanced_bins == 0,
+                "both balancing bins and applying a random rotation "
+                "does not make sense");
         // Rotation matrix initialised with the fixed value 5 passed to init().
         RandomRotationMatrix rr(d_out, d_out);
         rr.init(5);
@@ -576,8 +675,8 @@ void PCAMatrix::prepare_Ab ()
         if (eigen_power != 0) {
             for (int i = 0; i < d_out; i++) {
                 // NOTE(review): unlike the non-rotation branch above, this
                 // factor does not add `epsilon` to the eigenvalue - confirm
                 // whether the difference is intended.
                 float factor = pow(eigenvalues[i], eigen_power);
-                for(int j = 0; j < d_out; j++)
-                   rr.A[j * d_out + i] *= factor;
+                for (int j = 0; j < d_out; j++)
+                    rr.A[j * d_out + i] *= factor;
             }
         }
@@ -586,15 +685,24 @@ void PCAMatrix::prepare_Ab ()
             FINTEGER dii = d_in, doo = d_out;
             float one = 1.0, zero = 0.0;
             // A = PCAMat combined with the (scaled) rotation rr.A; beta is
             // zero, so previous contents of A are not accumulated.
-            sgemm_ ("Not", "Not", &dii, &doo, &doo,
-                    &one, PCAMat.data(), &dii, rr.A.data(), &doo, &zero,
-                    A.data(), &dii);
+            sgemm_("Not",
+                   "Not",
+                   &dii,
+                   &doo,
+                   &doo,
+                   &one,
+                   PCAMat.data(),
+                   &dii,
+                   rr.A.data(),
+                   &doo,
+                   &zero,
+                   A.data(),
+                   &dii);
         }
     }
     // Reset the bias to d_out value-initialised entries before filling it.
-    b.clear(); b.resize(d_out);
+    b.clear();
+    b.resize(d_out);
     for (int i = 0; i < d_out; i++) {
         float accu = 0;
@@ -604,57 +712,61 @@ void PCAMatrix::prepare_Ab ()
     }
     // The transform is flagged orthonormal only when no eigenvalue scaling
     // was requested.
     is_orthonormal = eigen_power == 0;
 }
 /*********************************************
  * ITQMatrix
  *********************************************/
-ITQMatrix::ITQMatrix (int d):
-    LinearTransform(d, d, false),
-    max_iter (50),
-    seed (123)
-{
-}
 // Builds a square d -> d LinearTransform with max_iter = 50 and seed = 123.
 // The third base-constructor argument is `false` (presumably "no bias" -
 // confirm against the LinearTransform declaration).
+ITQMatrix::ITQMatrix(int d)
+        : LinearTransform(d, d, false), max_iter(50), seed(123) {}
 /** translated from fbcode/deeplearning/catalyzer/catalyzer/quantizers.py */
-void ITQMatrix::train (Index::idx_t n, const float* xf)
-{
+void ITQMatrix::train(Index::idx_t n, const float* xf) {
     // Iteratively refines a d x d rotation (d = d_in) from n training vectors
     // in xf (n * d floats). Each of the max_iter iterations rotates the data,
     // binarizes it to +/-1, multiplies it with the data into a d x d matrix,
     // takes its SVD, and forms the next rotation from u and vt. On exit the
     // transposed rotation is stored in A and is_trained is set.
     // All intermediate computations are carried out in double precision.
     size_t d = d_in;
-    std::vector<double> rotation (d * d);
+    std::vector<double> rotation(d * d);
     // Start from the caller-provided init_rotation when it has exactly
     // d * d entries, otherwise from a RandomRotationMatrix seeded by `seed`.
     if (init_rotation.size() == d * d) {
-        memcpy (rotation.data(), init_rotation.data(),
-                d * d * sizeof(rotation[0]));
+        memcpy(rotation.data(),
+               init_rotation.data(),
+               d * d * sizeof(rotation[0]));
     } else {
-        RandomRotationMatrix rrot (d, d);
-        rrot.init (seed);
+        RandomRotationMatrix rrot(d, d);
+        rrot.init(seed);
         for (size_t i = 0; i < d * d; i++) {
             rotation[i] = rrot.A[i];
         }
     }
     // Widen the float training data to double.
-    std::vector<double> x (n * d);
+    std::vector<double> x(n * d);
     for (size_t i = 0; i < n * d; i++) {
         x[i] = xf[i];
     }
-    std::vector<double> rotated_x (n * d), cov_mat (d * d);
-    std::vector<double> u (d * d), vt (d * d), singvals (d);
+    std::vector<double> rotated_x(n * d), cov_mat(d * d);
+    std::vector<double> u(d * d), vt(d * d), singvals(d);
     for (int i = 0; i < max_iter; i++) {
-        print_if_verbose ("rotation", rotation, d, d);
+        print_if_verbose("rotation", rotation, d, d);
         { // rotated_data = np.dot(training_data, rotation)
             FINTEGER di = d, ni = n;
             double one = 1, zero = 0;
-            dgemm_ ("N", "N", &di, &ni, &di,
-                    &one, rotation.data(), &di, x.data(), &di,
-                    &zero, rotated_x.data(), &di);
+            dgemm_("N",
+                   "N",
+                   &di,
+                   &ni,
+                   &di,
+                   &one,
+                   rotation.data(),
+                   &di,
+                   x.data(),
+                   &di,
+                   &zero,
+                   rotated_x.data(),
+                   &di);
         }
-        print_if_verbose ("rotated_x", rotated_x, n, d);
+        print_if_verbose("rotated_x", rotated_x, n, d);
         // binarize
         for (size_t j = 0; j < n * d; j++) {
             // Negative entries become -1; zero and positive entries become +1.
             rotated_x[j] = rotated_x[j] < 0 ? -1 : 1;
@@ -663,88 +775,119 @@ void ITQMatrix::train (Index::idx_t n, const float* xf)
         { // rotated_data = np.dot(training_data, rotation)
             // NOTE(review): the comment above repeats the earlier one, but
             // this call writes cov_mat from rotated_x and x - it looks
             // copy-pasted; confirm and reword.
             FINTEGER di = d, ni = n;
             double one = 1, zero = 0;
-            dgemm_ ("N", "T", &di, &di, &ni,
-                    &one, rotated_x.data(), &di, x.data(), &di,
-                    &zero, cov_mat.data(), &di);
+            dgemm_("N",
+                   "T",
+                   &di,
+                   &di,
+                   &ni,
+                   &one,
+                   rotated_x.data(),
+                   &di,
+                   x.data(),
+                   &di,
+                   &zero,
+                   cov_mat.data(),
+                   &di);
         }
-        print_if_verbose ("cov_mat", cov_mat, d, d);
+        print_if_verbose("cov_mat", cov_mat, d, d);
         // SVD
         {
             FINTEGER di = d;
             FINTEGER lwork = -1, info;
             double lwork1;
             // workspace query
             // (lwork == -1: the first call only reports the needed workspace
             // size through lwork1; the second call does the decomposition.)
-            dgesvd_ ("A", "A", &di, &di, cov_mat.data(), &di,
-                     singvals.data(), u.data(), &di,
-                     vt.data(), &di,
-                     &lwork1, &lwork, &info);
-            FAISS_THROW_IF_NOT (info == 0);
-            lwork = size_t (lwork1);
-            std::vector<double> work (lwork);
-            dgesvd_ ("A", "A", &di, &di, cov_mat.data(), &di,
-                     singvals.data(), u.data(), &di,
-                     vt.data(), &di,
-                     work.data(), &lwork, &info);
-            FAISS_THROW_IF_NOT_FMT (info == 0, "sgesvd returned info=%d", info);
+            dgesvd_("A",
+                    "A",
+                    &di,
+                    &di,
+                    cov_mat.data(),
+                    &di,
+                    singvals.data(),
+                    u.data(),
+                    &di,
+                    vt.data(),
+                    &di,
+                    &lwork1,
+                    &lwork,
+                    &info);
+            FAISS_THROW_IF_NOT(info == 0);
+            lwork = size_t(lwork1);
+            std::vector<double> work(lwork);
+            dgesvd_("A",
+                    "A",
+                    &di,
+                    &di,
+                    cov_mat.data(),
+                    &di,
+                    singvals.data(),
+                    u.data(),
+                    &di,
+                    vt.data(),
+                    &di,
+                    work.data(),
+                    &lwork,
+                    &info);
             // NOTE(review): the routine called above is dgesvd_, yet the
             // message below names "sgesvd". `info` is a FINTEGER printed with
             // %d - confirm FINTEGER is int-sized on all supported builds.
+            FAISS_THROW_IF_NOT_FMT(info == 0, "sgesvd returned info=%d", info);
         }
-        print_if_verbose ("u", u, d, d);
-        print_if_verbose ("vt", vt, d, d);
+        print_if_verbose("u", u, d, d);
+        print_if_verbose("vt", vt, d, d);
         // update rotation
         {
             FINTEGER di = d;
             double one = 1, zero = 0;
-            dgemm_ ("N", "T", &di, &di, &di,
-                    &one, u.data(), &di, vt.data(), &di,
-                    &zero, rotation.data(), &di);
+            dgemm_("N",
+                   "T",
+                   &di,
+                   &di,
+                   &di,
+                   &one,
+                   u.data(),
+                   &di,
+                   vt.data(),
+                   &di,
+                   &zero,
+                   rotation.data(),
+                   &di);
         }
-        print_if_verbose ("final rot", rotation, d, d);
+        print_if_verbose("final rot", rotation, d, d);
     }
     // Store the transpose of the final rotation into A.
-    A.resize (d * d);
+    A.resize(d * d);
     for (size_t i = 0; i < d; i++) {
         for (size_t j = 0; j < d; j++) {
             A[i + d * j] = rotation[j + d * i];
         }
     }
     is_trained = true;
 }
-ITQTransform::ITQTransform (int d_in, int d_out, bool do_pca):
-    VectorTransform (d_in, d_out),
-    do_pca (do_pca),
-    itq (d_out),
-    pca_then_itq (d_in, d_out, false)
-{
+ITQTransform::ITQTransform(int d_in, int d_out, bool do_pca)
+        : VectorTransform(d_in, d_out),
+          do_pca(do_pca),
+          itq(d_out),
+          pca_then_itq(d_in, d_out, false) {
     // Sets up a d_in -> d_out transform made of an ITQ stage of size d_out
     // and a combined matrix pca_then_itq. When do_pca is false no dimension
     // reduction is available, so d_in must equal d_out (throws otherwise).
     // The object starts untrained with max_train_per_dim = 10.
     if (!do_pca) {
-        FAISS_THROW_IF_NOT (d_in == d_out);
+        FAISS_THROW_IF_NOT(d_in == d_out);
     }
     max_train_per_dim = 10;
     is_trained = false;
 }
+void ITQTransform::train(idx_t n, const float* x) {
     // Trains the transform from n vectors of dimension d_in:
     //   1. optionally subsample the training set,
     //   2. center (accumulating into `mean`) and L2-renormalize into x_norm,
     //   3. when do_pca is set, train a PCAMatrix and apply it,
     //   4. train the ITQ rotation on the result,
     //   5. store the combined matrix in pca_then_itq.A.
     // Throws if the transform is already trained. Parts of the body are in
     // elided diff hunks and are not described here.
+    FAISS_THROW_IF_NOT(!is_trained);
-void ITQTransform::train (idx_t n, const float *x)
-{
-    FAISS_THROW_IF_NOT (!is_trained);
-    const float * x_in = x;
+    const float* x_in = x;
     // Cap on the number of training points handed to the subsampler.
     size_t max_train_points = std::max(d_in * max_train_per_dim, 32768);
     // NOTE(review): `(size_t*)&n` reinterprets an idx_t* as size_t*; this
     // relies on both types having the same size - confirm.
-    x = fvecs_maybe_subsample (d_in, (size_t*)&n, max_train_points, x);
+    x = fvecs_maybe_subsample(d_in, (size_t*)&n, max_train_points, x);
     // Only hand the buffer to the deleter when the subsampler returned a
     // pointer different from the caller's (presumably a new allocation).
-    ScopeDeleter<float> del_x (x != x_in ? x : nullptr);
+    ScopeDeleter<float> del_x(x != x_in ? x : nullptr);
-    std::unique_ptr<float []> x_norm(new float[n * d_in]);
+    std::unique_ptr<float[]> x_norm(new float[n * d_in]);
     { // normalize
         int d = d_in;
-        mean.resize (d, 0);
+        mean.resize(d, 0);
         for (idx_t i = 0; i < n; i++) {
             for (idx_t j = 0; j < d; j++) {
                 mean[j] += x[i * d + j];
@@ -755,38 +898,47 @@ void ITQTransform::train (idx_t n, const float *x)
         }
         for (idx_t i = 0; i < n; i++) {
             for (idx_t j = 0; j < d; j++) {
-            x_norm[i * d + j] = x[i * d + j] - mean[j];
+                x_norm[i * d + j] = x[i * d + j] - mean[j];
             }
         }
-        fvec_renorm_L2 (d_in, n, x_norm.get());
+        fvec_renorm_L2(d_in, n, x_norm.get());
     }
     // train PCA
-    PCAMatrix pca (d_in, d_out);
-    float *x_pca;
-    std::unique_ptr<float []> x_pca_del;
+    PCAMatrix pca(d_in, d_out);
+    float* x_pca;
+    std::unique_ptr<float[]> x_pca_del;
     if (do_pca) {
-        pca.have_bias = false;  // for consistency with reference implem
-        pca.train (n, x_norm.get());
-        x_pca = pca.apply (n, x_norm.get());
+        pca.have_bias = false; // for consistency with reference implem
+        pca.train(n, x_norm.get());
+        x_pca = pca.apply(n, x_norm.get());
         // x_pca_del takes ownership of the buffer returned by apply().
         x_pca_del.reset(x_pca);
     } else {
         // No PCA: ITQ is trained directly on the normalized data, which stays
         // owned by x_norm.
         x_pca = x_norm.get();
     }
     // train ITQ
-    itq.train (n, x_pca);
+    itq.train(n, x_pca);
     // merge PCA and ITQ
     if (do_pca) {
         FINTEGER di = d_out, dini = d_in;
         float one = 1, zero = 0;
         pca_then_itq.A.resize(d_in * d_out);
-        sgemm_ ("N", "N", &dini, &di, &di,
-                &one, pca.A.data(), &dini,
-                itq.A.data(), &di,
-                &zero, pca_then_itq.A.data(), &dini);
+        sgemm_("N",
+               "N",
+               &dini,
+               &di,
+               &di,
+               &one,
+               pca.A.data(),
+               &dini,
+               itq.A.data(),
+               &di,
+               &zero,
+               pca_then_itq.A.data(),
+               &dini);
     } else {
         pca_then_itq.A = itq.A;
     }
@@ -794,12 +946,11 @@ void ITQTransform::train (idx_t n, const float *x)
     is_trained = true;
 }
-void ITQTransform::apply_noalloc (Index::idx_t n, const float * x,
-                               float * xt) const
-{
+void ITQTransform::apply_noalloc(Index::idx_t n, const float* x, float* xt)
+        const {
     // Applies the trained transform to n input vectors `x`, writing into the
     // caller-provided `xt`. The input is first normalized into a temporary
     // buffer x_norm (n * d_in floats), L2-renormalized, and then passed
     // through pca_then_itq. Throws when the transform is not trained.
     FAISS_THROW_IF_NOT_MSG(is_trained, "Transformation not trained yet");
-    std::unique_ptr<float []> x_norm(new float[n * d_in]);
+    std::unique_ptr<float[]> x_norm(new float[n * d_in]);
     { // normalize
         int d = d_in;
         for (idx_t i = 0; i < n; i++) {
@@ -809,41 +960,36 @@ void ITQTransform::apply_noalloc (Index::idx_t n, const float * x,
         }
         // this is not really useful if we are going to binarize right
         // afterwards but OK
-        fvec_renorm_L2 (d_in, n, x_norm.get());
+        fvec_renorm_L2(d_in, n, x_norm.get());
     }
-    pca_then_itq.apply_noalloc (n, x_norm.get(), xt);
+    pca_then_itq.apply_noalloc(n, x_norm.get(), xt);
 }
 /*********************************************
  * OPQMatrix
  *********************************************/
-OPQMatrix::OPQMatrix (int d, int M, int d2):
-    LinearTransform (d, d2 == -1 ? d : d2, false), M(M),
-    niter (50),
-    niter_pq (4), niter_pq_0 (40),
-    verbose(false),
-    pq(nullptr)
-{
+OPQMatrix::OPQMatrix(int d, int M, int d2)
+        : LinearTransform(d, d2 == -1 ? d : d2, false),
+          M(M),
+          niter(50),
+          niter_pq(4),
+          niter_pq_0(40),
+          verbose(false),
+          pq(nullptr) {
     // Creates an untrained d -> d2 transform; passing d2 == -1 keeps the
     // output dimension equal to d. Defaults set here: niter = 50,
     // niter_pq = 4, niter_pq_0 = 40, verbose = false, no external pq.
     is_trained = false;
     // OPQ is quite expensive to train, so set this right.
     max_train_points = 256 * 256;
     // NOTE(review): pq is already initialised to nullptr in the initializer
     // list, so this assignment is redundant.
     pq = nullptr;
 }
+void OPQMatrix::train(Index::idx_t n, const float* x) {
     // Trains the OPQ rotation from n vectors of dimension d_in. After
     // optional subsampling and centering, it alternates for `niter` rounds
     // between (a) projecting the data with the current rotation and training
     // a product quantizer on it, and (b) updating the rotation from an SVD of
     // the product of the PQ reconstruction with the training data. The result
     // is left in A; is_trained and is_orthonormal are set on exit.
     // Parts of the body (including the definition of d2) are in elided diff
     // hunks and are not described here.
+    const float* x_in = x;
     // NOTE(review): `(size_t*)&n` reinterprets an idx_t* as size_t*; this
     // relies on both types having the same size - confirm.
+    x = fvecs_maybe_subsample(d_in, (size_t*)&n, max_train_points, x, verbose);
-void OPQMatrix::train (Index::idx_t n, const float *x)
-{
-    const float * x_in = x;
-    x = fvecs_maybe_subsample (d_in, (size_t*)&n,
-                               max_train_points, x, verbose);
-    ScopeDeleter<float> del_x (x != x_in ? x : nullptr);
+    ScopeDeleter<float> del_x(x != x_in ? x : nullptr);
     // To support d_out > d_in, we pad input vectors with 0s to d_out
     size_t d = d_out <= d_in ? d_in : d_out;
@@ -867,22 +1013,26 @@ void OPQMatrix::train (Index::idx_t n, const float *x)
 #endif
     if (verbose) {
-        printf ("OPQMatrix::train: training an OPQ rotation matrix "
-                "for M=%d from %" PRId64 " vectors in %dD -> %dD\n",
-                M, n, d_in, d_out);
+        printf("OPQMatrix::train: training an OPQ rotation matrix "
+               "for M=%d from %" PRId64 " vectors in %dD -> %dD\n",
+               M,
+               n,
+               d_in,
+               d_out);
     }
     // Working copy of the training set, n rows of (possibly padded) width d.
-    std::vector<float> xtrain (n * d);
+    std::vector<float> xtrain(n * d);
     // center x
     {
         // Only the first d_in components are accumulated; any padding
         // components keep a zero sum.
-        std::vector<float> sum (d);
-        const float *xi = x;
+        std::vector<float> sum(d);
+        const float* xi = x;
         for (size_t i = 0; i < n; i++) {
             for (int j = 0; j < d_in; j++)
-                sum [j] += *xi++;
+                sum[j] += *xi++;
         }
         // NOTE(review): `int i` is compared against the size_t `d` here
         // (signed/unsigned comparison).
-        for (int i = 0; i < d; i++) sum[i] /= n;
-        float *yi = xtrain.data();
+        for (int i = 0; i < d; i++)
+            sum[i] /= n;
+        float* yi = xtrain.data();
         xi = x;
         for (size_t i = 0; i < n; i++) {
             for (int j = 0; j < d_in; j++)
@@ -890,71 +1040,80 @@ void OPQMatrix::train (Index::idx_t n, const float *x)
             // Skip over the padding columns of this output row.
             yi += d - d_in;
         }
     }
-    float *rotation;
+    float* rotation;
     // With no matrix supplied in A, start from random values passed through
     // matrix_qr; otherwise A must already hold d * d2 entries and is refined
     // in place.
-    if (A.size () == 0) {
-        A.resize (d * d);
+    if (A.size() == 0) {
+        A.resize(d * d);
         rotation = A.data();
         if (verbose)
             printf("  OPQMatrix::train: making random %zd*%zd rotation\n",
-                   d, d);
-        float_randn (rotation, d * d, 1234);
-        matrix_qr (d, d, rotation);
+                   d,
+                   d);
+        float_randn(rotation, d * d, 1234);
+        matrix_qr(d, d, rotation);
         // we use only the d * d2 upper part of the matrix
-        A.resize (d * d2);
+        A.resize(d * d2);
     } else {
-        FAISS_THROW_IF_NOT (A.size() == d * d2);
+        FAISS_THROW_IF_NOT(A.size() == d * d2);
         rotation = A.data();
     }
     // Scratch buffers: projected data, PQ reconstruction, the matrix fed to
     // the SVD, and `tmp`, which holds u, vt and the singular values.
-    std::vector<float>
-        xproj (d2 * n), pq_recons (d2 * n), xxr (d * n),
-        tmp(d * d * 4);
+    std::vector<float> xproj(d2 * n), pq_recons(d2 * n), xxr(d * n),
+            tmp(d * d * 4);
     // Use the caller-supplied quantizer when `pq` is set, otherwise a local
     // ProductQuantizer(d2, M, 8).
-    ProductQuantizer pq_default (d2, M, 8);
-    ProductQuantizer &pq_regular = pq ? *pq : pq_default;
-    std::vector<uint8_t> codes (pq_regular.code_size * n);
+    ProductQuantizer pq_default(d2, M, 8);
+    ProductQuantizer& pq_regular = pq ? *pq : pq_default;
+    std::vector<uint8_t> codes(pq_regular.code_size * n);
     double t0 = getmillisecs();
     for (int iter = 0; iter < niter; iter++) {
         { // torch.mm(xtrain, rotation:t())
             FINTEGER di = d, d2i = d2, ni = n;
             float zero = 0, one = 1;
-            sgemm_ ("Transposed", "Not transposed",
-                    &d2i, &ni, &di,
-                    &one, rotation, &di,
-                    xtrain.data(), &di,
-                    &zero, xproj.data(), &d2i);
+            sgemm_("Transposed",
+                   "Not transposed",
+                   &d2i,
+                   &ni,
+                   &di,
+                   &one,
+                   rotation,
+                   &di,
+                   xtrain.data(),
+                   &di,
+                   &zero,
+                   xproj.data(),
+                   &d2i);
         }
         pq_regular.cp.max_points_per_centroid = 1000;
         // The first round uses niter_pq_0 PQ iterations, later rounds niter_pq.
         pq_regular.cp.niter = iter == 0 ? niter_pq_0 : niter_pq;
         pq_regular.verbose = verbose;
-        pq_regular.train (n, xproj.data());
+        pq_regular.train(n, xproj.data());
         if (verbose) {
             printf("    encode / decode\n");
         }
         if (pq_regular.assign_index) {
-            pq_regular.compute_codes_with_assign_index
-                (xproj.data(), codes.data(), n);
+            pq_regular.compute_codes_with_assign_index(
+                    xproj.data(), codes.data(), n);
         } else {
-            pq_regular.compute_codes (xproj.data(), codes.data(), n);
+            pq_regular.compute_codes(xproj.data(), codes.data(), n);
         }
-        pq_regular.decode (codes.data(), pq_recons.data(), n);
+        pq_regular.decode(codes.data(), pq_recons.data(), n);
         // Reconstruction error of this round divided by n; only reported
         // when verbose.
-        float pq_err = fvec_L2sqr (pq_recons.data(), xproj.data(), n * d2) / n;
+        float pq_err = fvec_L2sqr(pq_recons.data(), xproj.data(), n * d2) / n;
         if (verbose)
-            printf ("    Iteration %d (%d PQ iterations):"
-                    "%.3f s, obj=%g\n", iter, pq_regular.cp.niter,
-                    (getmillisecs () - t0) / 1000.0, pq_err);
+            printf("    Iteration %d (%d PQ iterations):"
+                   "%.3f s, obj=%g\n",
+                   iter,
+                   pq_regular.cp.niter,
+                   (getmillisecs() - t0) / 1000.0,
+                   pq_err);
         {
             // Carve u, vt and the singular values out of the tmp buffer.
-            float *u = tmp.data(), *vt = &tmp [d * d];
-            float *sing_val = &tmp [2 * d * d];
+            float *u = tmp.data(), *vt = &tmp[d * d];
+            float* sing_val = &tmp[2 * d * d];
             FINTEGER di = d, d2i = d2, ni = n;
             float one = 1, zero = 0;
@@ -962,36 +1121,69 @@ void OPQMatrix::train (Index::idx_t n, const float *x)
                 printf("    X * recons\n");
             }
             // torch.mm(xtrain:t(), pq_recons)
-            sgemm_ ("Not", "Transposed",
-                    &d2i, &di, &ni,
-                    &one, pq_recons.data(), &d2i,
-                    xtrain.data(), &di,
-                    &zero, xxr.data(), &d2i);
+            sgemm_("Not",
+                   "Transposed",
+                   &d2i,
+                   &di,
+                   &ni,
+                   &one,
+                   pq_recons.data(),
+                   &d2i,
+                   xtrain.data(),
+                   &di,
+                   &zero,
+                   xxr.data(),
+                   &d2i);
             FINTEGER lwork = -1, info = -1;
             float worksz;
             // workspace query
-            sgesvd_ ("All", "All",
-                     &d2i, &di, xxr.data(), &d2i,
-                     sing_val,
-                     vt, &d2i, u, &di,
-                     &worksz, &lwork, &info);
+            sgesvd_("All",
+                    "All",
+                    &d2i,
+                    &di,
+                    xxr.data(),
+                    &d2i,
+                    sing_val,
+                    vt,
+                    &d2i,
+                    u,
+                    &di,
+                    &worksz,
+                    &lwork,
+                    &info);
             // NOTE(review): `info` is not checked after either sgesvd_ call
             // in this block, unlike the dgesvd_ calls in ITQMatrix::train.
             lwork = int(worksz);
-            std::vector<float> work (lwork);
+            std::vector<float> work(lwork);
             // u and vt swapped
-            sgesvd_ ("All", "All",
-                     &d2i, &di, xxr.data(), &d2i,
-                     sing_val,
-                     vt, &d2i, u, &di,
-                     work.data(), &lwork, &info);
-            sgemm_ ("Transposed", "Transposed",
-                    &di, &d2i, &d2i,
-                    &one, u, &di, vt, &d2i,
-                    &zero, rotation, &di);
+            sgesvd_("All",
+                    "All",
+                    &d2i,
+                    &di,
+                    xxr.data(),
+                    &d2i,
+                    sing_val,
+                    vt,
+                    &d2i,
+                    u,
+                    &di,
+                    work.data(),
+                    &lwork,
+                    &info);
             // Overwrite the rotation with the product of the two SVD factors
             // (beta is zero, so the previous rotation is not accumulated).
+            sgemm_("Transposed",
+                   "Transposed",
+                   &di,
+                   &d2i,
+                   &d2i,
+                   &one,
+                   u,
+                   &di,
+                   vt,
+                   &d2i,
+                   &zero,
+                   rotation,
+                   &di);
         }
         // Later rounds restart PQ training with Train_hot_start.
         pq_regular.train_type = ProductQuantizer::Train_hot_start;
     }
@@ -999,59 +1191,52 @@ void OPQMatrix::train (Index::idx_t n, const float *x)
     // revert A matrix
     // When the input was padded (d > d_in), compact each row from stride d
     // down to stride d_in; memmove is used because the ranges may overlap.
     if (d > d_in) {
         for (long i = 0; i < d_out; i++)
-            memmove (&A[i * d_in], &A[i * d], sizeof(A[0]) * d_in);
-        A.resize (d_in * d_out);
+            memmove(&A[i * d_in], &A[i * d], sizeof(A[0]) * d_in);
+        A.resize(d_in * d_out);
     }
     is_trained = true;
     is_orthonormal = true;
 }
 /*********************************************
  * NormalizationTransform
  *********************************************/
-NormalizationTransform::NormalizationTransform (int d, float norm):
-    VectorTransform (d, d), norm (norm)
-{
-}
 // Creates a d -> d transform that remembers which norm to normalize with.
+NormalizationTransform::NormalizationTransform(int d, float norm)
+        : VectorTransform(d, d), norm(norm) {}
-NormalizationTransform::NormalizationTransform ():
-    VectorTransform (-1, -1), norm (-1)
-{
-}
 // Default constructor: dimensions and norm are all set to the placeholder
 // value -1.
+NormalizationTransform::NormalizationTransform()
+        : VectorTransform(-1, -1), norm(-1) {}
-void NormalizationTransform::apply_noalloc
-      (idx_t n, const float* x, float* xt) const
-{
+void NormalizationTransform::apply_noalloc(idx_t n, const float* x, float* xt)
+        const {
     // Writes the normalized version of the n input vectors `x` into `xt`.
     // Only norm == 2.0 is supported: the input is copied to xt and
     // renormalized there with fvec_renorm_L2. Any other norm throws
     // "not implemented".
     if (norm == 2.0) {
-        memcpy (xt, x, sizeof (x[0]) * n * d_in);
-        fvec_renorm_L2 (d_in, n, xt);
+        memcpy(xt, x, sizeof(x[0]) * n * d_in);
+        fvec_renorm_L2(d_in, n, xt);
     } else {
-        FAISS_THROW_MSG ("not implemented");
+        FAISS_THROW_MSG("not implemented");
     }
 }
-void NormalizationTransform::reverse_transform (idx_t n, const float* xt,
-                                                float* x) const
-{
-    memcpy (x, xt, sizeof (xt[0]) * n * d_in);
+void NormalizationTransform::reverse_transform(
+        idx_t n,
+        const float* xt,
+        float* x) const {
     // Copies the n transformed vectors back unchanged (n * d_in floats); no
     // rescaling is applied here, so the output is the normalized data.
+    memcpy(x, xt, sizeof(xt[0]) * n * d_in);
 }
 /*********************************************
  * CenteringTransform
  *********************************************/
-CenteringTransform::CenteringTransform (int d):
-    VectorTransform (d, d)
-{
+CenteringTransform::CenteringTransform(int d) : VectorTransform(d, d) {
     // A d -> d transform that starts untrained; train() must run before it
     // can be applied.
     is_trained = false;
 }
-void CenteringTransform::train(Index::idx_t n, const float *x) {
+void CenteringTransform::train(Index::idx_t n, const float* x) {
     // Accumulates the per-dimension sum of the n training vectors into
     // `mean` and marks the transform as trained. Requires n > 0. The step
     // between accumulation and the final flag is in an elided diff hunk.
     FAISS_THROW_IF_NOT_MSG(n > 0, "need at least one training vector");
     // NOTE(review): resize(d_in, 0) zero-fills only newly added elements; if
     // `mean` already has d_in entries (e.g. on a second train() call) the old
     // values stay in the accumulation - confirm train() runs only once.
-    mean.resize (d_in, 0);
+    mean.resize(d_in, 0);
     for (idx_t i = 0; i < n; i++) {
         for (size_t j = 0; j < d_in; j++) {
             mean[j] += *x++;
@@ -1064,11 +1249,9 @@ void CenteringTransform::train(Index::idx_t n, const float *x) {
     is_trained = true;
 }
-void CenteringTransform::apply_noalloc
-      (idx_t n, const float* x, float* xt) const
-{
-    FAISS_THROW_IF_NOT (is_trained);
+void CenteringTransform::apply_noalloc(idx_t n, const float* x, float* xt)
+        const {
     // Transforms n vectors of d_in components from `x` into `xt`; throws when
     // the transform has not been trained. The per-element statement is in an
     // elided diff hunk (presumably subtracting `mean`, mirroring
     // reverse_transform - confirm).
+    FAISS_THROW_IF_NOT(is_trained);
     for (idx_t i = 0; i < n; i++) {
         for (size_t j = 0; j < d_in; j++) {
@@ -1077,64 +1260,58 @@ void CenteringTransform::apply_noalloc
     }
 }
-void CenteringTransform::reverse_transform (idx_t n, const float* xt,
-                                                float* x) const
-{
-    FAISS_THROW_IF_NOT (is_trained);
+void CenteringTransform::reverse_transform(idx_t n, const float* xt, float* x)
+        const {
     // Undoes the centering: adds mean[j] back to component j of each of the
     // n transformed vectors in `xt`, writing the result to `x`. Throws when
     // the transform has not been trained.
+    FAISS_THROW_IF_NOT(is_trained);
     for (idx_t i = 0; i < n; i++) {
         for (size_t j = 0; j < d_in; j++) {
             *x++ = *xt++ + mean[j];
         }
     }
 }
 /*********************************************
  * RemapDimensionsTransform
  *********************************************/
-RemapDimensionsTransform::RemapDimensionsTransform (
-        int d_in, int d_out, const int *map_in):
-    VectorTransform (d_in, d_out)
-{
-    map.resize (d_out);
+RemapDimensionsTransform::RemapDimensionsTransform(
+        int d_in,
+        int d_out,
+        const int* map_in)
+        : VectorTransform(d_in, d_out) {
     // Copies an explicit mapping of d_out entries from map_in. Each entry
     // must be -1 or a valid input dimension in [0, d_in); anything else
     // throws.
+    map.resize(d_out);
     for (int i = 0; i < d_out; i++) {
         map[i] = map_in[i];
-        FAISS_THROW_IF_NOT (map[i] == -1 || (map[i] >= 0 && map[i] < d_in));
+        FAISS_THROW_IF_NOT(map[i] == -1 || (map[i] >= 0 && map[i] < d_in));
     }
 }
-RemapDimensionsTransform::RemapDimensionsTransform (
-      int d_in, int d_out, bool uniform): VectorTransform (d_in, d_out)
-{
-    map.resize (d_out, -1);
+RemapDimensionsTransform::RemapDimensionsTransform(
+        int d_in,
+        int d_out,
+        bool uniform)
+        : VectorTransform(d_in, d_out) {
     // Builds the mapping automatically; entries left at -1 have no source
     // dimension.
     //  - uniform, d_in < d_out: input i is placed at output i * d_out / d_in.
     //  - uniform, otherwise: output i reads input i * d_in / d_out.
     //  - not uniform: identity mapping on the first min(d_in, d_out) dims.
+    map.resize(d_out, -1);
     if (uniform) {
         if (d_in < d_out) {
             for (int i = 0; i < d_in; i++) {
-                map [i * d_out / d_in] = i;
-        }
+                map[i * d_out / d_in] = i;
+            }
         } else {
             for (int i = 0; i < d_out; i++) {
-                map [i] = i * d_in / d_out;
+                map[i] = i * d_in / d_out;
             }
         }
     } else {
         for (int i = 0; i < d_in && i < d_out; i++)
-            map [i] = i;
+            map[i] = i;
     }
 }
-void RemapDimensionsTransform::apply_noalloc (idx_t n, const float * x,
-                                              float *xt) const
-{
+void RemapDimensionsTransform::apply_noalloc(idx_t n, const float* x, float* xt)
+        const {
     // For each of the n vectors, output component j takes x[map[j]], or 0
     // when map[j] is negative. The pointer advance between vectors is in an
     // elided diff hunk.
     for (idx_t i = 0; i < n; i++) {
         for (int j = 0; j < d_out; j++) {
             xt[j] = map[j] < 0 ? 0 : x[map[j]];
@@ -1144,13 +1321,15 @@ void RemapDimensionsTransform::apply_noalloc (idx_t n, const float * x,
     }
 }
-void RemapDimensionsTransform::reverse_transform (idx_t n, const float * xt,
-                                                  float *x) const
-{
-    memset (x, 0, sizeof (*x) * n * d_in);
+void RemapDimensionsTransform::reverse_transform(
+        idx_t n,
+        const float* xt,
+        float* x) const {
+    memset(x, 0, sizeof(*x) * n * d_in);
     for (idx_t i = 0; i < n; i++) {
         for (int j = 0; j < d_out; j++) {
-            if (map[j] >= 0) x[map[j]] = xt[j];
+            if (map[j] >= 0)
+                x[map[j]] = xt[j];
         }
         x += d_in;
         xt += d_out;