RubyGems - faiss - Versions diffs - 0.4.3 → 0.5.1 - Mend

faiss 0.4.3 → 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (186) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +10 -0
data/README.md +2 -0
data/ext/faiss/index.cpp +33 -6
data/ext/faiss/index_binary.cpp +17 -4
data/ext/faiss/kmeans.cpp +6 -6
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +2 -3
data/vendor/faiss/faiss/AutoTune.h +1 -1
data/vendor/faiss/faiss/Clustering.cpp +2 -2
data/vendor/faiss/faiss/Clustering.h +2 -2
data/vendor/faiss/faiss/IVFlib.cpp +26 -51
data/vendor/faiss/faiss/IVFlib.h +1 -1
data/vendor/faiss/faiss/Index.cpp +11 -0
data/vendor/faiss/faiss/Index.h +34 -11
data/vendor/faiss/faiss/Index2Layer.cpp +1 -1
data/vendor/faiss/faiss/Index2Layer.h +2 -2
data/vendor/faiss/faiss/IndexAdditiveQuantizer.cpp +1 -0
data/vendor/faiss/faiss/IndexAdditiveQuantizerFastScan.cpp +9 -4
data/vendor/faiss/faiss/IndexAdditiveQuantizerFastScan.h +5 -1
data/vendor/faiss/faiss/IndexBinary.h +7 -7
data/vendor/faiss/faiss/IndexBinaryFromFloat.h +1 -1
data/vendor/faiss/faiss/IndexBinaryHNSW.cpp +8 -2
data/vendor/faiss/faiss/IndexBinaryHNSW.h +1 -1
data/vendor/faiss/faiss/IndexBinaryHash.cpp +3 -3
data/vendor/faiss/faiss/IndexBinaryHash.h +5 -5
data/vendor/faiss/faiss/IndexBinaryIVF.cpp +7 -6
data/vendor/faiss/faiss/IndexFastScan.cpp +125 -49
data/vendor/faiss/faiss/IndexFastScan.h +102 -7
data/vendor/faiss/faiss/IndexFlat.cpp +374 -4
data/vendor/faiss/faiss/IndexFlat.h +81 -1
data/vendor/faiss/faiss/IndexHNSW.cpp +93 -2
data/vendor/faiss/faiss/IndexHNSW.h +58 -2
data/vendor/faiss/faiss/IndexIDMap.cpp +14 -13
data/vendor/faiss/faiss/IndexIDMap.h +6 -6
data/vendor/faiss/faiss/IndexIVF.cpp +1 -1
data/vendor/faiss/faiss/IndexIVF.h +5 -5
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +1 -1
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizerFastScan.cpp +9 -3
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizerFastScan.h +3 -1
data/vendor/faiss/faiss/IndexIVFFastScan.cpp +176 -90
data/vendor/faiss/faiss/IndexIVFFastScan.h +173 -18
data/vendor/faiss/faiss/IndexIVFFlat.cpp +1 -0
data/vendor/faiss/faiss/IndexIVFFlatPanorama.cpp +251 -0
data/vendor/faiss/faiss/IndexIVFFlatPanorama.h +64 -0
data/vendor/faiss/faiss/IndexIVFPQ.cpp +3 -1
data/vendor/faiss/faiss/IndexIVFPQ.h +1 -1
data/vendor/faiss/faiss/IndexIVFPQFastScan.cpp +134 -2
data/vendor/faiss/faiss/IndexIVFPQFastScan.h +7 -1
data/vendor/faiss/faiss/IndexIVFRaBitQ.cpp +99 -8
data/vendor/faiss/faiss/IndexIVFRaBitQ.h +4 -1
data/vendor/faiss/faiss/IndexIVFRaBitQFastScan.cpp +828 -0
data/vendor/faiss/faiss/IndexIVFRaBitQFastScan.h +252 -0
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +1 -1
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +1 -1
data/vendor/faiss/faiss/IndexNNDescent.cpp +1 -1
data/vendor/faiss/faiss/IndexNSG.cpp +1 -1
data/vendor/faiss/faiss/IndexNeuralNetCodec.h +1 -1
data/vendor/faiss/faiss/IndexPQ.cpp +4 -1
data/vendor/faiss/faiss/IndexPQ.h +1 -1
data/vendor/faiss/faiss/IndexPQFastScan.cpp +6 -2
data/vendor/faiss/faiss/IndexPQFastScan.h +5 -1
data/vendor/faiss/faiss/IndexPreTransform.cpp +14 -0
data/vendor/faiss/faiss/IndexPreTransform.h +9 -0
data/vendor/faiss/faiss/IndexRaBitQ.cpp +96 -13
data/vendor/faiss/faiss/IndexRaBitQ.h +11 -2
data/vendor/faiss/faiss/IndexRaBitQFastScan.cpp +731 -0
data/vendor/faiss/faiss/IndexRaBitQFastScan.h +175 -0
data/vendor/faiss/faiss/IndexRefine.cpp +49 -0
data/vendor/faiss/faiss/IndexRefine.h +17 -0
data/vendor/faiss/faiss/IndexShards.cpp +1 -1
data/vendor/faiss/faiss/MatrixStats.cpp +3 -3
data/vendor/faiss/faiss/MetricType.h +1 -1
data/vendor/faiss/faiss/VectorTransform.h +2 -2
data/vendor/faiss/faiss/clone_index.cpp +5 -1
data/vendor/faiss/faiss/gpu/GpuCloner.cpp +1 -1
data/vendor/faiss/faiss/gpu/GpuClonerOptions.h +3 -1
data/vendor/faiss/faiss/gpu/GpuIndex.h +11 -11
data/vendor/faiss/faiss/gpu/GpuIndexBinaryCagra.h +1 -1
data/vendor/faiss/faiss/gpu/GpuIndexBinaryFlat.h +1 -1
data/vendor/faiss/faiss/gpu/GpuIndexCagra.h +11 -7
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +1 -1
data/vendor/faiss/faiss/gpu/perf/IndexWrapper-inl.h +2 -0
data/vendor/faiss/faiss/gpu/test/TestGpuIcmEncoder.cpp +7 -0
data/vendor/faiss/faiss/gpu/test/TestGpuIndexIVFFlat.cpp +1 -1
data/vendor/faiss/faiss/impl/AdditiveQuantizer.cpp +1 -1
data/vendor/faiss/faiss/impl/AdditiveQuantizer.h +1 -1
data/vendor/faiss/faiss/impl/AuxIndexStructures.cpp +2 -2
data/vendor/faiss/faiss/impl/AuxIndexStructures.h +1 -1
data/vendor/faiss/faiss/impl/CodePacker.h +2 -2
data/vendor/faiss/faiss/impl/DistanceComputer.h +77 -6
data/vendor/faiss/faiss/impl/FastScanDistancePostProcessing.h +53 -0
data/vendor/faiss/faiss/impl/HNSW.cpp +295 -16
data/vendor/faiss/faiss/impl/HNSW.h +35 -6
data/vendor/faiss/faiss/impl/IDSelector.cpp +2 -2
data/vendor/faiss/faiss/impl/IDSelector.h +4 -4
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.cpp +4 -4
data/vendor/faiss/faiss/impl/LocalSearchQuantizer.h +1 -1
data/vendor/faiss/faiss/impl/LookupTableScaler.h +1 -1
data/vendor/faiss/faiss/impl/NNDescent.cpp +1 -1
data/vendor/faiss/faiss/impl/NNDescent.h +2 -2
data/vendor/faiss/faiss/impl/NSG.cpp +1 -1
data/vendor/faiss/faiss/impl/Panorama.cpp +193 -0
data/vendor/faiss/faiss/impl/Panorama.h +204 -0
data/vendor/faiss/faiss/impl/PanoramaStats.cpp +33 -0
data/vendor/faiss/faiss/impl/PanoramaStats.h +38 -0
data/vendor/faiss/faiss/impl/PolysemousTraining.cpp +5 -5
data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.cpp +1 -1
data/vendor/faiss/faiss/impl/ProductAdditiveQuantizer.h +1 -1
data/vendor/faiss/faiss/impl/ProductQuantizer-inl.h +2 -0
data/vendor/faiss/faiss/impl/ProductQuantizer.h +1 -1
data/vendor/faiss/faiss/impl/RaBitQStats.cpp +29 -0
data/vendor/faiss/faiss/impl/RaBitQStats.h +56 -0
data/vendor/faiss/faiss/impl/RaBitQUtils.cpp +294 -0
data/vendor/faiss/faiss/impl/RaBitQUtils.h +330 -0
data/vendor/faiss/faiss/impl/RaBitQuantizer.cpp +304 -223
data/vendor/faiss/faiss/impl/RaBitQuantizer.h +72 -4
data/vendor/faiss/faiss/impl/RaBitQuantizerMultiBit.cpp +362 -0
data/vendor/faiss/faiss/impl/RaBitQuantizerMultiBit.h +112 -0
data/vendor/faiss/faiss/impl/ResidualQuantizer.h +1 -1
data/vendor/faiss/faiss/impl/ResultHandler.h +4 -4
data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp +7 -10
data/vendor/faiss/faiss/impl/ScalarQuantizer.h +2 -4
data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h +7 -4
data/vendor/faiss/faiss/impl/index_read.cpp +238 -10
data/vendor/faiss/faiss/impl/index_write.cpp +212 -19
data/vendor/faiss/faiss/impl/io.cpp +2 -2
data/vendor/faiss/faiss/impl/io.h +4 -4
data/vendor/faiss/faiss/impl/kmeans1d.cpp +1 -1
data/vendor/faiss/faiss/impl/kmeans1d.h +1 -1
data/vendor/faiss/faiss/impl/lattice_Zn.h +2 -2
data/vendor/faiss/faiss/impl/mapped_io.cpp +2 -2
data/vendor/faiss/faiss/impl/mapped_io.h +4 -3
data/vendor/faiss/faiss/impl/maybe_owned_vector.h +8 -1
data/vendor/faiss/faiss/impl/platform_macros.h +12 -0
data/vendor/faiss/faiss/impl/pq4_fast_scan.cpp +30 -4
data/vendor/faiss/faiss/impl/pq4_fast_scan.h +14 -8
data/vendor/faiss/faiss/impl/pq4_fast_scan_search_qbs.cpp +5 -6
data/vendor/faiss/faiss/impl/simd_result_handlers.h +55 -11
data/vendor/faiss/faiss/impl/svs_io.cpp +86 -0
data/vendor/faiss/faiss/impl/svs_io.h +67 -0
data/vendor/faiss/faiss/impl/zerocopy_io.h +1 -1
data/vendor/faiss/faiss/index_factory.cpp +217 -8
data/vendor/faiss/faiss/index_factory.h +1 -1
data/vendor/faiss/faiss/index_io.h +1 -1
data/vendor/faiss/faiss/invlists/BlockInvertedLists.h +1 -1
data/vendor/faiss/faiss/invlists/DirectMap.cpp +1 -1
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +115 -1
data/vendor/faiss/faiss/invlists/InvertedLists.h +46 -0
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.cpp +1 -1
data/vendor/faiss/faiss/invlists/OnDiskInvertedLists.h +1 -1
data/vendor/faiss/faiss/svs/IndexSVSFaissUtils.h +261 -0
data/vendor/faiss/faiss/svs/IndexSVSFlat.cpp +117 -0
data/vendor/faiss/faiss/svs/IndexSVSFlat.h +66 -0
data/vendor/faiss/faiss/svs/IndexSVSVamana.cpp +245 -0
data/vendor/faiss/faiss/svs/IndexSVSVamana.h +137 -0
data/vendor/faiss/faiss/svs/IndexSVSVamanaLVQ.cpp +39 -0
data/vendor/faiss/faiss/svs/IndexSVSVamanaLVQ.h +42 -0
data/vendor/faiss/faiss/svs/IndexSVSVamanaLeanVec.cpp +149 -0
data/vendor/faiss/faiss/svs/IndexSVSVamanaLeanVec.h +58 -0
data/vendor/faiss/faiss/utils/AlignedTable.h +1 -1
data/vendor/faiss/faiss/utils/Heap.cpp +2 -2
data/vendor/faiss/faiss/utils/Heap.h +3 -3
data/vendor/faiss/faiss/utils/NeuralNet.cpp +1 -1
data/vendor/faiss/faiss/utils/NeuralNet.h +3 -3
data/vendor/faiss/faiss/utils/approx_topk/approx_topk.h +2 -2
data/vendor/faiss/faiss/utils/approx_topk/avx2-inl.h +2 -2
data/vendor/faiss/faiss/utils/approx_topk/mode.h +1 -1
data/vendor/faiss/faiss/utils/distances.cpp +0 -3
data/vendor/faiss/faiss/utils/distances.h +2 -2
data/vendor/faiss/faiss/utils/extra_distances-inl.h +3 -1
data/vendor/faiss/faiss/utils/hamming-inl.h +2 -0
data/vendor/faiss/faiss/utils/hamming.cpp +7 -6
data/vendor/faiss/faiss/utils/hamming.h +1 -1
data/vendor/faiss/faiss/utils/hamming_distance/common.h +1 -2
data/vendor/faiss/faiss/utils/partitioning.cpp +5 -5
data/vendor/faiss/faiss/utils/partitioning.h +2 -2
data/vendor/faiss/faiss/utils/rabitq_simd.h +222 -336
data/vendor/faiss/faiss/utils/random.cpp +1 -1
data/vendor/faiss/faiss/utils/simdlib_avx2.h +1 -1
data/vendor/faiss/faiss/utils/simdlib_avx512.h +1 -1
data/vendor/faiss/faiss/utils/simdlib_neon.h +2 -2
data/vendor/faiss/faiss/utils/transpose/transpose-avx512-inl.h +1 -1
data/vendor/faiss/faiss/utils/utils.cpp +9 -2
data/vendor/faiss/faiss/utils/utils.h +2 -2
metadata +29 -1

data/vendor/faiss/faiss/impl/RaBitQuantizer.h CHANGED Viewed

@@ -37,11 +37,28 @@ struct RaBitQuantizer : Quantizer {
     //   possible. Thus, a quantizer has to introduce a metric.
     MetricType metric_type = MetricType::METRIC_L2;
-    RaBitQuantizer(size_t d = 0, MetricType metric = MetricType::METRIC_L2);
+    // Number of bits per dimension (1-9). Default is 1 for backward
+    // compatibility.
+    // - nb_bits = 1: standard 1-bit RaBitQ (sign bits only)
+    // - nb_bits = 2-9: multi-bit RaBitQ (1 sign bit + ex_bits extra bits)
+    size_t nb_bits = 1;
+    RaBitQuantizer(
+            size_t d = 0,
+            MetricType metric = MetricType::METRIC_L2,
+            size_t nb_bits = 1);
+    // Compute code size based on dimensionality and number of bits
+    // Returns: size in bytes for one encoded vector
+    // - nb_bits=1: (d+7)/8 + 8 bytes (1-bit codes + base factors)
+    // - nb_bits>1: (d+7)/8 + 8 + d*ex_bits/8 + 8 bytes
+    //              (1-bit codes + base factors + ex-bit codes + ex factors)
+    size_t compute_code_size(size_t d, size_t num_bits) const;
     void train(size_t n, const float* x) override;
-    // every vector is expected to take (d + 7) / 8 + sizeof(FactorsData) bytes,
+    // every vector is expected to take (d + 7) / 8 + sizeof(SignBitFactors)
+    // bytes,
     void compute_codes(const float* x, uint8_t* codes, size_t n) const override;
     void compute_codes_core(
@@ -71,8 +88,59 @@ struct RaBitQuantizer : Quantizer {
     // specify qb = 0 to get a DC that does not quantize a query
     // specify qb > 0 to have SQ qb-bits query
     FlatCodesDistanceComputer* get_distance_computer(
-            uint8_t qb,
-            const float* centroid_in = nullptr) const;
+            uint8_t qb = 0,
+            const float* centroid = nullptr,
+            bool centered = false) const;
+};
+// RaBitQDistanceComputer: Base class for RaBitQ distance computers
+//
+// This intermediate class exists to provide a unified interface for
+// two-stage multi-bit search. While most Faiss quantizers extend
+// FlatCodesDistanceComputer directly, RaBitQ requires this additional
+// abstraction layer due to its unique split encoding strategy
+// (1 sign bit + magnitude bits) which enables:
+//
+// 1. distance_to_code_1bit() - Fast 1-bit filtering using only sign bits
+// 2. distance_to_code_full() - Accurate multi-bit refinement using all bits
+// 3. lower_bound_distance() - Error-bounded adaptive filtering
+//                              (based on 1-bit estimator)
+//
+// These three methods implement RaBitQ's two-stage search pattern and are
+// shared between the quantized (Q) and non-quantized (NotQ) query variants.
+// The intermediate class allows two-stage search code to work with both
+// variants via a single dynamic_cast.
+struct RaBitQDistanceComputer : FlatCodesDistanceComputer {
+    size_t d = 0; // NOTE(review): presumably the vector dimensionality, as in RaBitQuantizer - confirm
+    const float* centroid = nullptr; // raw pointer, null by default; ownership is not visible from this struct
+    MetricType metric_type = MetricType::METRIC_L2; // defaults to L2
+    size_t nb_bits = 1; // NOTE(review): presumably mirrors RaBitQuantizer::nb_bits (1 = sign bits only) - confirm
+    // Query norm for lower bound computation (g_error in rabitq-library)
+    // This is the L2 norm of the rotated query: ||query - centroid||
+    float g_error = 0.0f;
+    float symmetric_dis(idx_t /*i*/, idx_t /*j*/) override {
+        // Not used for RaBitQ: both arguments are ignored and the call always raises
+        FAISS_THROW_MSG("Not implemented");
+    }
+    // Compute 1-bit distance estimate (fast); must be provided by subclasses
+    virtual float distance_to_code_1bit(const uint8_t* code) = 0;
+    // Compute full multi-bit distance (accurate); must be provided by subclasses
+    virtual float distance_to_code_full(const uint8_t* code) = 0;
+    // Compute lower bound of distance using error bounds
+    // Guarantees: actual_distance >= lower_bound_distance
+    // Used for adaptive filtering in two-stage search
+    virtual float lower_bound_distance(const uint8_t* code); // not pure virtual: the default body is defined outside this struct
+    // Override from FlatCodesDistanceComputer
+    // Delegates to distance_to_code_full() for multi-bit distance computation
+    float distance_to_code(const uint8_t* code) final { // final: subclasses customise distance_to_code_full() instead
+        return distance_to_code_full(code);
+    }
 };
 } // namespace faiss

data/vendor/faiss/faiss/impl/RaBitQuantizerMultiBit.cpp ADDED Viewed

@@ -0,0 +1,362 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ *
+ * This source code is licensed under the MIT license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+// NOTE: Parts of this implementation are adapted from:
+// RaBitQ-Library/include/rabitqlib/quantization/rabitq_impl.hpp
+// https://github.com/VectorDB-NTU/RaBitQ-Library
+#include <faiss/impl/FaissAssert.h>
+#include <faiss/impl/RaBitQUtils.h>
+#include <faiss/utils/distances.h>
+#include <algorithm>
+#include <cmath>
+#include <cstring>
+#include <queue>
+#include <vector>
+namespace faiss {
+namespace rabitq_multibit {
+using rabitq_utils::ExtraBitsFactors;
+using rabitq_utils::SignBitFactorsWithError;
+constexpr float kTightStart[9] =
+        {0.0f, 0.15f, 0.20f, 0.52f, 0.59f, 0.71f, 0.75f, 0.77f, 0.81f}; // indexed by ex_bits: fraction of t_end at which the scaling-factor search starts
+constexpr double kEps = 1e-5; // small bias added before float-to-int truncation when quantizing
+/**
+ * Compute optimal scaling factor for ex-bits quantization using priority
+ * queue-based search.
+ *
+ * This function finds the scaling factor 't' that maximizes the inner
+ * product between the normalized quantized vector and the normalized
+ * absolute residual. Starting from t_start, it visits, in increasing order
+ * of t, every point where one dimension's quantized level steps up by one,
+ * and keeps the t with the best (incrementally estimated) inner product.
+ *
+ * Preconditions are checked with FAISS_THROW_IF_NOT_MSG: nb_bits - 1 must be
+ * in [1, 8], d must be non-zero, and o_abs must contain at least one
+ * strictly positive value (its maximum is used as a divisor).
+ *
+ * @param o_abs Normalized absolute residual vector (non-negative, length d)
+ * @param d Dimensionality of the vector
+ * @param nb_bits Number of bits per dimension (2-9)
+ * @return Optimal scaling factor 't'; 0 if the search visits no candidate
+ *         that improves on an inner product of 0
+ */
+float compute_optimal_scaling_factor(
+        const float* o_abs,
+        size_t d,
+        size_t nb_bits) {
+    const size_t ex_bits = nb_bits - 1;
+    FAISS_THROW_IF_NOT_MSG(
+            ex_bits >= 1 && ex_bits <= 8, "ex_bits must be in range [1, 8]");
+    // std::max_element on an empty range returns the end pointer, which must
+    // not be dereferenced.
+    FAISS_THROW_IF_NOT_MSG(d > 0, "d must be positive");
+    const int kNEnum = 10;
+    const int max_code = (1 << ex_bits) - 1;
+    float max_o = *std::max_element(o_abs, o_abs + d);
+    // A zero (or NaN) maximum would make t_end infinite / NaN and turn the
+    // float-to-int conversions below into undefined behavior.
+    FAISS_THROW_IF_NOT_MSG(
+            max_o > 0.0f, "o_abs must contain at least one positive value");
+    // Determine search range [t_start, t_end]
+    float t_end = static_cast<float>(max_code + kNEnum) / max_o;
+    float t_start = t_end * kTightStart[ex_bits];
+    // Reciprocals are used to turn "next level" into "next t" per dimension.
+    // Zero entries give +inf, which never passes the t_next < t_end test.
+    std::vector<float> inv_o_abs(d);
+    for (size_t i = 0; i < d; ++i) {
+        inv_o_abs[i] = 1.0f / o_abs[i];
+    }
+    // State at t_start: per-dimension level, sum of (level + 0.5)^2 and
+    // sum of (level + 0.5) * o_abs.
+    std::vector<int> cur_o_bar(d);
+    float sqr_denominator = static_cast<float>(d) * 0.25f;
+    float numerator = 0.0f;
+    for (size_t i = 0; i < d; ++i) {
+        int cur = static_cast<int>((t_start * o_abs[i]) + kEps);
+        cur_o_bar[i] = cur;
+        sqr_denominator += static_cast<float>(cur * cur + cur);
+        numerator += (cur + 0.5f) * o_abs[i];
+    }
+    float inv_sqrt_denom = 1.0f / std::sqrt(sqr_denominator);
+    // Pair: (next_t, dimension_index)
+    // Maximum size is d (one entry per dimension), so reserve exactly d
+    std::vector<std::pair<float, size_t>> pq_storage;
+    pq_storage.reserve(d);
+    // Min-heap on next_t, so level changes are visited in increasing t.
+    std::priority_queue<
+            std::pair<float, size_t>,
+            std::vector<std::pair<float, size_t>>,
+            std::greater<>>
+            next_t(std::greater<>(), std::move(pq_storage));
+    // Initialize queue with next quantization level for each dimension
+    for (size_t i = 0; i < d; ++i) {
+        float t_next = static_cast<float>(cur_o_bar[i] + 1) * inv_o_abs[i];
+        if (t_next < t_end) {
+            next_t.emplace(t_next, i);
+        }
+    }
+    float max_ip = 0.0f;
+    float t = 0.0f;
+    while (!next_t.empty()) {
+        float cur_t = next_t.top().first;
+        size_t update_id = next_t.top().second;
+        next_t.pop();
+        cur_o_bar[update_id]++;
+        int update_o_bar = cur_o_bar[update_id];
+        // (level + 0.5)^2 grows by 2 * new_level when the level steps by one.
+        float delta = 2.0f * update_o_bar;
+        sqr_denominator += delta;
+        numerator += o_abs[update_id];
+        // Approximate incremental update of 1 / sqrt(sqr_denominator); this
+        // avoids a square root per step.
+        // NOTE(review): the approximation error carries over between steps.
+        float old_denom = sqr_denominator - delta;
+        inv_sqrt_denom = inv_sqrt_denom *
+                (1.0f - 0.5f * delta / (old_denom + delta * 0.5f));
+        float cur_ip = numerator * inv_sqrt_denom;
+        if (cur_ip > max_ip) {
+            max_ip = cur_ip;
+            t = cur_t;
+        }
+        // Re-queue the dimension only while it can still step up within
+        // [0, max_code] and the search range.
+        if (update_o_bar < max_code) {
+            float t_next =
+                    static_cast<float>(update_o_bar + 1) * inv_o_abs[update_id];
+            if (t_next < t_end) {
+                next_t.emplace(t_next, update_id);
+            }
+        }
+    }
+    return t;
+}
+/**
+ * Bit-pack per-dimension ex-bit codes into a contiguous byte buffer.
+ *
+ * Every dimension contributes ex_bits = nb_bits - 1 bits. The bits are
+ * written back to back, starting with the least-significant bit of each
+ * code; inside a byte, bit 0 is filled first.
+ *
+ * @param tmp_code Integer codes (length d), each value in [0, 2^ex_bits - 1]
+ * @param ex_code Output packed byte array; its first (d * ex_bits + 7) / 8
+ *                bytes are overwritten
+ * @param d Dimensionality
+ * @param nb_bits Number of bits per dimension (2-9)
+ */
+void pack_multibit_codes(
+        const int* tmp_code,
+        uint8_t* ex_code,
+        size_t d,
+        size_t nb_bits) {
+    const size_t ex_bits = nb_bits - 1;
+    FAISS_THROW_IF_NOT_MSG(
+            ex_bits >= 1 && ex_bits <= 8, "ex_bits must be in range [1, 8]");
+    // Clear the destination first so that set bits can simply be OR-ed in.
+    memset(ex_code, 0, (d * ex_bits + 7) / 8);
+    size_t out_bit = 0; // running bit offset into ex_code
+    for (size_t dim = 0; dim < d; ++dim) {
+        const int value = tmp_code[dim];
+        for (size_t b = 0; b < ex_bits; ++b, ++out_bit) {
+            if ((value & (1 << b)) == 0) {
+                continue;
+            }
+            ex_code[out_bit / 8] |= (1 << (out_bit % 8));
+        }
+    }
+}
+/**
+ * Compute ex-bits factors for distance computation.
+ *
+ * For METRIC_L2 only norm and ipnorm are used. For METRIC_INNER_PRODUCT the
+ * codes are first mapped back to centered values xu_cb[i] = tmp_code[i] + cb
+ * with cb = -(2^ex_bits - 0.5), and inner products with the residual and the
+ * centroid provide the additive correction.
+ *
+ * @param residual Original residual vector (data - centroid)
+ * @param centroid Centroid vector (can be nullptr for zero centroid)
+ * @param tmp_code Unpacked integer code per dimension (length d). The caller
+ * in quantize_ex_bits passes the combined code
+ * (sign << ex_bits) + ex_code[i], not the bare ex-bit code. Only read for the
+ * inner product metric.
+ * @param d Dimensionality
+ * @param ex_bits Number of extra bits
+ * @param norm L2 norm of residual
+ * @param ipnorm Unnormalized inner product between quantized and normalized
+ * residual
+ * @param ex_factors Output factors structure (f_add_ex and f_rescale_ex are
+ * written)
+ * @param metric_type Distance metric (L2 or Inner Product); anything else is
+ * rejected via FAISS_THROW_IF_NOT_MSG
+ */
+void compute_ex_factors(
+        const float* residual,
+        const float* centroid,
+        const int* tmp_code,
+        size_t d,
+        size_t ex_bits,
+        float norm,
+        double ipnorm,
+        ExtraBitsFactors& ex_factors,
+        MetricType metric_type) {
+    FAISS_THROW_IF_NOT_MSG(
+            metric_type == MetricType::METRIC_L2 ||
+                    metric_type == MetricType::METRIC_INNER_PRODUCT,
+            "Unsupported metric type");
+    // Compute ipnorm_inv = 1 / ipnorm; fall back to 1 when the reciprocal is
+    // zero, subnormal, infinite or NaN.
+    float ipnorm_inv = static_cast<float>(1.0 / ipnorm);
+    if (!std::isnormal(ipnorm_inv)) {
+        ipnorm_inv = 1.0f;
+    }
+    const float l2_sqr = norm * norm;
+    if (metric_type == MetricType::METRIC_L2) {
+        // For L2, no centroid correction needed in IVF setting
+        // because residual = x - centroid, distance computed in residual space.
+        // Neither the codes nor the centroid are needed here, so the
+        // reconstruction below is skipped entirely.
+        ex_factors.f_add_ex = l2_sqr;
+        ex_factors.f_rescale_ex = ipnorm_inv * -2.0f * norm;
+        return;
+    }
+    // Inner product metric: reconstruct xu_cb from the combined code.
+    // The code was formed as total_code[i] = (sign << ex_bits) + ex_code[i];
+    // reconstruction is xu_cb[i] = total_code[i] + cb.
+    const float cb = -(static_cast<float>(1 << ex_bits) - 0.5f);
+    std::vector<float> xu_cb(d);
+    for (size_t i = 0; i < d; i++) {
+        xu_cb[i] = static_cast<float>(tmp_code[i]) + cb;
+    }
+    const float ip_resi_xucb = fvec_inner_product(residual, xu_cb.data(), d);
+    // A null centroid is treated as the zero vector: both products stay 0.
+    float ip_resi_cent = 0;
+    float ip_cent_xucb = 0;
+    if (centroid != nullptr) {
+        ip_resi_cent = fvec_inner_product(residual, centroid, d);
+        ip_cent_xucb = fvec_inner_product(centroid, xu_cb.data(), d);
+    }
+    // When ip_resi_xucb is zero, the correction term should be zero
+    float correction_term = 0.0f;
+    if (ip_resi_xucb != 0.0f) {
+        correction_term = l2_sqr * ip_cent_xucb / ip_resi_xucb;
+    }
+    ex_factors.f_add_ex = 1 - ip_resi_cent + correction_term;
+    ex_factors.f_rescale_ex = ipnorm_inv * -norm;
+}
+/**
+ * Quantize a residual vector to ex-bits (nb_bits - 1 extra bits per
+ * dimension) and compute the matching distance factors.
+ *
+ * Pipeline:
+ * 1. Compute the L2 norm of the residual; a norm below 1e-10 is treated as
+ *    degenerate (codes zeroed, f_add_ex = 0, f_rescale_ex = 1, early return)
+ * 2. Normalize the residual and take absolute values
+ * 3. Find the optimal scaling factor
+ * 4. Quantize each dimension, clamped to [0, 2^ex_bits - 1]
+ * 5. Flip the code bits of negative dimensions and form the combined
+ *    sign + ex-bit code
+ * 6. Pack the ex-bit codes into the byte array
+ * 7. Compute the factors for distance computation
+ *
+ * @param residual Input residual vector (data - centroid), length d
+ * @param d Dimensionality
+ * @param nb_bits Number of bits per dimension (2-9)
+ * @param ex_code Output packed ex-bit codes, (d * ex_bits + 7) / 8 bytes
+ * @param ex_factors Output ex-bits factors
+ * @param metric_type Distance metric (L2 or Inner Product)
+ * @param centroid Optional centroid vector (needed for IP metric)
+ */
+void quantize_ex_bits(
+        const float* residual,
+        size_t d,
+        size_t nb_bits,
+        uint8_t* ex_code,
+        ExtraBitsFactors& ex_factors,
+        MetricType metric_type,
+        const float* centroid) {
+    const size_t ex_bits = nb_bits - 1;
+    FAISS_THROW_IF_NOT_MSG(
+            ex_bits >= 1 && ex_bits <= 8, "ex_bits must be in range [1, 8]");
+    FAISS_THROW_IF_NOT_MSG(residual != nullptr, "residual cannot be null");
+    FAISS_THROW_IF_NOT_MSG(ex_code != nullptr, "ex_code cannot be null");
+
+    const float norm = std::sqrt(fvec_norm_L2sqr(residual, d));
+    if (norm < 1e-10f) {
+        // (Near-)zero residual: nothing to encode.
+        memset(ex_code, 0, (d * ex_bits + 7) / 8);
+        ex_factors.f_add_ex = 0.0f;
+        ex_factors.f_rescale_ex = 1.0f;
+        return;
+    }
+
+    // Magnitudes of the unit-length residual.
+    std::vector<float> o_abs(d);
+    for (size_t i = 0; i < d; ++i) {
+        o_abs[i] = std::abs(residual[i] / norm);
+    }
+
+    const float t = compute_optimal_scaling_factor(o_abs.data(), d, nb_bits);
+
+    // Scale, truncate and clamp each magnitude; accumulate the unnormalized
+    // inner product between (code + 0.5) and the magnitudes.
+    const int max_code = (1 << ex_bits) - 1;
+    std::vector<int> ex_codes(d);
+    double ipnorm = 0;
+    for (size_t i = 0; i < d; ++i) {
+        const int level = static_cast<int>(t * o_abs[i] + kEps);
+        ex_codes[i] = std::min(level, max_code);
+        ipnorm += (ex_codes[i] + 0.5) * o_abs[i];
+    }
+
+    // Negative dimensions store the bitwise complement of their code; the
+    // combined code additionally carries the sign in bit position ex_bits
+    // (set for residual >= 0).
+    const int sign_flag = 1 << ex_bits;
+    std::vector<int> total_code(d);
+    for (size_t i = 0; i < d; ++i) {
+        if (residual[i] < 0) {
+            ex_codes[i] = (~ex_codes[i]) & max_code;
+        }
+        total_code[i] = ex_codes[i] + (residual[i] >= 0 ? sign_flag : 0);
+    }
+
+    pack_multibit_codes(ex_codes.data(), ex_code, d, nb_bits);
+
+    // The centroid is forwarded for the inner product metric correction.
+    compute_ex_factors(
+            residual,
+            centroid,
+            total_code.data(),
+            d,
+            ex_bits,
+            norm,
+            ipnorm,
+            ex_factors,
+            metric_type);
+}
+} // namespace rabitq_multibit
+} // namespace faiss

data/vendor/faiss/faiss/impl/RaBitQuantizerMultiBit.h ADDED Viewed

@@ -0,0 +1,112 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ *
+ * This source code is licensed under the MIT license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+// Reference:
+// "Practical and asymptotically optimal quantization of high-dimensional
+// vectors in euclidean space for approximate nearest neighbor search"
+// Jianyang Gao, Yutong Gou, Yuexuan Xu, Yongyi Yang, Cheng Long, Raymond
+// Chi-Wing Wong https://dl.acm.org/doi/pdf/10.1145/3725413
+//
+// Reference implementation: https://github.com/VectorDB-NTU/RaBitQ-Library
+// NOTE: Parts of this implementation are adapted from
+// rabitqlib/quantization/rabitq_impl.hpp in the above repository.
+#pragma once
+#include <faiss/MetricType.h>
+#include <faiss/impl/RaBitQUtils.h>
+#include <cstddef>
+#include <cstdint>
+namespace faiss {
+namespace rabitq_multibit {
+/**
+ * Compute optimal scaling factor for ex-bits quantization.
+ *
+ * Uses priority queue-based search to find the scaling factor that
+ * maximizes the inner product between quantized and original vectors.
+ * The implementation rejects nb_bits outside 2-9 via FAISS_THROW_IF_NOT_MSG
+ * and divides by the largest entry of o_abs, so at least one entry must be
+ * non-zero.
+ *
+ * @param o_abs Normalized absolute residual vector (positive values),
+ *              length d
+ * @param d Dimensionality
+ * @param nb_bits Number of bits per dimension (2-9)
+ * @return Optimal scaling factor 't' (0 if the search finds no candidate)
+ */
+float compute_optimal_scaling_factor(
+        const float* o_abs,
+        size_t d,
+        size_t nb_bits);
+/**
+ * Pack multi-bit codes from integer array to byte array.
+ *
+ * With ex_bits = nb_bits - 1, dimension i occupies output bits
+ * [i * ex_bits, (i + 1) * ex_bits), least-significant code bit first; bit 0
+ * of each byte is filled first. The implementation rejects nb_bits outside
+ * 2-9 via FAISS_THROW_IF_NOT_MSG.
+ *
+ * @param tmp_code Integer codes (length d), values in [0, 2^ex_bits - 1]
+ * @param ex_code Output packed byte array; (d * ex_bits + 7) / 8 bytes are
+ *                zeroed and then written
+ * @param d Dimensionality
+ * @param nb_bits Number of bits per dimension (2-9)
+ */
+void pack_multibit_codes(
+        const int* tmp_code,
+        uint8_t* ex_code,
+        size_t d,
+        size_t nb_bits);
+/**
+ * Compute ex-bits factors for distance computation.
+ *
+ * Writes f_add_ex and f_rescale_ex of ex_factors. Metrics other than L2 and
+ * inner product are rejected via FAISS_THROW_IF_NOT_MSG.
+ *
+ * @param residual Original residual vector (data - centroid)
+ * @param centroid Centroid vector (can be nullptr for zero centroid)
+ * @param tmp_code Unpacked integer codes, one per dimension; quantize_ex_bits
+ *                 passes the combined code (sign << ex_bits) + ex_code, which
+ *                 the implementation shifts by -(2^ex_bits - 0.5)
+ * @param d Dimensionality
+ * @param ex_bits Number of extra bits
+ * @param norm L2 norm of residual
+ * @param ipnorm Unnormalized inner product
+ * @param ex_factors Output factors structure
+ * @param metric_type Distance metric (L2 or IP)
+ */
+void compute_ex_factors(
+        const float* residual,
+        const float* centroid,
+        const int* tmp_code,
+        size_t d,
+        size_t ex_bits,
+        float norm,
+        double ipnorm,
+        rabitq_utils::ExtraBitsFactors& ex_factors,
+        MetricType metric_type);
+/**
+ * Main quantization function: quantize residual vector to ex-bits.
+ *
+ * Performs the complete multi-bit quantization pipeline:
+ * 1. Normalize residual
+ * 2. Take absolute value
+ * 3. Find optimal scaling factor
+ * 4. Quantize to ex_bits
+ * 5. Handle negative dimensions by bit flipping
+ * 6. Pack codes into byte array
+ * 7. Compute factors for distance computation
+ *
+ * Degenerate input: when the residual's L2 norm is below 1e-10 the
+ * implementation zeroes ex_code, sets f_add_ex = 0 and f_rescale_ex = 1, and
+ * returns without running the pipeline.
+ *
+ * @param residual Input residual vector (data - centroid), length d;
+ *                 must not be null
+ * @param d Dimensionality
+ * @param nb_bits Number of bits per dimension (2-9)
+ * @param ex_code Output packed ex-bit codes; must not be null and must hold
+ *                (d * (nb_bits - 1) + 7) / 8 bytes
+ * @param ex_factors Output ex-bits factors
+ * @param metric_type Distance metric (L2 or Inner Product)
+ * @param centroid Optional centroid vector (needed for IP metric)
+ */
+void quantize_ex_bits(
+        const float* residual,
+        size_t d,
+        size_t nb_bits,
+        uint8_t* ex_code,
+        rabitq_utils::ExtraBitsFactors& ex_factors,
+        MetricType metric_type,
+        const float* centroid = nullptr);
+} // namespace rabitq_multibit
+} // namespace faiss

data/vendor/faiss/faiss/impl/ResidualQuantizer.h CHANGED Viewed

@@ -49,7 +49,7 @@ struct ResidualQuantizer : AdditiveQuantizer {
      *  first element of the beam (faster but less accurate) */
     static const int Train_top_beam = 1024;
-    /** set this bit to *not* autmatically compute the codebook tables
+    /** set this bit to *not* automatically compute the codebook tables
      * after training */
     static const int Skip_codebook_tables = 2048;

data/vendor/faiss/faiss/impl/ResultHandler.h CHANGED Viewed

@@ -26,11 +26,11 @@ namespace faiss {
  * The classes below are intended to be used as template arguments
  * they handle results for batches of queries (size nq).
  * They can be called in two ways:
- * - by instanciating a SingleResultHandler that tracks results for a single
+ * - by instantiating a SingleResultHandler that tracks results for a single
  *   query
  * - with begin_multiple/add_results/end_multiple calls where a whole block of
  *   results is submitted
- * All classes are templated on C which to define wheter the min or the max of
+ * All classes are templated on C, which defines whether the min or the max of
  * results is to be kept, and on sel, so that the codepaths for with / without
  * selector can be separated at compile time.
  *****************************************************************/
@@ -306,7 +306,7 @@ struct HeapBlockResultHandler : TopkBlockResultHandler<C, use_sel> {
  *
  * A reservoir is a result array of size capacity > n (number of requested
  * results) all results below a threshold are stored in an arbitrary order.
- *When the capacity is reached, a new threshold is chosen by partitionning
+ *When the capacity is reached, a new threshold is chosen by partitioning
  *the distance array.
  *****************************************************************/
@@ -572,7 +572,7 @@ struct RangeSearchBlockResultHandler : BlockResultHandler<C, use_sel> {
         RangeSearchPartialResult* pres;
         // there is one RangeSearchPartialResult structure per j0
         // (= block of columns of the large distance matrix)
-        // it is a bit tricky to find the poper PartialResult structure
+        // it is a bit tricky to find the proper PartialResult structure
         // because the inner loop is on db not on queries.
         if (pr < j0s.size() && j0 == j0s[pr]) {

data/vendor/faiss/faiss/impl/ScalarQuantizer.cpp CHANGED Viewed

@@ -321,7 +321,7 @@ struct Codec6bit {
     static FAISS_ALWAYS_INLINE __m256
     decode_8_components(const uint8_t* code, int i) {
         // // Faster code for Intel CPUs or AMD Zen3+, just keeping it here
-        // // for the reference, maybe, it becomes used oned day.
+        // // for the reference, maybe, it becomes used one day.
         // const uint16_t* data16 = (const uint16_t*)(code + (i >> 2) * 3);
         // const uint32_t* data32 = (const uint32_t*)data16;
         // const uint64_t val = *data32 + ((uint64_t)data16[2] << 32);
@@ -1009,16 +1009,13 @@ void train_Uniform(
     } else if (rs == ScalarQuantizer::RS_quantiles) {
         std::vector<float> x_copy(n);
         memcpy(x_copy.data(), x, n * sizeof(*x));
-        // TODO just do a quickselect
-        std::sort(x_copy.begin(), x_copy.end());
-        int o = int(rs_arg * n);
-        if (o < 0) {
-            o = 0;
-        }
-        if (o > n - o) {
-            o = n / 2;
-        }
+        int temp = int(rs_arg * n);
+        int o = temp < 0 ? 0 : (temp > n / 2 ? n / 2 : temp);
+        std::nth_element(x_copy.begin(), x_copy.begin() + o, x_copy.end());
         vmin = x_copy[o];
+        std::nth_element(
+                x_copy.begin(), x_copy.begin() + (n - 1 - o), x_copy.end());
         vmax = x_copy[n - 1 - o];
     } else if (rs == ScalarQuantizer::RS_optim) {

data/vendor/faiss/faiss/impl/ScalarQuantizer.h CHANGED Viewed

@@ -40,7 +40,7 @@ struct ScalarQuantizer : Quantizer {
     QuantizerType qtype = QT_8bit;
     /** The uniform encoder can estimate the range of representable
-     * values of the unform encoder using different statistics. Here
+     * values of the uniform encoder using different statistics. Here
      * rs = rangestat_arg */
     // rangestat_arg.
@@ -98,9 +98,7 @@ struct ScalarQuantizer : Quantizer {
     SQuantizer* select_quantizer() const;
     struct SQDistanceComputer : FlatCodesDistanceComputer {
-        const float* q;
-        SQDistanceComputer() : q(nullptr) {}
+        SQDistanceComputer() : FlatCodesDistanceComputer(nullptr) {}
         virtual float query_to_code(const uint8_t* code) const = 0;

data/vendor/faiss/faiss/impl/ThreadedIndex-inl.h CHANGED Viewed

@@ -5,6 +5,8 @@
  * LICENSE file in the root directory of this source tree.
  */
+#pragma once
 #include <faiss/impl/FaissAssert.h>
 #include <exception>
 #include <iostream>
@@ -75,10 +77,11 @@ void ThreadedIndex<IndexT>::addIndex(IndexT* index) {
         }
     }
-    indices_.emplace_back(std::make_pair(
-            index,
-            std::unique_ptr<WorkerThread>(
-                    isThreaded_ ? new WorkerThread : nullptr)));
+    indices_.emplace_back(
+            std::make_pair(
+                    index,
+                    std::unique_ptr<WorkerThread>(
+                            isThreaded_ ? new WorkerThread : nullptr)));
     onAfterAddIndex(index);
 }