RubyGems - faiss - Versions diffs - 0.3.4 → 0.4.0 - Mend

faiss 0.3.4 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (70)

checksums.yaml +4 -4
data/CHANGELOG.md +5 -0
data/lib/faiss/version.rb +1 -1
data/vendor/faiss/faiss/AutoTune.cpp +11 -8
data/vendor/faiss/faiss/Clustering.cpp +0 -16
data/vendor/faiss/faiss/IVFlib.cpp +213 -0
data/vendor/faiss/faiss/IVFlib.h +42 -0
data/vendor/faiss/faiss/Index.h +1 -1
data/vendor/faiss/faiss/IndexBinaryFlat.cpp +9 -7
data/vendor/faiss/faiss/IndexBinaryFlat.h +2 -1
data/vendor/faiss/faiss/IndexFlatCodes.cpp +1 -1
data/vendor/faiss/faiss/IndexFlatCodes.h +4 -2
data/vendor/faiss/faiss/IndexHNSW.cpp +13 -20
data/vendor/faiss/faiss/IndexHNSW.h +1 -1
data/vendor/faiss/faiss/IndexIVF.cpp +20 -3
data/vendor/faiss/faiss/IndexIVF.h +5 -2
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.cpp +2 -1
data/vendor/faiss/faiss/IndexIVFAdditiveQuantizer.h +2 -1
data/vendor/faiss/faiss/IndexIVFFlat.cpp +2 -1
data/vendor/faiss/faiss/IndexIVFFlat.h +2 -1
data/vendor/faiss/faiss/IndexIVFPQ.cpp +2 -1
data/vendor/faiss/faiss/IndexIVFPQ.h +2 -1
data/vendor/faiss/faiss/IndexIVFRaBitQ.cpp +277 -0
data/vendor/faiss/faiss/IndexIVFRaBitQ.h +70 -0
data/vendor/faiss/faiss/IndexIVFSpectralHash.cpp +2 -1
data/vendor/faiss/faiss/IndexIVFSpectralHash.h +2 -1
data/vendor/faiss/faiss/IndexRaBitQ.cpp +148 -0
data/vendor/faiss/faiss/IndexRaBitQ.h +65 -0
data/vendor/faiss/faiss/IndexScalarQuantizer.cpp +2 -1
data/vendor/faiss/faiss/IndexScalarQuantizer.h +2 -1
data/vendor/faiss/faiss/clone_index.cpp +38 -3
data/vendor/faiss/faiss/cppcontrib/factory_tools.cpp +19 -0
data/vendor/faiss/faiss/cppcontrib/factory_tools.h +4 -11
data/vendor/faiss/faiss/gpu/GpuAutoTune.cpp +2 -1
data/vendor/faiss/faiss/gpu/GpuIndexCagra.h +13 -3
data/vendor/faiss/faiss/gpu/StandardGpuResources.cpp +1 -1
data/vendor/faiss/faiss/gpu/StandardGpuResources.h +1 -1
data/vendor/faiss/faiss/gpu/test/TestGpuIcmEncoder.cpp +112 -0
data/vendor/faiss/faiss/impl/HNSW.cpp +35 -13
data/vendor/faiss/faiss/impl/HNSW.h +5 -4
data/vendor/faiss/faiss/impl/NNDescent.cpp +1 -1
data/vendor/faiss/faiss/impl/RaBitQuantizer.cpp +519 -0
data/vendor/faiss/faiss/impl/RaBitQuantizer.h +78 -0
data/vendor/faiss/faiss/impl/ResultHandler.h +2 -2
data/vendor/faiss/faiss/impl/code_distance/code_distance-sve.h +3 -4
data/vendor/faiss/faiss/impl/index_read.cpp +220 -25
data/vendor/faiss/faiss/impl/index_write.cpp +29 -0
data/vendor/faiss/faiss/impl/io.h +2 -2
data/vendor/faiss/faiss/impl/io_macros.h +2 -0
data/vendor/faiss/faiss/impl/mapped_io.cpp +313 -0
data/vendor/faiss/faiss/impl/mapped_io.h +51 -0
data/vendor/faiss/faiss/impl/maybe_owned_vector.h +316 -0
data/vendor/faiss/faiss/impl/platform_macros.h +7 -3
data/vendor/faiss/faiss/impl/simd_result_handlers.h +1 -1
data/vendor/faiss/faiss/impl/zerocopy_io.cpp +67 -0
data/vendor/faiss/faiss/impl/zerocopy_io.h +32 -0
data/vendor/faiss/faiss/index_factory.cpp +16 -5
data/vendor/faiss/faiss/index_io.h +4 -0
data/vendor/faiss/faiss/invlists/InvertedLists.cpp +3 -3
data/vendor/faiss/faiss/invlists/InvertedLists.h +5 -3
data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp +3 -3
data/vendor/faiss/faiss/python/python_callbacks.cpp +24 -0
data/vendor/faiss/faiss/python/python_callbacks.h +22 -0
data/vendor/faiss/faiss/utils/approx_topk_hamming/approx_topk_hamming.h +30 -12
data/vendor/faiss/faiss/utils/hamming.cpp +45 -21
data/vendor/faiss/faiss/utils/hamming.h +7 -3
data/vendor/faiss/faiss/utils/hamming_distance/avx512-inl.h +1 -1
data/vendor/faiss/faiss/utils/utils.cpp +4 -4
data/vendor/faiss/faiss/utils/utils.h +3 -3
metadata +16 -4

data/vendor/faiss/faiss/impl/platform_macros.h CHANGED

@@ -11,7 +11,7 @@
 #include <cstdint>
 #include <cstdio>
-#ifdef _MSC_VER
+#ifdef _WIN32
 /*******************************************************
  * Windows specific macros
@@ -23,11 +23,11 @@
 #define FAISS_API __declspec(dllimport)
 #endif // FAISS_MAIN_LIB
-#ifdef _MSC_VER
 #define strtok_r strtok_s
-#endif // _MSC_VER
+#ifdef _MSC_VER
 #define __PRETTY_FUNCTION__ __FUNCSIG__
+#endif // _MSC_VER
 #define posix_memalign(p, a, s) \
     (((*(p)) = _aligned_malloc((s), (a))), *(p) ? 0 : errno)
@@ -37,6 +37,7 @@
 #define ALIGNED(x) __declspec(align(x))
 // redefine the GCC intrinsics with Windows equivalents
+#ifdef _MSC_VER
 #include <intrin.h>
 #include <limits.h>
@@ -75,6 +76,7 @@ inline int __builtin_clzll(uint64_t x) {
 #define __builtin_popcount __popcnt
 #define __builtin_popcountl __popcnt64
+#define __builtin_popcountll __popcnt64
 #ifndef __clang__
 #define __m128i_u __m128i
@@ -101,6 +103,8 @@ inline int __builtin_clzll(uint64_t x) {
 #define __F16C__ 1
 #endif
+#endif // _MSC_VER
 #define FAISS_ALWAYS_INLINE __forceinline
 #else

data/vendor/faiss/faiss/impl/simd_result_handlers.h CHANGED

@@ -576,7 +576,7 @@ struct RangeHandler : ResultHandlerCompare<C, with_id_map> {
         normalizers = norms;
         for (int q = 0; q < nq; ++q) {
             thresholds[q] =
-                    normalizers[2 * q] * (radius - normalizers[2 * q + 1]);
+                    int(normalizers[2 * q] * (radius - normalizers[2 * q + 1]));
         }
     }

data/vendor/faiss/faiss/impl/zerocopy_io.cpp ADDED

@@ -0,0 +1,67 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ *
+ * This source code is licensed under the MIT license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+#include <faiss/impl/zerocopy_io.h>
+#include <cstring>
+namespace faiss {
+ZeroCopyIOReader::ZeroCopyIOReader(uint8_t* data, size_t size)
+        : data_(data), rp_(0), total_(size) {}
+ZeroCopyIOReader::~ZeroCopyIOReader() {}
+size_t ZeroCopyIOReader::get_data_view(void** ptr, size_t size, size_t nitems) {
+    if (size == 0) {
+        return nitems;
+    }
+    size_t actual_size = size * nitems;
+    if (rp_ + size * nitems > total_) {
+        actual_size = total_ - rp_;
+    }
+    size_t actual_nitems = (actual_size + size - 1) / size;
+    if (actual_nitems == 0) {
+        return 0;
+    }
+    // get an address
+    *ptr = (void*)(reinterpret_cast<const char*>(data_ + rp_));
+    // alter pos
+    rp_ += size * actual_nitems;
+    return actual_nitems;
+}
+void ZeroCopyIOReader::reset() {
+    rp_ = 0;
+}
+size_t ZeroCopyIOReader::operator()(void* ptr, size_t size, size_t nitems) {
+    if (size * nitems == 0) {
+        return 0;
+    }
+    if (rp_ >= total_) {
+        return 0;
+    }
+    size_t nremain = (total_ - rp_) / size;
+    if (nremain < nitems) {
+        nitems = nremain;
+    }
+    memcpy(ptr, (data_ + rp_), size * nitems);
+    rp_ += size * nitems;
+    return nitems;
+}
+int ZeroCopyIOReader::filedescriptor() {
+    return -1; // Indicating no file descriptor available for memory buffer
+}
+} // namespace faiss

data/vendor/faiss/faiss/impl/zerocopy_io.h ADDED

@@ -0,0 +1,32 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ *
+ * This source code is licensed under the MIT license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+#pragma once
+#include <cstdint>
+#include <faiss/impl/io.h>
+namespace faiss {
+// ZeroCopyIOReader just maps the data from a given pointer.
+struct ZeroCopyIOReader : public faiss::IOReader {
+    uint8_t* data_;
+    size_t rp_ = 0;
+    size_t total_ = 0;
+    ZeroCopyIOReader(uint8_t* data, size_t size);
+    ~ZeroCopyIOReader();
+    void reset();
+    size_t get_data_view(void** ptr, size_t size, size_t nitems);
+    size_t operator()(void* ptr, size_t size, size_t nitems) override;
+    int filedescriptor() override;
+};
+} // namespace faiss

data/vendor/faiss/faiss/index_factory.cpp CHANGED

@@ -11,9 +11,6 @@
 #include <faiss/index_factory.h>
-#include <cinttypes>
-#include <cmath>
 #include <map>
 #include <regex>
@@ -33,6 +30,7 @@
 #include <faiss/IndexIVFPQ.h>
 #include <faiss/IndexIVFPQFastScan.h>
 #include <faiss/IndexIVFPQR.h>
+#include <faiss/IndexIVFRaBitQ.h>
 #include <faiss/IndexIVFSpectralHash.h>
 #include <faiss/IndexLSH.h>
 #include <faiss/IndexLattice.h>
@@ -40,6 +38,7 @@
 #include <faiss/IndexPQ.h>
 #include <faiss/IndexPQFastScan.h>
 #include <faiss/IndexPreTransform.h>
+#include <faiss/IndexRaBitQ.h>
 #include <faiss/IndexRefine.h>
 #include <faiss/IndexRowwiseMinMax.h>
 #include <faiss/IndexScalarQuantizer.h>
@@ -67,6 +66,7 @@ namespace {
  */
 bool re_match(const std::string& s, const std::string& pat, std::smatch& sm) {
+    // @lint-ignore CLANGTIDY
     return std::regex_match(s, sm, std::regex(pat));
 }
@@ -164,7 +164,7 @@ const std::string aq_norm_pattern =
 const std::string paq_def_pattern = "([0-9]+)x([0-9]+)x([0-9]+)";
 AdditiveQuantizer::Search_type_t aq_parse_search_type(
-        std::string stok,
+        const std::string& stok,
         MetricType metric) {
     if (stok == "") {
         return metric == METRIC_L2 ? AdditiveQuantizer::ST_decompress
@@ -177,6 +177,7 @@ AdditiveQuantizer::Search_type_t aq_parse_search_type(
 std::vector<size_t> aq_parse_nbits(std::string stok) {
     std::vector<size_t> nbits;
     std::smatch sm;
+    // @lint-ignore CLANGTIDY
     while (std::regex_search(stok, sm, std::regex("[^q]([0-9]+)x([0-9]+)"))) {
         int M = std::stoi(sm[1].str());
         int nbit = std::stoi(sm[2].str());
@@ -186,6 +187,8 @@ std::vector<size_t> aq_parse_nbits(std::string stok) {
     return nbits;
 }
+const std::string rabitq_pattern = "(RaBitQ)";
 /***************************************************************
  * Parse VectorTransform
  */
@@ -436,6 +439,9 @@ IndexIVF* parse_IndexIVF(
         }
         return index_ivf;
     }
+    if (match(rabitq_pattern)) {
+        return new IndexIVFRaBitQ(get_q(), d, nlist, mt);
+    }
     return nullptr;
 }
@@ -657,6 +663,11 @@ Index* parse_other_indexes(
         }
     }
+    // IndexRaBitQ
+    if (match(rabitq_pattern)) {
+        return new IndexRaBitQ(d, metric);
+    }
     return nullptr;
 }
@@ -766,7 +777,7 @@ std::unique_ptr<Index> index_factory_sub(
     }
     if (verbose) {
-        printf("after () normalization: %s %ld parenthesis indexes d=%d\n",
+        printf("after () normalization: %s %zd parenthesis indexes d=%d\n",
                description.c_str(),
                parenthesis_indexes.size(),
                d);

data/vendor/faiss/faiss/index_io.h CHANGED

@@ -62,6 +62,10 @@ const int IO_FLAG_PQ_SKIP_SDC_TABLE = 32;
 // try to memmap data (useful to load an ArrayInvertedLists as an
 // OnDiskInvertedLists)
 const int IO_FLAG_MMAP = IO_FLAG_SKIP_IVF_DATA | 0x646f0000;
+// mmap that handles codes for IndexFlatCodes-derived indices and HNSW.
+// this is a temporary solution, it is expected to be merged with IO_FLAG_MMAP
+//   after OnDiskInvertedLists get properly updated.
+const int IO_FLAG_MMAP_IFC = 1 << 9;
 Index* read_index(const char* fname, int io_flags = 0);
 Index* read_index(FILE* f, int io_flags = 0);

data/vendor/faiss/faiss/invlists/InvertedLists.cpp CHANGED

@@ -181,7 +181,7 @@ size_t InvertedLists::copy_subset_to(
 }
 double InvertedLists::imbalance_factor() const {
-    std::vector<int> hist(nlist);
+    std::vector<int64_t> hist(nlist);
     for (size_t i = 0; i < nlist; i++) {
         hist[i] = list_size(i);
@@ -330,8 +330,8 @@ void ArrayInvertedLists::update_entries(
 }
 void ArrayInvertedLists::permute_invlists(const idx_t* map) {
-    std::vector<std::vector<uint8_t>> new_codes(nlist);
-    std::vector<std::vector<idx_t>> new_ids(nlist);
+    std::vector<MaybeOwnedVector<uint8_t>> new_codes(nlist);
+    std::vector<MaybeOwnedVector<idx_t>> new_ids(nlist);
     for (size_t i = 0; i < nlist; i++) {
         size_t o = map[i];

data/vendor/faiss/faiss/invlists/InvertedLists.h CHANGED

@@ -15,9 +15,11 @@
  * the interface.
  */
-#include <faiss/MetricType.h>
 #include <vector>
+#include <faiss/MetricType.h>
+#include <faiss/impl/maybe_owned_vector.h>
 namespace faiss {
 struct InvertedListsIterator {
@@ -241,8 +243,8 @@ struct InvertedLists {
 /// simple (default) implementation as an array of inverted lists
 struct ArrayInvertedLists : InvertedLists {
-    std::vector<std::vector<uint8_t>> codes; // binary codes, size nlist
-    std::vector<std::vector<idx_t>> ids;     ///< Inverted lists for indexes
+    std::vector<MaybeOwnedVector<uint8_t>> codes; // binary codes, size nlist
+    std::vector<MaybeOwnedVector<idx_t>> ids; ///< Inverted lists for indexes
     ArrayInvertedLists(size_t nlist, size_t code_size);

data/vendor/faiss/faiss/invlists/InvertedListsIOHook.cpp CHANGED

@@ -13,9 +13,9 @@
 #include <faiss/invlists/BlockInvertedLists.h>
-#ifndef _MSC_VER
+#ifndef _WIN32
 #include <faiss/invlists/OnDiskInvertedLists.h>
-#endif // !_MSC_VER
+#endif // !_WIN32
 namespace faiss {
@@ -33,7 +33,7 @@ namespace {
 /// std::vector that deletes its contents
 struct IOHookTable : std::vector<InvertedListsIOHook*> {
     IOHookTable() {
-#ifndef _MSC_VER
+#ifndef _WIN32
         push_back(new OnDiskInvertedListsIOHook());
 #endif
         push_back(new BlockInvertedListsIOHook());

data/vendor/faiss/faiss/python/python_callbacks.cpp CHANGED

@@ -134,3 +134,27 @@ PyCallbackIDSelector::~PyCallbackIDSelector() {
     PyThreadLock gil;
     Py_DECREF(callback);
 }
+/***********************************************************
+ * Callbacks for IVF index sharding
+ ***********************************************************/
+PyCallbackShardingFunction::PyCallbackShardingFunction(PyObject* callback)
+        : callback(callback) {
+    PyThreadLock gil;
+    Py_INCREF(callback);
+}
+int64_t PyCallbackShardingFunction::operator()(int64_t i, int64_t shard_count) {
+    PyThreadLock gil;
+    PyObject* shard_id = PyObject_CallFunction(callback, "LL", i, shard_count);
+    if (shard_id == nullptr) {
+        FAISS_THROW_MSG("propagate py error");
+    }
+    return PyLong_AsLongLong(shard_id);
+}
+PyCallbackShardingFunction::~PyCallbackShardingFunction() {
+    PyThreadLock gil;
+    Py_DECREF(callback);
+}

data/vendor/faiss/faiss/python/python_callbacks.h CHANGED

@@ -7,6 +7,7 @@
 #pragma once
+#include <faiss/IVFlib.h>
 #include <faiss/impl/IDSelector.h>
 #include <faiss/impl/io.h>
 #include <faiss/invlists/InvertedLists.h>
@@ -58,3 +59,24 @@ struct PyCallbackIDSelector : faiss::IDSelector {
     ~PyCallbackIDSelector() override;
 };
+/***********************************************************
+ * Callbacks for IVF index sharding
+ ***********************************************************/
+struct PyCallbackShardingFunction : faiss::ivflib::ShardingFunction {
+    PyObject* callback;
+    explicit PyCallbackShardingFunction(PyObject* callback);
+    int64_t operator()(int64_t i, int64_t shard_count) override;
+    ~PyCallbackShardingFunction() override;
+    PyCallbackShardingFunction(const PyCallbackShardingFunction&) = delete;
+    PyCallbackShardingFunction(PyCallbackShardingFunction&&) noexcept = default;
+    PyCallbackShardingFunction& operator=(const PyCallbackShardingFunction&) =
+            default;
+    PyCallbackShardingFunction& operator=(PyCallbackShardingFunction&&) =
+            default;
+};

data/vendor/faiss/faiss/utils/approx_topk_hamming/approx_topk_hamming.h CHANGED

@@ -46,9 +46,11 @@ struct HeapWithBucketsForHamming32<
             // output distances
             int* const __restrict bh_val,
             // output indices, each being within [0, n) range
-            int64_t* const __restrict bh_ids) {
+            int64_t* const __restrict bh_ids,
+            // optional id selector for filtering
+            const IDSelector* sel = nullptr) {
         // forward a call to bs_addn with 1 beam
-        bs_addn(1, n, hc, binaryVectors, k, bh_val, bh_ids);
+        bs_addn(1, n, hc, binaryVectors, k, bh_val, bh_ids, sel);
     }
     static void bs_addn(
@@ -66,7 +68,9 @@ struct HeapWithBucketsForHamming32<
             int* const __restrict bh_val,
             // output indices, each being within [0, n_per_beam * beam_size)
             // range
-            int64_t* const __restrict bh_ids) {
+            int64_t* const __restrict bh_ids,
+            // optional id selector for filtering
+            const IDSelector* sel = nullptr) {
         //
         using C = CMax<int, int64_t>;
@@ -95,11 +99,22 @@ struct HeapWithBucketsForHamming32<
             for (uint32_t ip = 0; ip < nb; ip += NBUCKETS) {
                 for (uint32_t j = 0; j < NBUCKETS_8; j++) {
                     uint32_t hamming_distances[8];
+                    uint8_t valid_counter = 0;
                     for (size_t j8 = 0; j8 < 8; j8++) {
-                        hamming_distances[j8] = hc.hamming(
-                                binary_vectors +
-                                (j8 + j * 8 + ip + n_per_beam * beam_index) *
-                                        code_size);
+                        const uint32_t idx =
+                                j8 + j * 8 + ip + n_per_beam * beam_index;
+                        if (!sel || sel->is_member(idx)) {
+                            hamming_distances[j8] = hc.hamming(
+                                    binary_vectors + idx * code_size);
+                            valid_counter++;
+                        } else {
+                            hamming_distances[j8] =
+                                    std::numeric_limits<int32_t>::max();
+                        }
+                    }
+                    if (valid_counter == 8) {
+                        continue; // Skip if all vectors are filtered out
                     }
                     // loop. Compiler should get rid of unneeded ops
@@ -157,7 +172,8 @@ struct HeapWithBucketsForHamming32<
                         const auto value = min_distances_scalar[j8];
                         const auto index = min_indices_scalar[j8];
-                        if (C::cmp2(bh_val[0], value, bh_ids[0], index)) {
+                        if (value < std::numeric_limits<int32_t>::max() &&
+                            C::cmp2(bh_val[0], value, bh_ids[0], index)) {
                             heap_replace_top<C>(
                                     k, bh_val, bh_ids, value, index);
                         }
@@ -168,11 +184,13 @@ struct HeapWithBucketsForHamming32<
             // process leftovers
             for (uint32_t ip = nb; ip < n_per_beam; ip++) {
                 const auto index = ip + n_per_beam * beam_index;
-                const auto value =
-                        hc.hamming(binary_vectors + (index)*code_size);
+                if (!sel || sel->is_member(index)) {
+                    const auto value =
+                            hc.hamming(binary_vectors + (index)*code_size);
-                if (C::cmp(bh_val[0], value)) {
-                    heap_replace_top<C>(k, bh_val, bh_ids, value, index);
+                    if (C::cmp(bh_val[0], value)) {
+                        heap_replace_top<C>(k, bh_val, bh_ids, value, index);
+                    }
                 }
             }
         }

data/vendor/faiss/faiss/utils/hamming.cpp CHANGED

@@ -30,6 +30,7 @@
 #include <faiss/impl/AuxIndexStructures.h>
 #include <faiss/impl/FaissAssert.h>
+#include <faiss/impl/IDSelector.h>
 #include <faiss/utils/Heap.h>
 #include <faiss/utils/approx_topk_hamming/approx_topk_hamming.h>
 #include <faiss/utils/utils.h>
@@ -62,15 +63,15 @@ void hammings(
         const uint64_t* __restrict bs2,
         size_t n1,
         size_t n2,
-        size_t nwords,
+        size_t nbits,
         hamdis_t* __restrict dis) {
     size_t i, j;
-    n1 *= nwords;
-    n2 *= nwords;
-    for (i = 0; i < n1; i += nwords) {
-        const uint64_t* bs1_ = bs1 + i;
-        for (j = 0; j < n2; j += nwords)
-            dis[j] = hamming(bs1_, bs2 + j, nwords);
+    const size_t nwords = nbits / 64;
+    for (i = 0; i < n1; i++) {
+        const uint64_t* __restrict bs1_ = bs1 + i * nwords;
+        hamdis_t* __restrict dis_ = dis + i * n2;
+        for (j = 0; j < n2; j++)
+            dis_[j] = hamming(bs1_, bs2 + j * nwords, nwords);
     }
 }
@@ -171,7 +172,8 @@ void hammings_knn_hc(
         size_t n2,
         bool order = true,
         bool init_heap = true,
-        ApproxTopK_mode_t approx_topk_mode = ApproxTopK_mode_t::EXACT_TOPK) {
+        ApproxTopK_mode_t approx_topk_mode = ApproxTopK_mode_t::EXACT_TOPK,
+        const faiss::IDSelector* sel = nullptr) {
     size_t k = ha->k;
     if (init_heap)
         ha->heapify();
@@ -204,7 +206,7 @@ void hammings_knn_hc(
                 NB,                                                          \
                 BD,                                                          \
                 HammingComputer>::                                           \
-                addn(j1 - j0, hc, bs2_, k, bh_val_, bh_ids_);                \
+                addn(j1 - j0, hc, bs2_, k, bh_val_, bh_ids_, sel);           \
         break;
             switch (approx_topk_mode) {
@@ -214,6 +216,9 @@ void hammings_knn_hc(
                 HANDLE_APPROX(32, 2)
                 default: {
                     for (size_t j = j0; j < j1; j++, bs2_ += bytes_per_code) {
+                        if (sel && !sel->is_member(j)) {
+                            continue;
+                        }
                         dis = hc.hamming(bs2_);
                         if (dis < bh_val_[0]) {
                             faiss::maxheap_replace_top<hamdis_t>(
@@ -238,7 +243,8 @@ void hammings_knn_mc(
         size_t nb,
         size_t k,
         int32_t* __restrict distances,
-        int64_t* __restrict labels) {
+        int64_t* __restrict labels,
+        const faiss::IDSelector* sel) {
     const int nBuckets = bytes_per_code * 8 + 1;
     std::vector<int> all_counters(na * nBuckets, 0);
     std::unique_ptr<int64_t[]> all_ids_per_dis(new int64_t[na * nBuckets * k]);
@@ -259,7 +265,9 @@ void hammings_knn_mc(
 #pragma omp parallel for
         for (int64_t i = 0; i < na; ++i) {
             for (size_t j = j0; j < j1; ++j) {
-                cs[i].update_counter(b + j * bytes_per_code, j);
+                if (!sel || sel->is_member(j)) {
+                    cs[i].update_counter(b + j * bytes_per_code, j);
+                }
             }
         }
     }
@@ -291,7 +299,8 @@ void hamming_range_search(
         size_t nb,
         int radius,
         size_t code_size,
-        RangeSearchResult* res) {
+        RangeSearchResult* res,
+        const faiss::IDSelector* sel) {
 #pragma omp parallel
     {
         RangeSearchPartialResult pres(res);
@@ -303,9 +312,11 @@ void hamming_range_search(
             RangeQueryResult& qres = pres.new_result(i);
             for (size_t j = 0; j < nb; j++) {
-                int dis = hc.hamming(yi);
-                if (dis < radius) {
-                    qres.add(dis, j);
+                if (!sel || sel->is_member(j)) {
+                    int dis = hc.hamming(yi);
+                    if (dis < radius) {
+                        qres.add(dis, j);
+                    }
                 }
                 yi += code_size;
             }
@@ -489,10 +500,21 @@ void hammings_knn_hc(
         size_t nb,
         size_t ncodes,
         int order,
-        ApproxTopK_mode_t approx_topk_mode) {
+        ApproxTopK_mode_t approx_topk_mode,
+        const faiss::IDSelector* sel) {
     Run_hammings_knn_hc r;
     dispatch_HammingComputer(
-            ncodes, r, ncodes, ha, a, b, nb, order, true, approx_topk_mode);
+            ncodes,
+            r,
+            ncodes,
+            ha,
+            a,
+            b,
+            nb,
+            order,
+            true,
+            approx_topk_mode,
+            sel);
 }
 void hammings_knn_mc(
@@ -503,10 +525,11 @@ void hammings_knn_mc(
         size_t k,
         size_t ncodes,
         int32_t* __restrict distances,
-        int64_t* __restrict labels) {
+        int64_t* __restrict labels,
+        const faiss::IDSelector* sel) {
     Run_hammings_knn_mc r;
     dispatch_HammingComputer(
-            ncodes, r, ncodes, a, b, na, nb, k, distances, labels);
+            ncodes, r, ncodes, a, b, na, nb, k, distances, labels, sel);
 }
 void hamming_range_search(
@@ -516,10 +539,11 @@ void hamming_range_search(
         size_t nb,
         int radius,
         size_t code_size,
-        RangeSearchResult* result) {
+        RangeSearchResult* result,
+        const faiss::IDSelector* sel) {
     Run_hamming_range_search r;
     dispatch_HammingComputer(
-            code_size, r, a, b, na, nb, radius, code_size, result);
+            code_size, r, a, b, na, nb, radius, code_size, result, sel);
 }
 /* Count number of matches given a max threshold            */

data/vendor/faiss/faiss/utils/hamming.h CHANGED

@@ -27,6 +27,7 @@
 #include <stdint.h>
+#include <faiss/impl/IDSelector.h>
 #include <faiss/impl/platform_macros.h>
 #include <faiss/utils/Heap.h>
@@ -135,7 +136,8 @@ void hammings_knn_hc(
         size_t nb,
         size_t ncodes,
         int ordered,
-        ApproxTopK_mode_t approx_topk_mode = ApproxTopK_mode_t::EXACT_TOPK);
+        ApproxTopK_mode_t approx_topk_mode = ApproxTopK_mode_t::EXACT_TOPK,
+        const faiss::IDSelector* sel = nullptr);
 /* Legacy alias to hammings_knn_hc. */
 void hammings_knn(
@@ -166,7 +168,8 @@ void hammings_knn_mc(
         size_t k,
         size_t ncodes,
         int32_t* distances,
-        int64_t* labels);
+        int64_t* labels,
+        const faiss::IDSelector* sel = nullptr);
 /** same as hammings_knn except we are doing a range search with radius */
 void hamming_range_search(
@@ -176,7 +179,8 @@ void hamming_range_search(
         size_t nb,
         int radius,
         size_t ncodes,
-        RangeSearchResult* result);
+        RangeSearchResult* result,
+        const faiss::IDSelector* sel = nullptr);
 /* Counting the number of matches or of cross-matches (without returning them)
    For use with function that assume pre-allocated memory */

data/vendor/faiss/faiss/utils/hamming_distance/avx512-inl.h CHANGED

@@ -11,7 +11,7 @@
 // AVX512 version
 // The _mm512_popcnt_epi64 intrinsic is used to accelerate Hamming distance
 // calculations in HammingComputerDefault and HammingComputer64. This intrinsic
-// is not available in the default FAISS avx512 build mode but is only
+// is not available in the default Faiss avx512 build mode but is only
 // available in the avx512_spr build mode, which targets Intel(R) Sapphire
 // Rapids.