npm - native-vector-store - Versions diffs - 0.1.0 → 0.3.0 - Mend

native-vector-store 0.1.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53) hide show

package/README.md +242 -12
package/binding.gyp +22 -10
package/deps/simdjson/simdjson.cpp +56403 -0
package/deps/simdjson/simdjson.h +123534 -0
package/docs/PERFORMANCE_CASE_STUDY.md +130 -0
package/docs/PREBUILDS.md +69 -0
package/docs/VectorStore.html +180 -0
package/docs/VectorStoreWrapper.html +1356 -0
package/docs/fonts/OpenSans-Bold-webfont.eot +0 -0
package/docs/fonts/OpenSans-Bold-webfont.svg +1830 -0
package/docs/fonts/OpenSans-Bold-webfont.woff +0 -0
package/docs/fonts/OpenSans-BoldItalic-webfont.eot +0 -0
package/docs/fonts/OpenSans-BoldItalic-webfont.svg +1830 -0
package/docs/fonts/OpenSans-BoldItalic-webfont.woff +0 -0
package/docs/fonts/OpenSans-Italic-webfont.eot +0 -0
package/docs/fonts/OpenSans-Italic-webfont.svg +1830 -0
package/docs/fonts/OpenSans-Italic-webfont.woff +0 -0
package/docs/fonts/OpenSans-Light-webfont.eot +0 -0
package/docs/fonts/OpenSans-Light-webfont.svg +1831 -0
package/docs/fonts/OpenSans-Light-webfont.woff +0 -0
package/docs/fonts/OpenSans-LightItalic-webfont.eot +0 -0
package/docs/fonts/OpenSans-LightItalic-webfont.svg +1835 -0
package/docs/fonts/OpenSans-LightItalic-webfont.woff +0 -0
package/docs/fonts/OpenSans-Regular-webfont.eot +0 -0
package/docs/fonts/OpenSans-Regular-webfont.svg +1831 -0
package/docs/fonts/OpenSans-Regular-webfont.woff +0 -0
package/docs/global.html +561 -0
package/docs/index.html +570 -0
package/docs/scripts/linenumber.js +25 -0
package/docs/scripts/prettify/Apache-License-2.0.txt +202 -0
package/docs/scripts/prettify/lang-css.js +2 -0
package/docs/scripts/prettify/prettify.js +28 -0
package/docs/styles/jsdoc-default.css +358 -0
package/docs/styles/prettify-jsdoc.css +111 -0
package/docs/styles/prettify-tomorrow.css +132 -0
package/index.js +162 -0
package/package.json +30 -7
package/prebuilds/darwin-arm64/native-vector-store.node +0 -0
package/prebuilds/darwin-x64/native-vector-store.node +0 -0
package/prebuilds/linux-arm64/native-vector-store.node +0 -0
package/prebuilds/linux-x64/native-vector-store.node +0 -0
package/prebuilds/linux-x64-musl/napi-v9/native-vector-store.node +0 -0
package/prebuilds/linux-x64-musl/native-vector-store.node +0 -0
package/prebuilds/win32-x64/native-vector-store.node +0 -0
package/src/Makefile +87 -0
package/src/test_main.cpp +173 -0
package/src/test_stress.cpp +394 -0
package/src/vector_store.cpp +344 -0
package/src/vector_store.h +21 -323
package/native-vector-store-0.1.0.tgz +0 -0
package/scripts/build-prebuilds.sh +0 -23
/package/{src → deps/atomic_queue}/atomic_queue.h +0 -0
/package/{src → deps/atomic_queue}/defs.h +0 -0

package/src/vector_store.h CHANGED Viewed

@@ -26,74 +26,9 @@ class ArenaAllocator {
     std::mutex chunk_creation_mutex_;
 public:
-    ArenaAllocator() : head_(std::make_unique<Chunk>()),
-                       current_(head_.get()) {}
-    void* allocate(size_t size, size_t align = 64) {
-        // Validate alignment is power of 2 and reasonable
-        assert(align > 0 && (align & (align - 1)) == 0);
-        if (align > 4096) {
-            return nullptr;  // Alignment too large
-        }
-        // Validate size
-        if (size > CHUNK_SIZE) {
-            return nullptr;  // Cannot allocate larger than chunk size
-        }
-        Chunk* chunk = current_.load(std::memory_order_acquire);
-        while (true) {
-            size_t old_offset = chunk->offset.load(std::memory_order_relaxed);
-            // Calculate the pointer that would result from current offset
-            void* ptr = chunk->data + old_offset;
-            // Calculate how much padding we need for alignment
-            size_t misalignment = (uintptr_t)ptr & (align - 1);
-            size_t padding = misalignment ? (align - misalignment) : 0;
-            size_t aligned_offset = old_offset + padding;
-            size_t new_offset = aligned_offset + size;
-            if (new_offset > CHUNK_SIZE) {
-                // Need new chunk
-                Chunk* next = chunk->next.load(std::memory_order_acquire);
-                if (!next) {
-                    // Lock to prevent multiple threads creating chunks
-                    std::lock_guard<std::mutex> lock(chunk_creation_mutex_);
-                    // Double-check after acquiring lock
-                    next = chunk->next.load(std::memory_order_acquire);
-                    if (!next) {
-                        auto new_chunk = std::make_unique<Chunk>();
-                        next = new_chunk.get();
-                        chunk->next.store(next, std::memory_order_release);
-                        // Transfer ownership after setting atomic pointer
-                        new_chunk.release();
-                    }
-                }
-                // Update current to the new chunk
-                current_.store(next, std::memory_order_release);
-                chunk = next;
-                continue;
-            }
-            if (chunk->offset.compare_exchange_weak(old_offset, new_offset,
-                                                   std::memory_order_release,
-                                                   std::memory_order_relaxed)) {
-                return chunk->data + aligned_offset;
-            }
-        }
-    }
-    ~ArenaAllocator() {
-        // Clean up linked chunks
-        Chunk* chunk = head_->next.load(std::memory_order_acquire);
-        while (chunk) {
-            Chunk* next = chunk->next.load(std::memory_order_acquire);
-            delete chunk;
-            chunk = next;
-        }
-    }
+    ArenaAllocator();
+    void* allocate(size_t size, size_t align = 64);
+    ~ArenaAllocator();
 };
 struct Document {
@@ -107,9 +42,7 @@ struct TopK {
     size_t k;
     std::vector<std::pair<float, size_t>> heap; // min-heap by score
-    explicit TopK(size_t k = 0) : k(k) {
-        heap.reserve(k + 1); // Reserve k+1 to avoid reallocation during push
-    }
+    explicit TopK(size_t k = 0);
     // Make TopK move-only to prevent copy-construction races
     TopK(const TopK&) = delete;
@@ -117,46 +50,24 @@ struct TopK {
     TopK(TopK&&) = default;
     TopK& operator=(TopK&&) = default;
-    void push(float score, size_t idx) {
-        if (heap.size() < k) {
-            heap.emplace_back(score, idx);
-            std::push_heap(heap.begin(), heap.end(), cmp);
-        } else if (k > 0 && score > heap.front().first) {
-            // Replace the minimum element
-            std::pop_heap(heap.begin(), heap.end(), cmp);
-            heap.back() = {score, idx};
-            std::push_heap(heap.begin(), heap.end(), cmp);
-        }
-    }
+    void push(float score, size_t idx);
     // Comparator for min-heap (greater than for min-heap behavior)
-    static bool cmp(const std::pair<float, size_t>& a, const std::pair<float, size_t>& b) {
-        return a.first > b.first;
-    }
+    static bool cmp(const std::pair<float, size_t>& a, const std::pair<float, size_t>& b);
-    void merge(const TopK& other) {
-        // More efficient: if we have space, bulk insert then re-heapify
-        if (heap.size() + other.heap.size() <= k) {
-            heap.insert(heap.end(), other.heap.begin(), other.heap.end());
-            std::make_heap(heap.begin(), heap.end(), cmp);
-        } else {
-            // Otherwise, insert one by one
-            for (const auto& [score, idx] : other.heap) {
-                push(score, idx);
-            }
-        }
-    }
+    void merge(const TopK& other);
 };
 class VectorStore {
-    const size_t dim_;
-    ArenaAllocator arena_;
+public:
     struct Entry {
         Document doc;
         float* embedding;  // Extracted pointer for fast access
     };
+private:
+    const size_t dim_;
+    ArenaAllocator arena_;
     std::vector<Entry> entries_;
     std::atomic<size_t> count_{0};  // Atomic for parallel loading
@@ -164,238 +75,25 @@ class VectorStore {
     mutable std::shared_mutex search_mutex_;  // Protects against overlapping OpenMP teams
 public:
-    explicit VectorStore(size_t dim) : dim_(dim) {
-        entries_.resize(1'000'000);  // Pre-size with default-constructed entries
-    }
+    explicit VectorStore(size_t dim);
     // Overload for document type (used in test_main.cpp)
-    simdjson::error_code add_document(simdjson::ondemand::document& json_doc) {
-        simdjson::ondemand::object obj;
-        auto error = json_doc.get_object().get(obj);
-        if (error) {
-            return error;
-        }
-        return add_document(obj);
-    }
+    simdjson::error_code add_document(simdjson::ondemand::document& json_doc);
-    simdjson::error_code add_document(simdjson::ondemand::object& json_doc) {
-        // Cannot add documents after finalization
-        if (is_finalized_.load(std::memory_order_acquire)) {
-            return simdjson::INCORRECT_TYPE;
-        }
-        // Parse with error handling
-        std::string_view id, text;
-        auto error = json_doc["id"].get_string().get(id);
-        if (error) return error;
-        error = json_doc["text"].get_string().get(text);
-        if (error) return error;
-        // Calculate sizes
-        size_t emb_size = dim_ * sizeof(float);
-        size_t id_size = id.size() + 1;
-        size_t text_size = text.size() + 1;
-        // Allocate temporary buffer for embedding
-        std::vector<float> temp_embedding;
-        temp_embedding.reserve(dim_);
-        // Process metadata and embedding first
-        simdjson::ondemand::object metadata;
-        error = json_doc["metadata"].get_object().get(metadata);
-        if (error) return error;
-        simdjson::ondemand::array emb_array;
-        error = metadata["embedding"].get_array().get(emb_array);
-        if (error) return error;
-        // Consume the array before touching anything else
-        size_t i = 0;
-        for (auto value_result : emb_array) {
-            simdjson::ondemand::value v;
-            error = value_result.get(v);
-            if (error) return error;
-            double val;
-            error = v.get_double().get(val);
-            if (error) return error;
-            if (i >= dim_) {
-                return simdjson::CAPACITY; // Too many embedding values
-            }
-            temp_embedding.push_back(float(val));
-            i++;
-        }
-        // Verify we got the expected number of embedding values
-        if (i != dim_) {
-            return simdjson::INCORRECT_TYPE; // Wrong embedding dimension
-        }
-        // Now it is safe to take the raw metadata JSON
-        std::string_view raw_json;
-        error = metadata.raw_json().get(raw_json);
-        if (error) return error;
-        size_t meta_size = raw_json.size() + 1;
-        // Single arena allocation
-        char* base = (char*)arena_.allocate(emb_size + id_size + text_size + meta_size);
-        if (!base) {
-            return simdjson::MEMALLOC;  // Allocation failed
-        }
-        // Layout: [embedding][id][text][metadata_json]
-        float* emb_ptr = (float*)base;
-        char* id_ptr = base + emb_size;
-        char* text_ptr = id_ptr + id_size;
-        char* meta_ptr = text_ptr + text_size;
-        // Copy embedding from temporary buffer
-        std::memcpy(emb_ptr, temp_embedding.data(), emb_size);
-        // Copy strings (adding null terminator)
-        std::memcpy(id_ptr, id.data(), id.size());
-        id_ptr[id.size()] = '\0';
-        std::memcpy(text_ptr, text.data(), text.size());
-        text_ptr[text.size()] = '\0';
-        std::memcpy(meta_ptr, raw_json.data(), raw_json.size());
-        meta_ptr[raw_json.size()] = '\0';
-        // Atomic increment for parallel loading
-        size_t idx = count_.fetch_add(1, std::memory_order_relaxed);
-        // Bounds check
-        if (idx >= entries_.size()) {
-            count_.fetch_sub(1, std::memory_order_relaxed);
-            return simdjson::CAPACITY;
-        }
-        // Construct entry directly - no synchronization needed
-        entries_[idx] = Entry{
-            .doc = Document{
-                .id = std::string_view(id_ptr, id.size()),
-                .text = std::string_view(text_ptr, text.size()),
-                .metadata_json = std::string_view(meta_ptr, raw_json.size())
-            },
-            .embedding = emb_ptr
-        };
-        return simdjson::SUCCESS;
-    }
+    simdjson::error_code add_document(simdjson::ondemand::object& json_doc);
     // Finalize the store: normalize and switch to serving phase
-    void finalize() {
-        // If already finalized, do nothing
-        if (is_finalized_.load(std::memory_order_acquire)) {
-            return;
-        }
-        // Get final count
-        size_t final_count = count_.load(std::memory_order_acquire);
-        // Normalize all embeddings (single-threaded, no races)
-        for (size_t i = 0; i < final_count; ++i) {
-            float* emb = entries_[i].embedding;
-            if (!emb) continue;  // Skip uninitialized entries
-            float sum = 0.0f;
-            #pragma omp simd reduction(+:sum)
-            for (size_t j = 0; j < dim_; ++j) {
-                sum += emb[j] * emb[j];
-            }
-            if (sum > 1e-10f) {  // Avoid division by zero
-                float inv_norm = 1.0f / std::sqrt(sum);
-                #pragma omp simd
-                for (size_t j = 0; j < dim_; ++j) {
-                    emb[j] *= inv_norm;
-                }
-            }
-        }
-        // Ensure all threads see the normalized data
-        #pragma omp barrier
-        // Mark as finalized - this is the ONLY place this flag is set
-        is_finalized_.store(true, std::memory_order_seq_cst);
-    }
+    void finalize();
     // Deprecated: use finalize() instead
-    void normalize_all() {
-        finalize();
-    }
+    void normalize_all();
     std::vector<std::pair<float, size_t>>
-    search(const float* query, size_t k) const {
-        // Exclusive lock: prevent overlapping OpenMP teams
-        // Since each search uses all threads via OpenMP, concurrent searches provide no benefit
-        std::unique_lock<std::shared_mutex> lock(search_mutex_);
-        // Search can ONLY run if finalized
-        if (!is_finalized_.load(std::memory_order_acquire)) {
-            return {};
-        }
-        size_t n = count_.load(std::memory_order_acquire);
-        if (n == 0 || k == 0) return {};
-        k = std::min(k, n);  // Ensure k doesn't exceed count
-        // Always use per-thread heaps to avoid any shared memory races
-        const int num_threads = omp_get_max_threads();
-        std::vector<TopK> thread_heaps;
-        thread_heaps.reserve(num_threads);
-        for (int i = 0; i < num_threads; ++i) {
-            thread_heaps.emplace_back(k);  // in-place construction, no copies
-        }
-         std::vector<std::pair<float,std::size_t>> result;
-        #pragma omp parallel
-        {
-            const int tid = omp_get_thread_num();
-            TopK& local_heap = thread_heaps[tid];
-            #pragma omp for  // default barrier kept - ensures all threads finish before merge
-            for (size_t i = 0; i < n; ++i) {
-                float score = 0.0f;
-                const float* emb = entries_[i].embedding;
-                #pragma omp simd reduction(+:score)
-                for (size_t j = 0; j < dim_; ++j) {
-                    score += emb[j] * query[j];
-                }
-                local_heap.push(score, i);
-            }
-            #pragma omp barrier
-            #pragma omp single
-            {
-                TopK final_heap(k);
-                for (auto& th : thread_heaps) final_heap.merge(th);
-                result = std::move(final_heap.heap);
-            }
-        }
-        std::sort(result.begin(), result.end(),
-                  [](const auto& a, const auto& b) { return a.first > b.first; });
-        return result;
-    }
+    search(const float* query, size_t k) const;
-    const Entry& get_entry(size_t idx) const {
-        return entries_[idx];
-    }
+    const Entry& get_entry(size_t idx) const;
-    size_t size() const {
-        return count_.load(std::memory_order_acquire);
-    }
+    size_t size() const;
-    bool is_finalized() const {
-        return is_finalized_.load(std::memory_order_acquire);
-    }
+    bool is_finalized() const;
 };

package/native-vector-store-0.1.0.tgz DELETED Viewed

Binary file

package/scripts/build-prebuilds.sh DELETED Viewed

@@ -1,23 +0,0 @@
-#!/bin/bash
-# Build prebuilds for current platform
-echo "Building prebuilds for native-vector-store..."
-# Clean previous builds
-rm -rf prebuilds/
-# Build for current platform and architecture
-echo "Building for current platform..."
-npx prebuildify --napi --strip
-# For local testing on macOS, build both architectures if on Apple Silicon
-if [[ "$OSTYPE" == "darwin"* ]] && [[ "$(uname -m)" == "arm64" ]]; then
-    echo "Building universal binary for macOS..."
-    npx prebuildify --napi --strip --arch x64
-    npx prebuildify --napi --strip --arch arm64
-fi
-echo "Prebuilds created:"
-find prebuilds -type f -name "*.node" | sort
-echo "Done!"

/package/{src → deps/atomic_queue}/atomic_queue.h RENAMED Viewed

File without changes

/package/{src → deps/atomic_queue}/defs.h RENAMED Viewed

File without changes