npm - vectlite - Versions diffs - 0.9.0 → 0.9.2 - Mend

vectlite 0.9.0 → 0.9.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

package/README.md +26 -14
package/index.d.ts +60 -0
package/index.js +135 -8
package/native/Cargo.toml +1 -1
package/native/src/lib.rs +80 -47
package/native/vectlite-core/Cargo.toml +1 -1
package/native/vectlite-core/src/lib.rs +512 -152
package/native/vectlite-core/src/quantization.rs +234 -49
package/package.json +1 -1
package/prebuilds/darwin-arm64/vectlite.node +0 -0
package/prebuilds/darwin-x64/vectlite.node +0 -0
package/prebuilds/linux-x64-gnu/vectlite.node +0 -0
package/prebuilds/win32-x64-msvc/vectlite.node +0 -0

package/native/vectlite-core/src/quantization.rs CHANGED Viewed

@@ -1,14 +1,16 @@
 //! Vector quantization module for memory-efficient similarity search.
 //!
 //! Supports three quantization strategies:
-//! - **Scalar (int8)**: 4x memory reduction with minimal recall loss
-//! - **Binary**: 32x memory reduction, uses Hamming distance for fast filtering
+//! - **Scalar (int8)**: compact in-memory candidate index with minimal recall loss
+//! - **Binary**: smallest in-memory candidate index, uses Hamming distance for fast filtering
 //! - **Product Quantization (PQ)**: Configurable compression for very large datasets
 //!
 //! All strategies support a 2-stage pipeline: fast quantized search followed by
 //! exact float32 rescoring of top candidates.
-use std::io::{Read, Write};
+use std::io::{Error, ErrorKind, Read, Write};
+use crate::{DistanceMetric, Result, VectLiteError};
 // ---------------------------------------------------------------------------
 // Public types
@@ -18,10 +20,10 @@ use std::io::{Read, Write};
 #[derive(Clone, Debug, PartialEq)]
 pub enum QuantizationConfig {
     /// Scalar quantization: maps each f32 dimension to int8 using per-dimension
-    /// min/max calibration. 4x memory reduction.
+    /// min/max calibration for a compact in-memory candidate index.
     Scalar(ScalarQuantizationConfig),
     /// Binary quantization: maps each f32 dimension to a single bit.
-    /// 32x memory reduction. Best for high-dimensional normalized embeddings.
+    /// Smallest in-memory candidate index. Best for high-dimensional normalized embeddings.
     Binary(BinaryQuantizationConfig),
     /// Product quantization: splits vector into sub-vectors and quantizes each
     /// to a centroid index. Highest compression for large datasets.
@@ -31,14 +33,14 @@ pub enum QuantizationConfig {
 #[derive(Clone, Debug, PartialEq)]
 pub struct ScalarQuantizationConfig {
     /// Number of top candidates from quantized search to rescore with float32.
-    /// Default: 5x top_k (minimum 100).
+    /// Default: 10x top_k.
     pub rescore_multiplier: usize,
 }
 impl Default for ScalarQuantizationConfig {
     fn default() -> Self {
         Self {
-            rescore_multiplier: 5,
+            rescore_multiplier: 10,
         }
     }
 }
@@ -46,7 +48,7 @@ impl Default for ScalarQuantizationConfig {
 #[derive(Clone, Debug, PartialEq)]
 pub struct BinaryQuantizationConfig {
     /// Number of top candidates from Hamming search to rescore with float32.
-    /// Default: 10x top_k (minimum 100).
+    /// Default: 10x top_k.
     pub rescore_multiplier: usize,
 }
@@ -69,6 +71,7 @@ pub struct ProductQuantizationConfig {
     /// Number of k-means training iterations.
     pub training_iterations: usize,
     /// Number of top candidates from PQ search to rescore with float32.
+    /// Default: 10x top_k.
     pub rescore_multiplier: usize,
 }
@@ -83,6 +86,53 @@ impl Default for ProductQuantizationConfig {
     }
 }
+/// Pick the default PQ `num_sub_vectors` for a database vector `dimension`.
+///
+/// Returns the first entry of `[16, 12, 10, 8, 6, 4, 3, 2, 1]` that divides `dimension` evenly, so
+/// the historical default of 16 wins when it fits; otherwise e.g. 100 -> 10, 146 -> 2, 200 -> 10.
+/// No explicit `num_sub_vectors` is needed for such dimensions. Note: `dimension == 0` yields 16.
+pub fn default_product_num_sub_vectors(dimension: usize) -> usize {
+    [16, 12, 10, 8, 6, 4, 3, 2, 1] // preference order: largest candidate first
+        .into_iter()
+        .find(|candidate| dimension % candidate == 0) // first candidate that divides evenly
+        .unwrap_or(1) // never taken: the trailing 1 divides every dimension
+}
+/// List every divisor of `dimension` in ascending order (the valid PQ sub-vector counts); empty for 0.
+pub fn valid_product_num_sub_vectors(dimension: usize) -> Vec<usize> {
+    if dimension == 0 { // a zero dimension reports no valid counts at all
+        return Vec::new();
+    }
+    (1..=dimension) // try every count from 1 up to and including the dimension itself
+        .filter(|candidate| dimension % candidate == 0) // keep exact divisors only
+        .collect()
+}
+/// Validate `config` against `dimension` up front so a bad setting is an `Err`, not a later panic.
+pub fn validate_quantization_config(config: &QuantizationConfig, dimension: usize) -> Result<()> {
+    if let QuantizationConfig::Product(cfg) = config { // only the `Product` variant is checked here
+        if cfg.num_sub_vectors == 0 { // must come first: the `%` below would panic on a zero divisor
+            return Err(VectLiteError::InvalidFormat(
+                "num_sub_vectors must be greater than 0".to_owned(),
+            ));
+        }
+        if dimension % cfg.num_sub_vectors != 0 { // the dimension must split into equal sub-vectors
+            return Err(VectLiteError::InvalidFormat(format!(
+                "dimension ({dimension}) must be divisible by num_sub_vectors ({})",
+                cfg.num_sub_vectors
+            )));
+        }
+        if cfg.num_centroids == 0 || cfg.num_centroids > 256 { // accepted range is 1..=256
+            return Err(VectLiteError::InvalidFormat(
+                "num_centroids must be between 1 and 256".to_owned(),
+            ));
+        }
+    }
+    Ok(()) // every other variant, and a `Product` config that passed all checks, is accepted
+}
 // ---------------------------------------------------------------------------
 // Scalar Quantization
 // ---------------------------------------------------------------------------
@@ -173,18 +223,27 @@ impl ScalarQuantizer {
             .collect()
     }
-    /// Compute approximate cosine distance between a quantized query and all stored vectors.
+    /// Compute approximate cosine similarity between the query and all stored vectors.
     /// Returns indices sorted by approximate similarity (best first).
     pub fn search(&self, query: &[f32], top_k: usize) -> Vec<(usize, f32)> {
-        let rescore_count = (top_k * self.config.rescore_multiplier)
-            .max(100)
-            .min(self.count);
-        let query_quantized = self.quantize_query(query);
+        self.search_with_metric(query, top_k, DistanceMetric::Cosine)
+    }
+    /// Compute approximate metric scores between the query and all stored vectors.
+    /// Returns indices sorted by approximate score (best first).
+    pub fn search_with_metric(
+        &self,
+        query: &[f32],
+        top_k: usize,
+        metric: DistanceMetric,
+    ) -> Vec<(usize, f32)> {
+        assert_eq!(query.len(), self.dimension);
+        let rescore_count = rescore_count(top_k, self.config.rescore_multiplier, self.count);
         let mut scores: Vec<(usize, f32)> = (0..self.count)
             .map(|idx| {
                 let offset = idx * self.dimension;
                 let code_slice = &self.codes[offset..offset + self.dimension];
-                let sim = scalar_quantized_dot(&query_quantized, code_slice);
+                let sim = self.approximate_score(query, code_slice, metric);
                 (idx, sim)
             })
             .collect();
@@ -195,6 +254,71 @@ impl ScalarQuantizer {
         scores
     }
+    fn approximate_score(&self, query: &[f32], code_slice: &[u8], metric: DistanceMetric) -> f32 {
+        match metric { // each arm dequantizes the stored codes and scores them against the raw f32 query
+            DistanceMetric::Cosine => { // cosine similarity: dot / (|query| * |vector|)
+                let mut dot = 0.0_f32;
+                let mut query_norm = 0.0_f32; // holds the squared norm until the sqrt below
+                let mut vector_norm = 0.0_f32; // squared norm of the dequantized stored vector
+                for (((&query_value, &code), &min), &scale) in query
+                    .iter()
+                    .zip(code_slice.iter())
+                    .zip(self.mins.iter())
+                    .zip(self.scales.iter())
+                {
+                    let value = dequantize_scalar(code, min, scale); // code decoded with this position's min/scale
+                    dot += query_value * value;
+                    query_norm += query_value * query_value;
+                    vector_norm += value * value;
+                }
+                if query_norm == 0.0 || vector_norm == 0.0 { // a zero-norm side would divide by zero
+                    0.0 // score such pairs as 0.0 instead
+                } else {
+                    dot / (query_norm.sqrt() * vector_norm.sqrt())
+                }
+            }
+            DistanceMetric::Euclidean => { // negated L2 distance to the dequantized vector
+                let mut sum = 0.0_f32; // running sum of squared differences
+                for (((&query_value, &code), &min), &scale) in query
+                    .iter()
+                    .zip(code_slice.iter())
+                    .zip(self.mins.iter())
+                    .zip(self.scales.iter())
+                {
+                    let delta = query_value - dequantize_scalar(code, min, scale);
+                    sum += delta * delta;
+                }
+                -sum.sqrt() // negated: a smaller distance gives a larger score
+            }
+            DistanceMetric::DotProduct => { // plain dot product, returned without normalization
+                let mut dot = 0.0_f32;
+                for (((&query_value, &code), &min), &scale) in query
+                    .iter()
+                    .zip(code_slice.iter())
+                    .zip(self.mins.iter())
+                    .zip(self.scales.iter())
+                {
+                    dot += query_value * dequantize_scalar(code, min, scale);
+                }
+                dot
+            }
+            DistanceMetric::Manhattan => { // negated L1 distance to the dequantized vector
+                let mut sum = 0.0_f32; // running sum of absolute differences
+                for (((&query_value, &code), &min), &scale) in query
+                    .iter()
+                    .zip(code_slice.iter())
+                    .zip(self.mins.iter())
+                    .zip(self.scales.iter())
+                {
+                    sum += (query_value - dequantize_scalar(code, min, scale)).abs();
+                }
+                -sum // negated: a smaller distance gives a larger score
+            }
+        }
+    }
     /// Rebuild codes from training vectors (used after deserialization with new vectors).
     pub fn rebuild_codes(&mut self, vectors: &[&[f32]]) {
         self.codes.clear();
@@ -311,9 +435,7 @@ impl BinaryQuantizer {
     /// Search using Hamming distance. Returns candidate indices sorted by
     /// Hamming similarity (fewest differing bits first).
     pub fn search(&self, query: &[f32], top_k: usize) -> Vec<(usize, u32)> {
-        let rescore_count = (top_k * self.config.rescore_multiplier)
-            .max(100)
-            .min(self.count);
+        let rescore_count = rescore_count(top_k, self.config.rescore_multiplier, self.count);
         let query_binary = self.binarize_query(query);
         let mut distances: Vec<(usize, u32)> = (0..self.count)
             .map(|idx| {
@@ -476,9 +598,7 @@ impl ProductQuantizer {
     /// Search using asymmetric distance computation (ADC).
     /// Returns candidate indices sorted by approximate L2 distance.
     pub fn search(&self, query: &[f32], top_k: usize) -> Vec<(usize, f32)> {
-        let rescore_count = (top_k * self.config.rescore_multiplier)
-            .max(100)
-            .min(self.count);
+        let rescore_count = rescore_count(top_k, self.config.rescore_multiplier, self.count);
         let distance_table = self.compute_distance_table(query);
         let mut distances: Vec<(usize, f32)> = (0..self.count)
@@ -542,6 +662,20 @@ impl ProductQuantizer {
         let num_centroids = read_usize(reader)?;
         let training_iterations = read_usize(reader)?;
         let rescore_multiplier = read_usize(reader)?;
+        if num_sub_vectors == 0 || dimension % num_sub_vectors != 0 {
+            return Err(Error::new(
+                ErrorKind::InvalidData,
+                format!(
+                    "dimension ({dimension}) must be divisible by num_sub_vectors ({num_sub_vectors})"
+                ),
+            ));
+        }
+        if num_centroids == 0 || num_centroids > 256 {
+            return Err(Error::new(
+                ErrorKind::InvalidData,
+                "num_centroids must be between 1 and 256",
+            ));
+        }
         let sub_dimension = dimension / num_sub_vectors;
         // Read codebooks
@@ -586,7 +720,7 @@ impl ProductQuantizer {
 #[derive(Clone, Debug, PartialEq)]
 pub struct TwoBitQuantizationConfig {
     /// Number of top candidate docs from quantized search to rescore with
-    /// exact float32 MaxSim. Default: 4x top_k (minimum 50).
+    /// exact float32 MaxSim. Default: 4x top_k.
     pub rescore_multiplier: usize,
 }
@@ -619,11 +753,7 @@ pub struct TwoBitQuantizer {
 impl TwoBitQuantizer {
     /// Train a 2-bit quantizer by computing per-dimension quartiles.
-    pub fn train(
-        vectors: &[&[f32]],
-        dimension: usize,
-        config: TwoBitQuantizationConfig,
-    ) -> Self {
+    pub fn train(vectors: &[&[f32]], dimension: usize, config: TwoBitQuantizationConfig) -> Self {
         assert!(!vectors.is_empty(), "need at least one vector to train");
         // Collect values per dimension and compute quartile boundaries
@@ -672,9 +802,7 @@ impl TwoBitQuantizer {
     /// Search for top-k candidates using approximate 2-bit dot products.
     /// Returns (index, approx_score) pairs sorted best-first.
     pub fn search(&self, query: &[f32], top_k: usize) -> Vec<(usize, i32)> {
-        let rescore_count = (top_k * self.config.rescore_multiplier)
-            .max(50)
-            .min(self.count);
+        let rescore_count = rescore_count(top_k, self.config.rescore_multiplier, self.count);
         let query_codes = self.quantize_vector(query);
         let mut scores: Vec<(usize, i32)> = (0..self.count)
@@ -691,8 +819,11 @@ impl TwoBitQuantizer {
         self.codes.clear();
         self.codes.reserve(vectors.len() * self.bytes_per_vector);
         for vector in vectors {
-            self.codes
-                .extend_from_slice(&quantize_two_bit(vector, &self.boundaries, self.bytes_per_vector));
+            self.codes.extend_from_slice(&quantize_two_bit(
+                vector,
+                &self.boundaries,
+                self.bytes_per_vector,
+            ));
         }
         self.count = vectors.len();
     }
@@ -824,9 +955,11 @@ impl MultiVectorQuantizedIndex {
     /// Search: returns candidate document indices sorted by approximate MaxSim.
     pub fn search(&self, query_tokens: &[&[f32]], top_k: usize) -> Vec<usize> {
-        let rescore_count = (top_k * self.quantizer.config.rescore_multiplier)
-            .max(50)
-            .min(self.doc_ranges.len());
+        let rescore_count = rescore_count(
+            top_k,
+            self.quantizer.config.rescore_multiplier,
+            self.doc_ranges.len(),
+        );
         if query_tokens.is_empty() || self.doc_ranges.is_empty() {
             return Vec::new();
         }
@@ -846,10 +979,7 @@ impl MultiVectorQuantizedIndex {
     }
     /// Rebuild from document token vectors (after loading parameters from disk).
-    pub fn rebuild(
-        &mut self,
-        doc_token_vectors: &[&[Vec<f32>]],
-    ) {
+    pub fn rebuild(&mut self, doc_token_vectors: &[&[Vec<f32>]]) {
         let all_tokens: Vec<&[f32]> = doc_token_vectors
             .iter()
             .flat_map(|tokens| tokens.iter().map(|v| v.as_slice()))
@@ -936,10 +1066,23 @@ impl QuantizedIndex {
     /// Search the quantized index. Returns candidate indices sorted by
     /// approximate similarity (best first), to be rescored with exact vectors.
     pub fn search_candidates(&self, query: &[f32], top_k: usize) -> Vec<usize> {
+        self.search_candidates_with_metric(query, top_k, DistanceMetric::Cosine)
+    }
+    /// Search the quantized index with the database metric.
+    /// Returns candidate indices sorted by approximate score (best first).
+    pub fn search_candidates_with_metric(
+        &self,
+        query: &[f32],
+        top_k: usize,
+        metric: DistanceMetric,
+    ) -> Vec<usize> {
         match self {
-            QuantizedIndex::Scalar(q) => {
-                q.search(query, top_k).into_iter().map(|(i, _)| i).collect()
-            }
+            QuantizedIndex::Scalar(q) => q
+                .search_with_metric(query, top_k, metric)
+                .into_iter()
+                .map(|(i, _)| i)
+                .collect(),
             QuantizedIndex::Binary(q) => {
                 q.search(query, top_k).into_iter().map(|(i, _)| i).collect()
             }
@@ -1020,6 +1163,14 @@ impl QuantizedIndex {
 // Internal helper functions
 // ---------------------------------------------------------------------------
+#[inline]
+fn rescore_count(top_k: usize, rescore_multiplier: usize, count: usize) -> usize {
+    top_k // result: max(top_k, 1) * max(rescore_multiplier, 1), capped at `count`
+        .max(1) // a top_k of 0 is treated as 1
+        .saturating_mul(rescore_multiplier.max(1)) // zero multiplier counts as 1; clamps at usize::MAX
+        .min(count) // never exceeds the `count` passed by the caller
+}
 /// Quantize a single f32 value to u8 using the given min and scale.
 #[inline]
 fn quantize_scalar(val: f32, min: f32, scale: f32) -> u8 {
@@ -1030,15 +1181,13 @@ fn quantize_scalar(val: f32, min: f32, scale: f32) -> u8 {
     }
 }
-/// Approximate dot product between two u8-quantized vectors.
-/// Higher value = more similar (analogous to cosine similarity for normalized vectors).
 #[inline]
-fn scalar_quantized_dot(a: &[u8], b: &[u8]) -> f32 {
-    let mut sum = 0i32;
-    for (&ai, &bi) in a.iter().zip(b.iter()) {
-        sum += (ai as i32) * (bi as i32);
+fn dequantize_scalar(code: u8, min: f32, scale: f32) -> f32 {
+    if scale == 0.0 {
+        min
+    } else {
+        min + (code as f32 / scale)
     }
-    sum as f32
 }
 /// Convert a float vector to a binary representation (1 bit per dimension).
@@ -1258,6 +1407,39 @@ mod tests {
         assert_eq!(results[0].1, 0); // Hamming distance 0
     }
+    #[test]
+    fn rescore_multiplier_controls_candidate_count_without_hidden_floor() {
+        let vectors = random_vectors(200, 64, 7); // presumably 200 vectors of dimension 64, seed 7 (helper not shown)
+        let refs: Vec<&[f32]> = vectors.iter().map(Vec::as_slice).collect(); // borrowed views for the quantizer APIs
+        let scalar = ScalarQuantizer::train(
+            &refs,
+            64,
+            ScalarQuantizationConfig {
+                rescore_multiplier: 1,
+            },
+        );
+        assert_eq!(scalar.search(&vectors[0], 10).len(), 10); // top_k 10 * multiplier 1, no minimum floor
+        let scalar = ScalarQuantizer::train(
+            &refs,
+            64,
+            ScalarQuantizationConfig {
+                rescore_multiplier: 4,
+            },
+        );
+        assert_eq!(scalar.search(&vectors[0], 10).len(), 40); // top_k 10 * multiplier 4
+        let mut binary = BinaryQuantizer::new(
+            64,
+            BinaryQuantizationConfig {
+                rescore_multiplier: 2,
+            },
+        );
+        binary.add_vectors(&refs);
+        assert_eq!(binary.search(&vectors[0], 10).len(), 20); // the binary quantizer follows the same rule: 10 * 2
+    }
     #[test]
     fn product_quantization_basic() {
         let vectors = random_vectors(200, 128, 42);
@@ -1520,7 +1702,10 @@ mod tests {
         for (a, b) in original.boundaries.iter().zip(restored.boundaries.iter()) {
             assert!((a - b).abs() < 1e-6);
         }
-        assert_eq!(original.config.rescore_multiplier, restored.config.rescore_multiplier);
+        assert_eq!(
+            original.config.rescore_multiplier,
+            restored.config.rescore_multiplier
+        );
     }
     #[test]

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "vectlite",
-  "version": "0.9.0",
+  "version": "0.9.2",
   "description": "Embedded vector store for local-first AI applications.",
   "main": "index.js",
   "types": "index.d.ts",

package/prebuilds/darwin-arm64/vectlite.node CHANGED Viewed

Binary file

package/prebuilds/darwin-x64/vectlite.node CHANGED Viewed

Binary file

package/prebuilds/linux-x64-gnu/vectlite.node CHANGED Viewed

Binary file

package/prebuilds/win32-x64-msvc/vectlite.node CHANGED Viewed

Binary file