nano-brain 2026.7.3 → 2026.7.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (2)
  1. package/package.json +1 -1
  2. package/src/embeddings.ts +40 -2
package/package.json CHANGED
@@ -1,6 +1,6 @@
 {
   "name": "nano-brain",
-  "version": "2026.7.3",
+  "version": "2026.7.4",
   "description": "Persistent memory and code intelligence for AI coding agents. Local MCP server with self-learning hybrid search (BM25 + vector + knowledge graph + LLM reranking), automatic session ingestion, codebase indexing, and 22 tools. Learns your preferences over time. Works with OpenCode, Claude, Cursor, Windsurf, and any MCP client.",
   "type": "module",
   "bin": {
package/src/embeddings.ts CHANGED
@@ -150,13 +150,13 @@ class OllamaEmbeddingProvider implements EmbeddingProvider {
     };
   }
 
-  async embedBatch(texts: string[]): Promise<EmbeddingResult[]> {
+  private async _sendBatch(inputs: string[]): Promise<EmbeddingResult[]> {
     const response = await fetch(`${this.url}/api/embed`, {
       method: 'POST',
       headers: { 'Content-Type': 'application/json' },
       body: JSON.stringify({
         model: this.model,
-        input: texts.map(t => this.truncate(t)),
+        input: inputs.map(t => this.truncate(t)),
       }),
       signal: AbortSignal.timeout(180000),
     });
@@ -176,6 +176,44 @@ class OllamaEmbeddingProvider implements EmbeddingProvider {
     }));
   }
 
+  async embedBatch(texts: string[]): Promise<EmbeddingResult[]> {
+    const MAX_CHARS_PER_BATCH = 100_000; // ~25K tokens safety margin
+    const MAX_ITEMS_PER_BATCH = 50; // Also limit item count
+    const results: EmbeddingResult[] = [];
+
+    // Split into sub-batches by cumulative character count
+    let currentBatch: string[] = [];
+    let currentChars = 0;
+    let batchCount = 0;
+
+    for (const text of texts) {
+      if (currentBatch.length > 0 &&
+          (currentChars + text.length > MAX_CHARS_PER_BATCH ||
+           currentBatch.length >= MAX_ITEMS_PER_BATCH)) {
+        batchCount++;
+        const embeddings = await this._sendBatch(currentBatch);
+        results.push(...embeddings);
+        currentBatch = [];
+        currentChars = 0;
+      }
+      currentBatch.push(text);
+      currentChars += text.length;
+    }
+
+    // Send remaining
+    if (currentBatch.length > 0) {
+      batchCount++;
+      const embeddings = await this._sendBatch(currentBatch);
+      results.push(...embeddings);
+    }
+
+    if (batchCount > 1) {
+      log('embed', `Ollama sub-batching: ${texts.length} items into ${batchCount} batches`);
+    }
+
+    return results;
+  }
+
   getDimensions(): number {
     return this.dimensions;
   }
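
In plain terms, 2026.7.4 renames the old single-request embedBatch to a private _sendBatch helper and adds a new embedBatch wrapper that splits its input into sub-batches of at most ~100,000 characters or 50 items (whichever limit is hit first) before calling Ollama's /api/embed, so oversized requests are no longer sent in one shot. A minimal standalone sketch of that splitting rule follows; the splitBatches helper, the sample inputs, and the expected output are illustrative only and not part of the package.

// Standalone sketch of the sub-batching rule used by the new embedBatch.
// The thresholds mirror the diff above; splitBatches and the sample data
// are hypothetical and do not appear in nano-brain itself.
const MAX_CHARS_PER_BATCH = 100_000; // ~25K tokens safety margin
const MAX_ITEMS_PER_BATCH = 50;

function splitBatches(texts: string[]): string[][] {
  const batches: string[][] = [];
  let current: string[] = [];
  let chars = 0;

  for (const text of texts) {
    // Flush the current batch before it would exceed either limit.
    if (current.length > 0 &&
        (chars + text.length > MAX_CHARS_PER_BATCH ||
         current.length >= MAX_ITEMS_PER_BATCH)) {
      batches.push(current);
      current = [];
      chars = 0;
    }
    current.push(text);
    chars += text.length;
  }
  if (current.length > 0) batches.push(current);
  return batches;
}

// Example: 120 texts of ~1,000 chars each stay under the character cap,
// so the 50-item cap triggers first and three /api/embed requests go out.
const sample = Array.from({ length: 120 }, () => 'x'.repeat(1_000));
console.log(splitBatches(sample).map(b => b.length)); // [50, 50, 20]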