npm - @juspay/neurolink - Versions diffs - 9.15.0 → 9.16.0 - Mend

@juspay/neurolink 9.15.0 → 9.16.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (193)

package/CHANGELOG.md +6 -0
package/dist/adapters/video/videoAnalyzer.d.ts +1 -1
package/dist/adapters/video/videoAnalyzer.js +10 -8
package/dist/cli/commands/setup-anthropic.js +1 -14
package/dist/cli/commands/setup-azure.js +1 -12
package/dist/cli/commands/setup-bedrock.js +1 -9
package/dist/cli/commands/setup-google-ai.js +1 -12
package/dist/cli/commands/setup-openai.js +1 -14
package/dist/cli/commands/workflow.d.ts +27 -0
package/dist/cli/commands/workflow.js +216 -0
package/dist/cli/factories/commandFactory.js +79 -20
package/dist/cli/index.js +0 -1
package/dist/cli/parser.js +4 -1
package/dist/cli/utils/maskCredential.d.ts +11 -0
package/dist/cli/utils/maskCredential.js +23 -0
package/dist/constants/contextWindows.js +107 -16
package/dist/constants/enums.d.ts +99 -15
package/dist/constants/enums.js +152 -22
package/dist/context/budgetChecker.js +1 -1
package/dist/context/contextCompactor.js +31 -4
package/dist/context/emergencyTruncation.d.ts +21 -0
package/dist/context/emergencyTruncation.js +88 -0
package/dist/context/errorDetection.d.ts +16 -0
package/dist/context/errorDetection.js +48 -1
package/dist/context/errors.d.ts +19 -0
package/dist/context/errors.js +21 -0
package/dist/context/stages/slidingWindowTruncator.d.ts +6 -0
package/dist/context/stages/slidingWindowTruncator.js +159 -24
package/dist/core/baseProvider.js +306 -200
package/dist/core/conversationMemoryManager.js +104 -61
package/dist/core/evaluationProviders.js +16 -33
package/dist/core/factory.js +237 -164
package/dist/core/modules/GenerationHandler.js +175 -116
package/dist/core/modules/MessageBuilder.js +222 -170
package/dist/core/modules/StreamHandler.d.ts +1 -0
package/dist/core/modules/StreamHandler.js +95 -27
package/dist/core/modules/TelemetryHandler.d.ts +10 -1
package/dist/core/modules/TelemetryHandler.js +25 -7
package/dist/core/modules/ToolsManager.js +115 -191
package/dist/core/redisConversationMemoryManager.js +418 -282
package/dist/factories/providerRegistry.d.ts +5 -0
package/dist/factories/providerRegistry.js +20 -2
package/dist/index.d.ts +2 -2
package/dist/index.js +4 -2
package/dist/lib/adapters/video/videoAnalyzer.d.ts +1 -1
package/dist/lib/adapters/video/videoAnalyzer.js +10 -8
package/dist/lib/constants/contextWindows.js +107 -16
package/dist/lib/constants/enums.d.ts +99 -15
package/dist/lib/constants/enums.js +152 -22
package/dist/lib/context/budgetChecker.js +1 -1
package/dist/lib/context/contextCompactor.js +31 -4
package/dist/lib/context/emergencyTruncation.d.ts +21 -0
package/dist/lib/context/emergencyTruncation.js +89 -0
package/dist/lib/context/errorDetection.d.ts +16 -0
package/dist/lib/context/errorDetection.js +48 -1
package/dist/lib/context/errors.d.ts +19 -0
package/dist/lib/context/errors.js +22 -0
package/dist/lib/context/stages/slidingWindowTruncator.d.ts +6 -0
package/dist/lib/context/stages/slidingWindowTruncator.js +159 -24
package/dist/lib/core/baseProvider.js +306 -200
package/dist/lib/core/conversationMemoryManager.js +104 -61
package/dist/lib/core/evaluationProviders.js +16 -33
package/dist/lib/core/factory.js +237 -164
package/dist/lib/core/modules/GenerationHandler.js +175 -116
package/dist/lib/core/modules/MessageBuilder.js +222 -170
package/dist/lib/core/modules/StreamHandler.d.ts +1 -0
package/dist/lib/core/modules/StreamHandler.js +95 -27
package/dist/lib/core/modules/TelemetryHandler.d.ts +10 -1
package/dist/lib/core/modules/TelemetryHandler.js +25 -7
package/dist/lib/core/modules/ToolsManager.js +115 -191
package/dist/lib/core/redisConversationMemoryManager.js +418 -282
package/dist/lib/factories/providerRegistry.d.ts +5 -0
package/dist/lib/factories/providerRegistry.js +20 -2
package/dist/lib/index.d.ts +2 -2
package/dist/lib/index.js +4 -2
package/dist/lib/mcp/externalServerManager.js +66 -0
package/dist/lib/mcp/mcpCircuitBreaker.js +24 -0
package/dist/lib/mcp/mcpClientFactory.js +16 -0
package/dist/lib/mcp/toolDiscoveryService.js +32 -6
package/dist/lib/mcp/toolRegistry.js +193 -123
package/dist/lib/neurolink.d.ts +6 -0
package/dist/lib/neurolink.js +1162 -646
package/dist/lib/providers/amazonBedrock.d.ts +1 -1
package/dist/lib/providers/amazonBedrock.js +521 -319
package/dist/lib/providers/anthropic.js +73 -17
package/dist/lib/providers/anthropicBaseProvider.js +77 -17
package/dist/lib/providers/googleAiStudio.d.ts +1 -1
package/dist/lib/providers/googleAiStudio.js +292 -227
package/dist/lib/providers/googleVertex.d.ts +36 -1
package/dist/lib/providers/googleVertex.js +553 -260
package/dist/lib/providers/ollama.js +329 -278
package/dist/lib/providers/openAI.js +77 -19
package/dist/lib/providers/sagemaker/parsers.js +3 -3
package/dist/lib/providers/sagemaker/streaming.js +3 -3
package/dist/lib/proxy/proxyFetch.js +81 -48
package/dist/lib/rag/ChunkerFactory.js +1 -1
package/dist/lib/rag/chunkers/MarkdownChunker.d.ts +22 -0
package/dist/lib/rag/chunkers/MarkdownChunker.js +213 -9
package/dist/lib/rag/chunking/markdownChunker.d.ts +16 -0
package/dist/lib/rag/chunking/markdownChunker.js +174 -2
package/dist/lib/rag/pipeline/contextAssembly.js +2 -1
package/dist/lib/rag/ragIntegration.d.ts +18 -1
package/dist/lib/rag/ragIntegration.js +94 -14
package/dist/lib/rag/retrieval/vectorQueryTool.js +21 -4
package/dist/lib/server/abstract/baseServerAdapter.js +4 -1
package/dist/lib/server/adapters/fastifyAdapter.js +35 -30
package/dist/lib/services/server/ai/observability/instrumentation.d.ts +32 -0
package/dist/lib/services/server/ai/observability/instrumentation.js +39 -0
package/dist/lib/telemetry/attributes.d.ts +52 -0
package/dist/lib/telemetry/attributes.js +61 -0
package/dist/lib/telemetry/index.d.ts +3 -0
package/dist/lib/telemetry/index.js +3 -0
package/dist/lib/telemetry/telemetryService.d.ts +6 -0
package/dist/lib/telemetry/telemetryService.js +6 -0
package/dist/lib/telemetry/tracers.d.ts +15 -0
package/dist/lib/telemetry/tracers.js +17 -0
package/dist/lib/telemetry/withSpan.d.ts +9 -0
package/dist/lib/telemetry/withSpan.js +35 -0
package/dist/lib/types/contextTypes.d.ts +10 -0
package/dist/lib/types/streamTypes.d.ts +14 -0
package/dist/lib/utils/conversationMemory.js +121 -82
package/dist/lib/utils/logger.d.ts +5 -0
package/dist/lib/utils/logger.js +50 -2
package/dist/lib/utils/messageBuilder.js +22 -42
package/dist/lib/utils/modelDetection.js +3 -3
package/dist/lib/utils/providerRetry.d.ts +41 -0
package/dist/lib/utils/providerRetry.js +114 -0
package/dist/lib/utils/retryability.d.ts +14 -0
package/dist/lib/utils/retryability.js +23 -0
package/dist/lib/utils/sanitizers/svg.js +4 -5
package/dist/lib/utils/tokenEstimation.d.ts +11 -1
package/dist/lib/utils/tokenEstimation.js +19 -4
package/dist/lib/utils/videoAnalysisProcessor.js +7 -3
package/dist/mcp/externalServerManager.js +66 -0
package/dist/mcp/mcpCircuitBreaker.js +24 -0
package/dist/mcp/mcpClientFactory.js +16 -0
package/dist/mcp/toolDiscoveryService.js +32 -6
package/dist/mcp/toolRegistry.js +193 -123
package/dist/neurolink.d.ts +6 -0
package/dist/neurolink.js +1162 -646
package/dist/providers/amazonBedrock.d.ts +1 -1
package/dist/providers/amazonBedrock.js +521 -319
package/dist/providers/anthropic.js +73 -17
package/dist/providers/anthropicBaseProvider.js +77 -17
package/dist/providers/googleAiStudio.d.ts +1 -1
package/dist/providers/googleAiStudio.js +292 -227
package/dist/providers/googleVertex.d.ts +36 -1
package/dist/providers/googleVertex.js +553 -260
package/dist/providers/ollama.js +329 -278
package/dist/providers/openAI.js +77 -19
package/dist/providers/sagemaker/parsers.js +3 -3
package/dist/providers/sagemaker/streaming.js +3 -3
package/dist/proxy/proxyFetch.js +81 -48
package/dist/rag/ChunkerFactory.js +1 -1
package/dist/rag/chunkers/MarkdownChunker.d.ts +22 -0
package/dist/rag/chunkers/MarkdownChunker.js +213 -9
package/dist/rag/chunking/markdownChunker.d.ts +16 -0
package/dist/rag/chunking/markdownChunker.js +174 -2
package/dist/rag/pipeline/contextAssembly.js +2 -1
package/dist/rag/ragIntegration.d.ts +18 -1
package/dist/rag/ragIntegration.js +94 -14
package/dist/rag/retrieval/vectorQueryTool.js +21 -4
package/dist/server/abstract/baseServerAdapter.js +4 -1
package/dist/server/adapters/fastifyAdapter.js +35 -30
package/dist/services/server/ai/observability/instrumentation.d.ts +32 -0
package/dist/services/server/ai/observability/instrumentation.js +39 -0
package/dist/telemetry/attributes.d.ts +52 -0
package/dist/telemetry/attributes.js +60 -0
package/dist/telemetry/index.d.ts +3 -0
package/dist/telemetry/index.js +3 -0
package/dist/telemetry/telemetryService.d.ts +6 -0
package/dist/telemetry/telemetryService.js +6 -0
package/dist/telemetry/tracers.d.ts +15 -0
package/dist/telemetry/tracers.js +16 -0
package/dist/telemetry/withSpan.d.ts +9 -0
package/dist/telemetry/withSpan.js +34 -0
package/dist/types/contextTypes.d.ts +10 -0
package/dist/types/streamTypes.d.ts +14 -0
package/dist/utils/conversationMemory.js +121 -82
package/dist/utils/logger.d.ts +5 -0
package/dist/utils/logger.js +50 -2
package/dist/utils/messageBuilder.js +22 -42
package/dist/utils/modelDetection.js +3 -3
package/dist/utils/providerRetry.d.ts +41 -0
package/dist/utils/providerRetry.js +113 -0
package/dist/utils/retryability.d.ts +14 -0
package/dist/utils/retryability.js +22 -0
package/dist/utils/sanitizers/svg.js +4 -5
package/dist/utils/tokenEstimation.d.ts +11 -1
package/dist/utils/tokenEstimation.js +19 -4
package/dist/utils/videoAnalysisProcessor.js +7 -3
package/dist/workflow/config.d.ts +26 -26
package/package.json +1 -1

package/dist/rag/chunking/markdownChunker.d.ts CHANGED Viewed

@@ -14,6 +14,22 @@ export declare class MarkdownChunker implements Chunker {
     chunk(text: string, config?: MarkdownChunkerConfig): Promise<Chunk[]>;
     private splitByHeaders;
     private splitContent;
+    /**
+     * Detect contiguous table blocks in lines.
+     * Returns array of { start, end } line index ranges (inclusive).
+     */
+    private detectTableRanges;
+    /** Check if a line is a markdown table separator (e.g. |---|---|). */
+    private isTableSeparator;
+    /**
+     * Split content while preserving markdown tables.
+     */
+    private splitContentTableAware;
+    /**
+     * Split a table on row boundaries, repeating header + separator in each chunk.
+     */
+    private splitTableByRows;
+    private splitPlainContent;
     private stripMarkdown;
     validateConfig(config: BaseChunkerConfig): ChunkerValidationResult;
 }

package/dist/rag/chunking/markdownChunker.js CHANGED Viewed

@@ -129,10 +129,182 @@ export class MarkdownChunker {
         if (content.length <= effectiveMaxSize) {
             return [content];
         }
+        // Use table-aware splitting
+        const lines = content.split("\n");
+        const tableRanges = this.detectTableRanges(lines);
+        if (tableRanges.length > 0) {
+            return this.splitContentTableAware(content, lines, tableRanges, effectiveMaxSize, effectiveOverlap);
+        }
+        return this.splitPlainContent(content, effectiveMaxSize, effectiveOverlap);
+    }
+    /**
+     * Detect contiguous table blocks in lines.
+     * Returns array of { start, end } line index ranges (inclusive).
+     */
+    detectTableRanges(lines) {
+        // Simple pipe-prefixed line check (single character class — no backtracking)
+        const TABLE_ROW_RE = /^\|[^\r\n]{1,10000}/;
+        // Per-cell separator regex applied AFTER splitting on "|" — safe because
+        // each cell is short and bounded by pipe delimiters (CodeQL: js/polynomial-redos)
+        const SEPARATOR_CELL_RE = /^[\t ]*:?-+:?[\t ]*$/;
+        const ranges = [];
+        let i = 0;
+        while (i < lines.length) {
+            if (i + 1 < lines.length &&
+                TABLE_ROW_RE.test(lines[i]) &&
+                this.isTableSeparator(lines[i + 1], SEPARATOR_CELL_RE)) {
+                const start = i;
+                i += 2;
+                while (i < lines.length && TABLE_ROW_RE.test(lines[i])) {
+                    i++;
+                }
+                ranges.push({ start, end: i - 1 });
+            }
+            else {
+                i++;
+            }
+        }
+        return ranges;
+    }
+    /** Check if a line is a markdown table separator (e.g. |---|---|). */
+    isTableSeparator(line, cellRe) {
+        const trimmed = line.trimEnd();
+        if (!trimmed.startsWith("|")) {
+            return false;
+        }
+        // Split by "|" → ["", "---", "---", ""] for "|---|---|"
+        const cells = trimmed.split("|");
+        cells.shift(); // remove leading empty element
+        if (cells.length > 0 && cells[cells.length - 1].trim() === "") {
+            cells.pop(); // remove trailing empty element
+        }
+        if (cells.length === 0) {
+            return false;
+        }
+        return cells.every((cell) => cellRe.test(cell));
+    }
+    /**
+     * Split content while preserving markdown tables.
+     */
+    splitContentTableAware(content, lines, tableRanges, maxSize, overlap) {
+        // Build segments: alternating non-table and table blocks
+        const segments = [];
+        let lineIdx = 0;
+        for (const range of tableRanges) {
+            if (lineIdx < range.start) {
+                const text = lines.slice(lineIdx, range.start).join("\n").trim();
+                if (text) {
+                    segments.push({ text, isTable: false });
+                }
+            }
+            const tableText = lines.slice(range.start, range.end + 1).join("\n");
+            segments.push({ text: tableText, isTable: true });
+            lineIdx = range.end + 1;
+        }
+        if (lineIdx < lines.length) {
+            const text = lines.slice(lineIdx).join("\n").trim();
+            if (text) {
+                segments.push({ text, isTable: false });
+            }
+        }
+        const result = [];
+        let current = "";
+        for (const seg of segments) {
+            if (!seg.isTable) {
+                const pieces = this.splitPlainContent(seg.text, maxSize, overlap);
+                for (const piece of pieces) {
+                    if (current.length === 0) {
+                        current = piece;
+                    }
+                    else if (current.length + 1 + piece.length <= maxSize) {
+                        current += "\n" + piece;
+                    }
+                    else {
+                        result.push(current);
+                        current = piece;
+                    }
+                }
+            }
+            else {
+                if (seg.text.length <= maxSize) {
+                    if (current.length === 0) {
+                        current = seg.text;
+                    }
+                    else if (current.length + 2 + seg.text.length <= maxSize) {
+                        current += "\n\n" + seg.text;
+                    }
+                    else {
+                        result.push(current);
+                        current = seg.text;
+                    }
+                }
+                else {
+                    if (current) {
+                        result.push(current);
+                        current = "";
+                    }
+                    const tableChunks = this.splitTableByRows(seg.text, maxSize);
+                    result.push(...tableChunks);
+                }
+            }
+        }
+        if (current) {
+            result.push(current);
+        }
+        return result.length > 0 ? result : [content];
+    }
+    /**
+     * Split a table on row boundaries, repeating header + separator in each chunk.
+     */
+    splitTableByRows(tableText, maxSize) {
+        const rows = tableText.split("\n");
+        if (rows.length < 3) {
+            return [tableText];
+        }
+        const headerRow = rows[0];
+        const separatorRow = rows[1];
+        const headerBlock = headerRow + "\n" + separatorRow;
+        const dataRows = rows.slice(2);
+        if (headerBlock.length > maxSize) {
+            return this.splitPlainContent(tableText, maxSize, 0);
+        }
+        const chunks = [];
+        let currentChunk = headerBlock;
+        for (const row of dataRows) {
+            // Guard: single row exceeds budget — flush and emit as standalone chunk
+            const singleRowChunk = `${headerBlock}\n${row}`;
+            if (singleRowChunk.length > maxSize) {
+                if (currentChunk.length > headerBlock.length) {
+                    chunks.push(currentChunk);
+                }
+                chunks.push(singleRowChunk);
+                currentChunk = headerBlock;
+                continue;
+            }
+            const candidate = currentChunk + "\n" + row;
+            if (candidate.length <= maxSize) {
+                currentChunk = candidate;
+            }
+            else {
+                if (currentChunk.length > headerBlock.length) {
+                    chunks.push(currentChunk);
+                }
+                currentChunk = headerBlock + "\n" + row;
+            }
+        }
+        if (currentChunk.length > headerBlock.length) {
+            chunks.push(currentChunk);
+        }
+        return chunks.length > 0 ? chunks : [tableText];
+    }
+    splitPlainContent(content, maxSize, overlap) {
+        if (content.length <= maxSize) {
+            return [content];
+        }
         const chunks = [];
         let start = 0;
         while (start < content.length) {
-            let end = Math.min(start + effectiveMaxSize, content.length);
+            let end = Math.min(start + maxSize, content.length);
             // Try to break at a paragraph or sentence boundary
             if (end < content.length) {
                 const searchStart = Math.max(start, end - 200);
@@ -151,7 +323,7 @@ export class MarkdownChunker {
                 }
             }
             chunks.push(content.slice(start, end));
-            start = Math.max(start + 1, end - effectiveOverlap);
+            start = Math.max(start + 1, end - overlap);
         }
         return chunks;
     }

package/dist/rag/pipeline/contextAssembly.js CHANGED Viewed

@@ -12,6 +12,7 @@
  * - Context summarization
  */
 import { logger } from "../../utils/logger.js";
+import { estimateTokens } from "../../utils/tokenEstimation.js";
 /**
  * Assemble context from retrieved results
  *
@@ -184,7 +185,7 @@ export function createContextWindow(results, options) {
         text,
         chunkCount,
         charCount: text.length,
-        tokenCount: Math.ceil(text.length / 4),
+        tokenCount: estimateTokens(text),
         truncatedChunks,
         citations,
     };

package/dist/rag/ragIntegration.d.ts CHANGED Viewed

@@ -7,7 +7,20 @@
  * so developers only need to pass `rag: { files: [...] }`.
  */
 import type { Tool } from "ai";
-import type { RAGConfig } from "./types.js";
+import type { RAGConfig, VectorQueryResult } from "./types.js";
+/**
+ * Generate deterministic embeddings for chunks.
+ * Combines character-frequency (40%) with word-level hash features (60%)
+ * for better semantic discrimination than pure character frequency.
+ * When a real embedding provider is configured, it will be used instead.
+ */
+declare function generateSimpleEmbedding(text: string, dimension: number): number[];
+/**
+ * Diversify retrieval results via round-robin across source files.
+ * Ensures at least one chunk per source file appears in the top-K results,
+ * preventing any single file from dominating retrieval.
+ */
+declare function diversifyResults(results: VectorQueryResult[], topK: number): VectorQueryResult[];
 /**
  * Result of preparing RAG for a generate/stream call
  */
@@ -36,3 +49,7 @@ export type RAGPreparedTool = {
  * @returns Prepared RAG tool to inject into the tools record
  */
 export declare function prepareRAGTool(ragConfig: RAGConfig, fallbackProvider?: string): Promise<RAGPreparedTool>;
+/** @internal Exported for testing only */
+export { generateSimpleEmbedding as _generateSimpleEmbedding };
+/** @internal Exported for testing only */
+export { diversifyResults as _diversifyResults };

package/dist/rag/ragIntegration.js CHANGED Viewed

@@ -10,7 +10,7 @@ import { existsSync, readFileSync } from "fs";
 import { extname, resolve } from "path";
 import { z } from "zod";
 import { logger } from "../utils/logger.js";
-import { ChunkerRegistry } from "./chunking/index.js";
+import { createChunker } from "./ChunkerFactory.js";
 import { createVectorQueryTool, InMemoryVectorStore, } from "./retrieval/vectorQueryTool.js";
 /**
  * Maps file extensions to recommended chunking strategies
@@ -48,27 +48,91 @@ function detectStrategy(filePath) {
     const ext = extname(filePath).toLowerCase();
     return EXTENSION_TO_STRATEGY[ext] || "recursive";
 }
+/**
+ * Simple hash function for strings (FNV-1a variant).
+ * Maps a word to a bucket index deterministically.
+ */
+function hashWord(word, buckets) {
+    let hash = 2166136261;
+    for (let i = 0; i < word.length; i++) {
+        hash ^= word.charCodeAt(i);
+        hash = (hash * 16777619) >>> 0;
+    }
+    return hash % buckets;
+}
 /**
  * Generate deterministic embeddings for chunks.
- * Uses a simple hash-based approach for the in-memory vector store.
+ * Combines character-frequency (40%) with word-level hash features (60%)
+ * for better semantic discrimination than pure character frequency.
  * When a real embedding provider is configured, it will be used instead.
  */
 function generateSimpleEmbedding(text, dimension) {
-    const embedding = new Array(dimension).fill(0);
-    // Simple character-frequency based embedding
+    const charEmbedding = new Array(dimension).fill(0);
+    const wordEmbedding = new Array(dimension).fill(0);
+    // Character-frequency features
     for (let i = 0; i < text.length; i++) {
         const charCode = text.charCodeAt(i);
         const idx = charCode % dimension;
-        embedding[idx] += 1;
+        charEmbedding[idx] += 1;
+    }
+    // Word-level hash features (TF-IDF-like)
+    const words = text
+        .toLowerCase()
+        .replace(/[^a-z0-9\s]/g, "")
+        .split(/\s+/)
+        .filter((w) => w.length > 1);
+    for (const word of words) {
+        const idx = hashWord(word, dimension);
+        wordEmbedding[idx] += 1;
+    }
+    // Combine: 40% character, 60% word
+    const combined = new Array(dimension);
+    for (let i = 0; i < dimension; i++) {
+        combined[i] = 0.4 * charEmbedding[i] + 0.6 * wordEmbedding[i];
     }
     // Normalize to unit vector
-    const magnitude = Math.sqrt(embedding.reduce((sum, v) => sum + v * v, 0));
+    const magnitude = Math.sqrt(combined.reduce((sum, v) => sum + v * v, 0));
     if (magnitude > 0) {
         for (let i = 0; i < dimension; i++) {
-            embedding[i] /= magnitude;
+            combined[i] /= magnitude;
         }
     }
-    return embedding;
+    return combined;
+}
+/**
+ * Diversify retrieval results via round-robin across source files.
+ * Ensures at least one chunk per source file appears in the top-K results,
+ * preventing any single file from dominating retrieval.
+ */
+function diversifyResults(results, topK) {
+    // Group by source file
+    const byFile = new Map();
+    for (const r of results) {
+        const source = r.metadata?.source || "unknown";
+        if (!byFile.has(source)) {
+            byFile.set(source, []);
+        }
+        const sourceGroup = byFile.get(source);
+        if (sourceGroup) {
+            sourceGroup.push(r);
+        }
+    }
+    // If only one source file, no diversification needed
+    if (byFile.size <= 1) {
+        return results.slice(0, topK);
+    }
+    // Round-robin selection from each source file group
+    const diversified = [];
+    const iterators = [...byFile.values()].map((arr) => ({ arr, idx: 0 }));
+    while (diversified.length < topK &&
+        iterators.some((it) => it.idx < it.arr.length)) {
+        for (const it of iterators) {
+            if (it.idx < it.arr.length && diversified.length < topK) {
+                diversified.push(it.arr[it.idx++]);
+            }
+        }
+    }
+    return diversified;
 }
 /**
  * Prepare RAG tools from the provided configuration.
@@ -85,7 +149,7 @@ function generateSimpleEmbedding(text, dimension) {
  * @returns Prepared RAG tool to inject into the tools record
  */
 export async function prepareRAGTool(ragConfig, fallbackProvider) {
-    const { files, strategy: userStrategy, chunkSize = 1000, chunkOverlap = 200, topK = 5, toolName = "search_knowledge_base", toolDescription = "REQUIRED: Search through pre-loaded local documents to find relevant information. Use this tool FIRST before any web search or other tools. This searches an indexed knowledge base of documents the user has provided.", embeddingProvider, embeddingModel, } = ragConfig;
+    const { files, strategy: userStrategy, chunkSize = 1000, chunkOverlap = 200, topK: userTopK = 5, toolName = "search_knowledge_base", toolDescription = "REQUIRED: Search through pre-loaded local documents to find relevant information. Use this tool FIRST before any web search or other tools. This searches an indexed knowledge base of documents the user has provided.", embeddingProvider, embeddingModel, } = ragConfig;
     if (!files || files.length === 0) {
         throw new Error("RAG config requires at least one file path in 'files'");
     }
@@ -106,6 +170,11 @@ export async function prepareRAGTool(ragConfig, fallbackProvider) {
             logger.warn(`[RAG] Failed to read file: ${resolvedPath}: ${error instanceof Error ? error.message : String(error)}`);
         }
     }
+    // Auto-increase topK for multi-file scenarios to ensure coverage
+    // (computed after loading so it reflects only files that actually exist)
+    const topK = fileContents.length > 1
+        ? Math.max(userTopK, fileContents.length * 3)
+        : userTopK;
     if (fileContents.length === 0) {
         throw new Error("RAG: No files could be loaded. Check that file paths exist and are readable.");
     }
@@ -114,10 +183,11 @@ export async function prepareRAGTool(ragConfig, fallbackProvider) {
     const allChunks = [];
     for (const { path, content, strategy } of fileContents) {
         try {
-            const chunker = ChunkerRegistry.get(strategy);
-            const chunks = await chunker.chunk(content, {
+            const chunker = await createChunker(strategy, {
                 maxSize: chunkSize,
-                overlap: chunkOverlap,
+                overlap: Math.min(chunkOverlap, Math.floor(chunkSize * 0.5)),
+            });
+            const chunks = await chunker.chunk(content, {
                 metadata: { source: path },
             });
             for (const chunk of chunks) {
@@ -175,11 +245,17 @@ export async function prepareRAGTool(ragConfig, fallbackProvider) {
             // For the in-memory store with simple embeddings,
             // generate a query embedding using the same method
             const queryEmbedding = generateSimpleEmbedding(query, EMBEDDING_DIMENSION);
-            const results = await vectorStore.query({
+            // Fetch more candidates than needed so diversity can select across files
+            const fetchK = fileContents.length > 1 ? topK * 3 : topK;
+            const rawResults = await vectorStore.query({
                 indexName,
                 queryVector: queryEmbedding,
-                topK,
+                topK: fetchK,
             });
+            // Apply source-file diversity for multi-file RAG
+            const results = fileContents.length > 1
+                ? diversifyResults(rawResults, topK)
+                : rawResults.slice(0, topK);
             if (results.length === 0) {
                 return {
                     relevantContext: "No relevant documents found for the query.",
@@ -209,3 +285,7 @@ export async function prepareRAGTool(ragConfig, fallbackProvider) {
         filesLoaded: fileContents.length,
     };
 }
+/** @internal Exported for testing only */
+export { generateSimpleEmbedding as _generateSimpleEmbedding };
+/** @internal Exported for testing only */
+export { diversifyResults as _diversifyResults };

package/dist/rag/retrieval/vectorQueryTool.js CHANGED Viewed

@@ -253,10 +253,27 @@ export class InMemoryVectorStore {
                             !fieldValue.includes(ops.$contains))) {
                         return false;
                     }
-                    if ("$regex" in ops &&
-                        (typeof fieldValue !== "string" ||
-                            !new RegExp(ops.$regex).test(fieldValue))) {
-                        return false;
+                    if ("$regex" in ops) {
+                        const pattern = ops.$regex;
+                        let regexMatches = false;
+                        // Guard against ReDoS: reject excessively long patterns and limit
+                        // the tested string length to prevent pathological backtracking.
+                        if (pattern.length <= 200) {
+                            try {
+                                const re = new RegExp(pattern);
+                                const testValue = typeof fieldValue === "string"
+                                    ? fieldValue.slice(0, 10_000)
+                                    : "";
+                                regexMatches = re.test(testValue);
+                            }
+                            catch {
+                                // Invalid regex pattern — treat as non-match
+                                regexMatches = false;
+                            }
+                        }
+                        if (!regexMatches) {
+                            return false;
+                        }
                     }
                 }
                 else {

package/dist/server/abstract/baseServerAdapter.js CHANGED Viewed

@@ -166,7 +166,10 @@ export class BaseServerAdapter extends EventEmitter {
         }
         // Register all routes in the group with prefix applied
         for (const route of group.routes) {
-            const prefixedPath = this.normalizePath(`${group.prefix}${route.path}`);
+            // Only prepend prefix if route path doesn't already start with it
+            // (route definitions include full paths like /api/agent/execute)
+            const needsPrefix = !route.path.startsWith(group.prefix);
+            const prefixedPath = this.normalizePath(needsPrefix ? `${group.prefix}${route.path}` : route.path);
             const prefixedRoute = {
                 ...route,
                 path: prefixedPath,

package/dist/server/adapters/fastifyAdapter.js CHANGED Viewed

@@ -5,6 +5,7 @@
  */
 import { logger } from "../../utils/logger.js";
 import { AlreadyRunningError, ServerStartError, ServerStopError, wrapError, } from "../errors.js";
+import { withTimeout } from "../../utils/errorHandling.js";
 import { BaseServerAdapter } from "../abstract/baseServerAdapter.js";
 import { isErrorResponse } from "../utils/validation.js";
 /**
@@ -12,7 +13,7 @@ import { isErrorResponse } from "../utils/validation.js";
  * Provides high-performance HTTP server with schema validation
  */
 export class FastifyServerAdapter extends BaseServerAdapter {
-    app;
+    app = null;
     frameworkInitialized = false;
     constructor(neurolink, config = {}) {
         super(neurolink, config);
@@ -174,7 +175,15 @@ export class FastifyServerAdapter extends BaseServerAdapter {
      * Register route with Fastify
      */
     registerFrameworkRoute(route) {
+        if (!this.app) {
+            throw new Error("Fastify app not initialized. Call initialize() before registering routes.");
+        }
         const method = route.method.toUpperCase();
+        // Fastify does not allow duplicate method+path registrations.
+        // Skip if route already exists (e.g., built-in health routes).
+        if (this.app.hasRoute({ method, url: route.path })) {
+            return;
+        }
         this.app.route({
             method,
             url: route.path,
@@ -307,6 +316,9 @@ export class FastifyServerAdapter extends BaseServerAdapter {
      * Register middleware with Fastify
      */
     registerFrameworkMiddleware(middleware) {
+        if (!this.app) {
+            throw new Error("Fastify app not initialized. Call initialize() before registering middleware.");
+        }
         this.app.addHook("preHandler", async (request, _reply) => {
             // Skip excluded paths
             if (middleware.excludePaths?.some((p) => request.url.startsWith(p))) {
@@ -357,50 +369,39 @@ export class FastifyServerAdapter extends BaseServerAdapter {
         if (this.isRunning) {
             throw new AlreadyRunningError(this.config.port, this.config.host);
         }
+        if (!this.app) {
+            throw new Error("Fastify app not initialized. Call initialize() before starting.");
+        }
+        // Capture non-null reference for use in closures below
+        const app = this.app;
         this.lifecycleState = "starting";
         const { port, host } = this.config;
         const startupTimeout = this.config.timeout || 30000;
-        const startPromise = (async () => {
-            await this.app.listen({ port, host });
+        // Track connections via Fastify hooks (must be registered before listen)
+        app.addHook("onRequest", async (request) => {
+            const connectionId = `conn-${request.id}`;
+            this.trackConnection(connectionId, request.raw.socket, request.id);
+        });
+        app.addHook("onResponse", async (request) => {
+            const connectionId = `conn-${request.id}`;
+            this.untrackConnection(connectionId);
+        });
+        try {
+            await withTimeout(app.listen({ port, host }), startupTimeout, new ServerStartError(`Fastify server startup timed out after ${startupTimeout}ms`, undefined, port, host));
             this.isRunning = true;
             this.startTime = new Date();
             this.lifecycleState = "running";
-            // Track connections via Fastify hooks
-            this.app.addHook("onRequest", async (request) => {
-                const connectionId = `conn-${request.id}`;
-                this.trackConnection(connectionId, request.raw.socket, request.id);
-            });
-            this.app.addHook("onResponse", async (request) => {
-                const connectionId = `conn-${request.id}`;
-                this.untrackConnection(connectionId);
-            });
             logger.info(`[FastifyAdapter] Server started on ${host}:${port}`);
             this.emit("started", {
                 port,
                 host,
                 timestamp: this.startTime,
             });
-        })();
-        let startupTimer;
-        const timeoutPromise = new Promise((_, reject) => {
-            startupTimer = setTimeout(() => {
-                this.lifecycleState = "error";
-                reject(new ServerStartError(`Fastify server startup timed out after ${startupTimeout}ms`, undefined, port, host));
-            }, startupTimeout);
-        });
-        try {
-            await Promise.race([startPromise, timeoutPromise]);
         }
         catch (error) {
             this.lifecycleState = "error";
             throw error;
         }
-        finally {
-            // Always clear the timeout to prevent memory leak
-            if (startupTimer) {
-                clearTimeout(startupTimer);
-            }
-        }
     }
     /**
      * Stop the Fastify server with graceful shutdown
@@ -421,6 +422,7 @@ export class FastifyServerAdapter extends BaseServerAdapter {
             // Reset state for restart capability
             this.resetServerState();
             this.frameworkInitialized = false;
+            this.app = null;
         }
         catch (error) {
             const wrappedError = wrapError(error);
@@ -441,7 +443,10 @@ export class FastifyServerAdapter extends BaseServerAdapter {
      * Close the underlying server
      */
     async closeServer() {
-        await this.app.close();
+        if (this.app) {
+            const closeTimeout = this.shutdownConfig.gracefulShutdownTimeoutMs;
+            await withTimeout(this.app.close(), closeTimeout, new Error(`Fastify server close timed out after ${closeTimeout}ms`));
+        }
     }
     /**
      * Force close all active connections
@@ -451,7 +456,7 @@ export class FastifyServerAdapter extends BaseServerAdapter {
             count: this.activeConnections.size,
         });
         // Get the underlying server and destroy all sockets
-        const server = this.app.server;
+        const server = this.app?.server;
         if (server) {
             // Force close by destroying the server
             server.closeAllConnections?.();

package/dist/services/server/ai/observability/instrumentation.d.ts CHANGED Viewed

@@ -177,6 +177,38 @@ export declare function setLangfuseContext<T = void>(context: {
  * console.log(context?.userId, context?.sessionId);
  */
 export declare function getLangfuseContext(): LangfuseContext | undefined;
+/**
+ * Capture the current Langfuse AsyncLocalStorage context and return a wrapper
+ * that re-enters that context when executing the provided callback.
+ *
+ * This is essential for preserving trace context across async boundaries that
+ * break the automatic ALS propagation chain, such as `setImmediate()`,
+ * `setTimeout()`, or event-emitter callbacks. Without this, spans created
+ * inside those callbacks become orphaned traces in Langfuse.
+ *
+ * **How it works:**
+ * 1. Captures the current ALS store at call time (synchronously).
+ * 2. Returns an async function that, when invoked, re-enters the captured
+ *    context via `contextStorage.run()` before executing the callback.
+ * 3. If no context exists at capture time, the callback runs without
+ *    ALS wrapping (no-op passthrough).
+ *
+ * @param fn - The async function to execute within the captured context
+ * @returns A new async function that preserves the Langfuse ALS context
+ *
+ * @example
+ * // Before (broken — setImmediate loses ALS context):
+ * setImmediate(async () => {
+ *   await this.checkAndSummarize(session, threshold);
+ * });
+ *
+ * // After (fixed — context is captured and re-entered):
+ * const wrappedFn = runWithCurrentLangfuseContext(async () => {
+ *   await this.checkAndSummarize(session, threshold);
+ * });
+ * setImmediate(wrappedFn);
+ */
+export declare function runWithCurrentLangfuseContext<T>(fn: () => Promise<T>): () => Promise<T>;
 /**
  * Get an OpenTelemetry Tracer for creating custom spans
  *