@rws-framework/ai-tools 2.2.1 → 3.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/docs/tutorial-style-rag.md +124 -0
- package/examples/test-recursive-chunker.ts +167 -0
- package/examples/tutorial-style-rag.ts +153 -0
- package/package.json +6 -4
- package/src/index.ts +25 -4
- package/src/models/convo/EmbedLoader.ts +111 -29
- package/src/models/convo/VectorStore.ts +82 -4
- package/src/models/prompts/_prompt.ts +2 -2
- package/src/models/prompts/inc/execution-methods-handler.ts +2 -2
- package/src/models/prompts/inc/input-output-manager.ts +9 -7
- package/src/services/LangChainEmbeddingService.ts +222 -0
- package/src/services/LangChainRAGService.ts +395 -0
- package/src/services/LangChainVectorStoreService.ts +378 -0
- package/src/services/OptimizedVectorSearchService.ts +324 -0
- package/src/services/TextChunker.ts +319 -0
- package/src/types/IPrompt.ts +3 -1
- package/src/types/embedding.types.ts +15 -0
- package/src/types/index.ts +5 -0
- package/src/types/rag.types.ts +44 -0
- package/src/types/search.types.ts +56 -0
- package/src/types/vectorstore.types.ts +23 -0
- package/src/services/VectorStoreService.ts +0 -15
package/src/services/TextChunker.ts
ADDED
@@ -0,0 +1,319 @@
+/**
+ * Text chunking utility following LangChain tutorial approach
+ * Uses RecursiveCharacterTextSplitter-like logic with token optimization
+ */
+export class TextChunker {
+    /**
+     * Conservative token estimation based on character count
+     * Uses a slightly more accurate ratio than the original 4 chars per token
+     */
+    static estimateTokens(text: string): number {
+        // More accurate estimation: ~3.7 characters per token on average
+        return Math.ceil(text.length / 3.7);
+    }
+
+    /**
+     * Default separators following LangChain RecursiveCharacterTextSplitter approach
+     * Ordered by preference for breaking text
+     */
+    private static readonly DEFAULT_SEPARATORS = [
+        '\n\n', // Double newlines (paragraphs)
+        '\n', // Single newlines
+        '. ', // Sentence endings
+        '! ', // Exclamation sentence endings
+        '? ', // Question sentence endings
+        '; ', // Semicolons
+        ', ', // Commas
+        ' ', // Spaces (words)
+        '' // Character level (fallback)
+    ];
+
+    /**
+     * Chunk text using RecursiveCharacterTextSplitter approach from LangChain tutorial
+     * Recursively tries separators until chunks fit within token limits
+     *
+     * @param text - The text to chunk
+     * @param maxTokens - Maximum tokens per chunk (default: 450 to be safe under 512)
+     * @param overlap - Number of characters to overlap between chunks
+     * @param separators - Custom separators (uses defaults if not provided)
+     * @returns Array of text chunks
+     */
+    static chunkText(
+        text: string,
+        maxTokens: number = 450,
+        overlap: number = 50,
+        separators: string[] = TextChunker.DEFAULT_SEPARATORS
+    ): string[] {
+        if (!text || text.trim().length === 0) {
+            return [];
+        }
+
+        // If text is already within limits, return as-is
+        const estimatedTokens = this.estimateTokens(text);
+        if (estimatedTokens <= maxTokens) {
+            return [text.trim()];
+        }
+
+        console.log(`[TextChunker] Chunking text: ${text.length} chars, estimated ${estimatedTokens} tokens, max ${maxTokens} tokens per chunk`);
+
+        // Convert token limit to character limit (conservative)
+        const maxCharsPerChunk = Math.floor(maxTokens * 3.5);
+
+        // Use recursive splitting approach like LangChain tutorial
+        return this.recursiveSplit(text, maxCharsPerChunk, overlap, separators);
+    }
+
+    /**
+     * Recursive splitting approach following LangChain's RecursiveCharacterTextSplitter
+     * Tries each separator in order until chunks fit within limits
+     */
+    private static recursiveSplit(
+        text: string,
+        maxChars: number,
+        overlap: number,
+        separators: string[]
+    ): string[] {
+        const finalChunks: string[] = [];
+
+        // Get the first separator to try
+        const separator = separators[0];
+        let newSeparators: string[];
+
+        if (separator === '') {
+            // Character-level splitting (last resort)
+            newSeparators = [];
+        } else {
+            // Continue with remaining separators for recursive calls
+            newSeparators = separators.slice(1);
+        }
+
+        // Split text by current separator
+        const splits = this.splitTextBySeparator(text, separator);
+
+        // Process each split
+        for (const split of splits) {
+            if (split.length <= maxChars) {
+                // Split fits within limit, add it
+                finalChunks.push(split);
+            } else {
+                // Split is too large, need to recursively split further
+                if (newSeparators.length === 0) {
+                    // No more separators, force split by character limit
+                    finalChunks.push(...this.forceSplitByCharacterLimit(split, maxChars, overlap));
+                } else {
+                    // Recursively split with next separator
+                    finalChunks.push(...this.recursiveSplit(split, maxChars, overlap, newSeparators));
+                }
+            }
+        }
+
+        // Merge small chunks and add overlaps (like tutorial's approach)
+        return this.mergeChunksWithOverlap(finalChunks, maxChars, overlap);
+    }
+
+    /**
+     * Split text by a specific separator (preserving separator where appropriate)
+     */
+    private static splitTextBySeparator(text: string, separator: string): string[] {
+        if (separator === '') {
+            // Character-level split
+            return text.split('');
+        }
+
+        if (!text.includes(separator)) {
+            return [text];
+        }
+
+        // Split by separator and preserve meaningful separators
+        const splits = text.split(separator);
+        const result: string[] = [];
+
+        for (let i = 0; i < splits.length; i++) {
+            const split = splits[i];
+
+            if (i === splits.length - 1) {
+                // Last split, don't add separator
+                if (split.trim()) {
+                    result.push(split.trim());
+                }
+            } else {
+                // Add separator back for meaningful breaks
+                const withSeparator = split + (this.shouldPreserveSeparator(separator) ? separator : '');
+                if (withSeparator.trim()) {
+                    result.push(withSeparator.trim());
+                }
+            }
+        }
+
+        return result.filter(s => s.length > 0);
+    }
+
+    /**
+     * Determine if separator should be preserved in the text
+     */
+    private static shouldPreserveSeparator(separator: string): boolean {
+        // Preserve sentence endings and meaningful punctuation
+        return ['. ', '! ', '? ', '; '].includes(separator);
+    }
+
+    /**
+     * Force split by character limit when no separators work
+     */
+    private static forceSplitByCharacterLimit(text: string, maxChars: number, overlap: number): string[] {
+        const chunks: string[] = [];
+        let position = 0;
+
+        while (position < text.length) {
+            let endPosition = position + maxChars;
+
+            if (endPosition >= text.length) {
+                // Last chunk
+                const lastChunk = text.substring(position).trim();
+                if (lastChunk) {
+                    chunks.push(lastChunk);
+                }
+                break;
+            }
+
+            chunks.push(text.substring(position, endPosition).trim());
+            position = endPosition - overlap;
+
+            // Ensure we don't go backwards
+            if (position < 0) position = 0;
+        }
+
+        return chunks.filter(chunk => chunk.length > 0);
+    }
+
+    /**
+     * Merge small chunks and add overlaps following tutorial approach
+     */
+    private static mergeChunksWithOverlap(chunks: string[], maxChars: number, overlap: number): string[] {
+        if (chunks.length === 0) return [];
+
+        const mergedChunks: string[] = [];
+        let currentChunk = '';
+
+        for (let i = 0; i < chunks.length; i++) {
+            const chunk = chunks[i];
+
+            // Check if we can merge this chunk with current chunk
+            const combined = currentChunk ? currentChunk + ' ' + chunk : chunk;
+
+            if (combined.length <= maxChars) {
+                // Can merge
+                currentChunk = combined;
+            } else {
+                // Can't merge, save current chunk and start new one
+                if (currentChunk) {
+                    mergedChunks.push(currentChunk.trim());
+                }
+                currentChunk = chunk;
+            }
+        }
+
+        // Add final chunk
+        if (currentChunk.trim()) {
+            mergedChunks.push(currentChunk.trim());
+        }
+
+        // Add overlaps between chunks
+        return this.addOverlapsBetweenChunks(mergedChunks, overlap);
+    }
+
+    /**
+     * Add overlaps between chunks like the tutorial approach
+     */
+    private static addOverlapsBetweenChunks(chunks: string[], overlap: number): string[] {
+        if (chunks.length <= 1 || overlap <= 0) {
+            return chunks;
+        }
+
+        const chunksWithOverlap: string[] = [];
+
+        for (let i = 0; i < chunks.length; i++) {
+            let chunkWithOverlap = chunks[i];
+
+            // Add overlap from previous chunk at the beginning
+            if (i > 0) {
+                const prevOverlap = this.extractOverlap(chunks[i - 1], overlap);
+                if (prevOverlap && !chunkWithOverlap.startsWith(prevOverlap)) {
+                    chunkWithOverlap = prevOverlap + ' ' + chunkWithOverlap;
+                }
+            }
+
+            chunksWithOverlap.push(chunkWithOverlap.trim());
+        }
+
+        return chunksWithOverlap;
+    }
+
+    /**
+     * Extract overlap text from the end of a chunk
+     */
+    private static extractOverlap(text: string, overlapLength: number): string {
+        if (text.length <= overlapLength) {
+            return text;
+        }
+
+        // Try to break at word boundary for overlap
+        let startPosition = text.length - overlapLength;
+        while (startPosition < text.length && text[startPosition] !== ' ') {
+            startPosition++;
+        }
+
+        if (startPosition >= text.length) {
+            // No word boundary found, just take last characters
+            return text.substring(text.length - overlapLength);
+        }
+
+        return text.substring(startPosition + 1); // +1 to skip the space
+    }
+
+    /**
+     * Truncate text to fit within token limit (utility method)
+     */
+    static truncateText(text: string, maxTokens: number): string {
+        const maxChars = Math.floor(maxTokens * 3.5);
+
+        if (text.length <= maxChars) {
+            return text;
+        }
+
+        // Try to truncate at word boundary
+        let truncatePosition = maxChars;
+        while (truncatePosition > maxChars * 0.8 && text[truncatePosition] !== ' ') {
+            truncatePosition--;
+        }
+
+        if (truncatePosition <= maxChars * 0.8) {
+            // No word boundary found, truncate at character limit
+            truncatePosition = maxChars;
+        }
+
+        return text.substring(0, truncatePosition).trim();
+    }
+
+    /**
+     * Create documents from text chunks (tutorial-style helper)
+     * Similar to how the tutorial creates Document objects from splits
+     */
+    static createDocumentsFromChunks(
+        text: string,
+        metadata: Record<string, any> = {},
+        maxTokens: number = 450,
+        overlap: number = 50
+    ): Array<{ pageContent: string; metadata: Record<string, any> }> {
+        const chunks = this.chunkText(text, maxTokens, overlap);
+
+        return chunks.map((chunk, index) => ({
+            pageContent: chunk,
+            metadata: {
+                ...metadata,
+                chunkIndex: index,
+                id: `${metadata.documentId || 'doc'}_chunk_${index}`,
+                totalChunks: chunks.length
+            }
+        }));
+    }
+}
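Below is a minimal usage sketch of the new chunker, derived only from the static signatures above. The import path and sample values are assumptions for illustration (src/index.ts also changed in this release, so the class may be re-exported from the package root, but this diff does not confirm it):

import { TextChunker } from '@rws-framework/ai-tools/src/services/TextChunker'; // assumed path

const longText = 'RWS is a TypeScript framework. '.repeat(200); // ~6200 chars, well over 450 tokens

// Split into ~450-token chunks with a 50-character overlap (the defaults)
const chunks = TextChunker.chunkText(longText, 450, 50);
console.log(chunks.length, TextChunker.estimateTokens(chunks[0]));

// Tutorial-style Document objects; ids follow `${documentId}_chunk_${index}`
const docs = TextChunker.createDocumentsFromChunks(longText, { documentId: 'kb-1' });
console.log(docs[0].metadata); // { documentId: 'kb-1', chunkIndex: 0, id: 'kb-1_chunk_0', totalChunks: ... }

Note that chunkText only falls back to character-level splitting when every separator fails, and each merged chunk gets a word-boundary overlap prepended from the previous chunk.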
package/src/types/IPrompt.ts
CHANGED
@@ -3,6 +3,7 @@ import { IterableReadableStream } from '@langchain/core/utils/stream';
 import { ChainValues } from '@langchain/core/utils/types';
 import { IContextToken } from './IContextToken';
 import { BaseChatModel } from '@langchain/core/language_models/chat_models';
+import z4, { Schema } from 'zod/v4';
 
 // General tool interfaces for AI models
 interface IAIToolParameterBase {
@@ -92,6 +93,7 @@ interface IAIRequestOptions {
     intruderPrompt?: string | null,
     ensureJson?: boolean,
     debugVars?: any,
+    schema?: z4.core.$ZodType | Schema,
     tools?: IAITool[]
 }
 
@@ -114,7 +116,7 @@ interface IRWSPromptJSON {
     enhancedInput: IPromptEnchantment[];
     sentInput: CompoundInput[];
     originalInput: CompoundInput[];
-    output: string;
+    output: string | object;
     modelId: string;
     modelType: string;
     multiTemplate: PromptTemplate;
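Taken together, these changes let request options carry a zod/v4 schema for structured output, which is presumably why IRWSPromptJSON.output widened from string to string | object. A hedged sketch of how a caller might populate the new field (the schema name and shape are invented for illustration):

import { z } from 'zod/v4';

// Hypothetical structured-output contract for a model response
const answerSchema = z.object({
    answer: z.string(),
    confidence: z.number().min(0).max(1)
});

const requestOptions = {
    ensureJson: true,
    schema: answerSchema // zod/v4 schemas satisfy the z4.core.$ZodType branch of the union
};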
package/src/types/embedding.types.ts
ADDED
@@ -0,0 +1,15 @@
+/**
+ * Embedding service configuration interfaces
+ */
+export interface IEmbeddingConfig {
+    provider: 'cohere';
+    apiKey: string;
+    model?: string;
+    batchSize?: number;
+}
+
+export interface IChunkConfig {
+    chunkSize?: number;
+    chunkOverlap?: number;
+    separators?: string[];
+}
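A minimal config literal for the interface above; the environment variable and model name are illustrative assumptions, and 'cohere' is the only provider the union currently admits:

const embeddingConfig: IEmbeddingConfig = {
    provider: 'cohere',
    apiKey: process.env.COHERE_API_KEY ?? '', // assumed env var name
    model: 'embed-english-v3.0', // example Cohere model; the package default is not visible in this diff
    batchSize: 32
};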
package/src/types/rag.types.ts
ADDED
@@ -0,0 +1,44 @@
+import { ISearchResult } from './search.types';
+
+/**
+ * RAG service configuration and request/response interfaces
+ */
+export interface ILangChainRAGConfig {
+    embedding?: import('./embedding.types').IEmbeddingConfig;
+    vectorStore: import('./vectorstore.types').IVectorStoreConfig;
+    chunking?: import('./embedding.types').IChunkConfig;
+    persistence?: {
+        enabled: boolean;
+        storagePath?: string;
+        autoSave?: boolean;
+    };
+}
+
+export interface IRAGIndexRequest {
+    content: string;
+    documentId: string | number;
+    metadata?: Record<string, any>;
+}
+
+export interface IRAGSearchRequest {
+    query: string;
+    maxResults?: number;
+    threshold?: number;
+    filter?: {
+        knowledgeIds?: (string | number)[];
+        documentIds?: (string | number)[];
+        [key: string]: any;
+    };
+}
+
+export interface IRAGResponse<T = any> {
+    success: boolean;
+    data: T | null;
+    error?: string;
+}
+
+export interface IRAGStats {
+    totalChunks: number;
+    totalDocuments: number;
+    knowledgeItems: number;
+}
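Assembled against the interfaces above, a full config plus a search request might look as follows. This is a sketch only; the LangChainRAGService methods that consume these types are not part of this excerpt, and the root re-export is an assumption based on the types/index.ts change:

import { ILangChainRAGConfig, IRAGSearchRequest } from '@rws-framework/ai-tools'; // assumed re-export

const ragConfig: ILangChainRAGConfig = {
    embedding: { provider: 'cohere', apiKey: process.env.COHERE_API_KEY ?? '' },
    vectorStore: { type: 'memory', maxResults: 5, similarityThreshold: 0.7 },
    chunking: { chunkSize: 450, chunkOverlap: 50 }, // mirrors the TextChunker defaults
    persistence: { enabled: true, storagePath: './vector-cache', autoSave: true } // hypothetical path
};

const searchRequest: IRAGSearchRequest = {
    query: 'How does chunk overlap work?',
    maxResults: 3,
    threshold: 0.75,
    filter: { documentIds: ['kb-1'] }
};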
package/src/types/search.types.ts
ADDED
@@ -0,0 +1,56 @@
+/**
+ * Search and result interfaces
+ */
+export interface ISearchResult {
+    content: string;
+    score: number;
+    metadata: any;
+    chunkId: string;
+}
+
+export interface IVectorSearchRequest {
+    query: string;
+    maxResults?: number;
+    similarityThreshold?: number;
+    filter?: {
+        knowledgeIds?: string[];
+        documentIds?: string[];
+        [key: string]: any;
+    };
+}
+
+export interface IVectorSearchResponse {
+    results: ISearchResult[];
+    totalResults: number;
+}
+
+/**
+ * Optimized search interfaces
+ */
+export interface IOptimizedSearchRequest {
+    query: string;
+    knowledgeVectors: Array<{
+        knowledgeId: string | number;
+        chunks: Array<{
+            content: string;
+            embedding: number[];
+            metadata: any;
+        }>;
+    }>;
+    maxResults?: number;
+    threshold?: number;
+}
+
+export interface IOptimizedSearchResult {
+    content: string;
+    score: number;
+    metadata: any;
+    knowledgeId: string | number;
+    chunkId: string;
+}
+
+export interface IOptimizedSearchResponse {
+    results: IOptimizedSearchResult[];
+    searchTime: number;
+    totalCandidates: number;
+}
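The optimized request carries pre-embedded chunks grouped by knowledge item, so the search service can score candidates without re-embedding documents at query time. A sketch with placeholder vectors (real embeddings would come from the embedding service and have hundreds of dimensions):

const optimizedRequest: IOptimizedSearchRequest = {
    query: 'vector similarity',
    knowledgeVectors: [{
        knowledgeId: 42,
        chunks: [{
            content: 'Cosine similarity compares two embedding vectors.',
            embedding: [0.12, -0.03, 0.87], // placeholder values
            metadata: { documentId: 'kb-1', chunkIndex: 0 }
        }]
    }],
    maxResults: 5,
    threshold: 0.7
};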
package/src/types/vectorstore.types.ts
ADDED
@@ -0,0 +1,23 @@
+/**
+ * Vector store configuration interfaces
+ */
+export interface IVectorStoreConfig {
+    type: 'memory';
+    maxResults?: number;
+    autoSave?: boolean;
+    similarityThreshold?: number;
+}
+
+export interface IDocumentChunk {
+    id: string;
+    content: string;
+    embedding?: number[];
+    metadata?: {
+        documentId: string;
+        chunkIndex: number;
+        source?: string;
+        title?: string;
+        knowledgeId?: string;
+        [key: string]: any;
+    };
+}
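An example chunk as the store would hold it. The id format matches the `${documentId}_chunk_${index}` ids produced by TextChunker.createDocumentsFromChunks; embedding is optional, presumably because it is attached by the embedding service after chunking (an assumption, not confirmed by this diff):

const chunk: IDocumentChunk = {
    id: 'kb-1_chunk_0',
    content: 'First chunk of the indexed document.',
    // embedding omitted; assumed to be filled in by the embedding service later
    metadata: {
        documentId: 'kb-1',
        chunkIndex: 0,
        source: 'tutorial-style-rag.md', // illustrative
        knowledgeId: '42'
    }
};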
package/src/services/VectorStoreService.ts
DELETED
@@ -1,15 +0,0 @@
-import { EmbeddingsInterface } from '@langchain/core/embeddings';
-import { Injectable } from '@rws-framework/server/nest';
-
-import RWSVectorStore, { VectorDocType } from '../models/convo/VectorStore';
-
-@Injectable()
-class VectorStoreService
-{
-    async createStore(docs: VectorDocType, embeddings: EmbeddingsInterface): Promise<RWSVectorStore>
-    {
-        return await (new RWSVectorStore(docs, embeddings)).init();
-    }
-}
-
-export { VectorStoreService };
|