rag-lite-ts 2.0.4 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -24,13 +24,29 @@
24
24
  import { Server } from '@modelcontextprotocol/sdk/server/index.js';
25
25
  import { StdioServerTransport } from '@modelcontextprotocol/sdk/server/stdio.js';
26
26
  import { CallToolRequestSchema, ListToolsRequestSchema, } from '@modelcontextprotocol/sdk/types.js';
27
- import { existsSync, statSync } from 'fs';
27
+ import { existsSync, statSync, createWriteStream } from 'fs';
28
28
  import { resolve } from 'path';
29
29
  import { SearchFactory } from './factories/search-factory.js';
30
30
  import { IngestionFactory } from './factories/ingestion-factory.js';
31
- import { openDatabase, getSystemInfo } from './core/db.js';
31
+ import { getSystemInfo } from './core/db.js';
32
32
  import { DatabaseConnectionManager } from './core/database-connection-manager.js';
33
33
  import { config, validateCoreConfig, ConfigurationError } from './core/config.js';
34
/**
 * Detect MIME type from file path or extension.
 *
 * Looks at the final dot-separated segment of the (lower-cased) path and
 * maps it to a known image MIME type. Unrecognized or missing extensions
 * fall back to 'image/jpeg', matching the original deliberate default.
 *
 * @param {string} filePath - File path or bare filename to inspect.
 * @returns {string} The detected image MIME type, or 'image/jpeg' if unknown.
 */
function getMimeTypeFromPath(filePath) {
    const MIME_BY_EXTENSION = {
        jpg: 'image/jpeg',
        jpeg: 'image/jpeg',
        png: 'image/png',
        gif: 'image/gif',
        webp: 'image/webp',
        bmp: 'image/bmp',
        svg: 'image/svg+xml'
    };
    const extension = filePath.toLowerCase().split('.').pop() || '';
    // Default to JPEG if unknown — callers emit MCP image content and need some image type.
    return MIME_BY_EXTENSION[extension] || 'image/jpeg';
}
34
50
  /**
35
51
  * MCP Server class that wraps RAG-lite TS functionality
36
52
  * Implements MCP protocol interface without creating REST/GraphQL endpoints
@@ -118,8 +134,8 @@ class RagLiteMCPServer {
118
134
  },
119
135
  rerank_strategy: {
120
136
  type: 'string',
121
- description: 'Reranking strategy for multimodal mode. Options: text-derived (default), metadata, hybrid, disabled',
122
- enum: ['text-derived', 'metadata', 'hybrid', 'disabled']
137
+ description: 'Reranking strategy for multimodal mode. Options: text-derived (default), disabled',
138
+ enum: ['text-derived', 'disabled']
123
139
  },
124
140
  force_rebuild: {
125
141
  type: 'boolean',
@@ -152,8 +168,8 @@ class RagLiteMCPServer {
152
168
  },
153
169
  rerank_strategy: {
154
170
  type: 'string',
155
- description: 'Reranking strategy for multimodal mode. Options: text-derived (default), metadata, hybrid, disabled',
156
- enum: ['text-derived', 'metadata', 'hybrid', 'disabled'],
171
+ description: 'Reranking strategy for multimodal mode. Options: text-derived (default), disabled',
172
+ enum: ['text-derived', 'disabled'],
157
173
  default: 'text-derived'
158
174
  },
159
175
  title: {
@@ -375,50 +391,60 @@ class RagLiteMCPServer {
375
391
  const startTime = Date.now();
376
392
  const results = await this.searchEngine.search(args.query, searchOptions);
377
393
  const searchTime = Date.now() - startTime;
378
- // Format results for MCP response with content type information
379
- const formattedResults = {
394
+ // Format results for MCP response with proper image content support
395
+ const textResults = {
380
396
  query: args.query,
381
397
  results_count: results.length,
382
398
  search_time_ms: searchTime,
383
- results: await Promise.all(results.map(async (result, index) => {
384
- const formattedResult = {
385
- rank: index + 1,
386
- score: Math.round(result.score * 100) / 100, // Round to 2 decimal places
387
- content_type: result.contentType,
388
- document: {
389
- id: result.document.id,
390
- title: result.document.title,
391
- source: result.document.source,
392
- content_type: result.document.contentType
393
- },
394
- text: result.content
395
- };
396
- // For image content, include base64-encoded image data for MCP clients
397
- if (result.contentType === 'image' && result.document.contentId) {
398
- try {
399
- const imageData = await this.searchEngine.getContent(result.document.contentId, 'base64');
400
- formattedResult.image_data = imageData;
401
- formattedResult.image_format = 'base64';
402
- }
403
- catch (error) {
404
- // If image retrieval fails, include error but don't fail the entire search
405
- formattedResult.image_error = error instanceof Error ? error.message : 'Failed to retrieve image';
406
- }
407
- }
408
- // Include metadata if available
409
- if (result.metadata) {
410
- formattedResult.metadata = result.metadata;
411
- }
412
- return formattedResult;
399
+ results: results.map((result, index) => ({
400
+ rank: index + 1,
401
+ score: Math.round(result.score * 100) / 100,
402
+ content_type: result.contentType,
403
+ document: {
404
+ id: result.document.id,
405
+ title: result.document.title,
406
+ source: result.document.source,
407
+ content_type: result.document.contentType
408
+ },
409
+ text: result.content,
410
+ metadata: result.metadata,
411
+ // Reference to image content if applicable
412
+ has_image: result.contentType === 'image' && !!result.document.contentId
413
413
  }))
414
414
  };
415
+ // Build MCP response content array
416
+ const responseContent = [
417
+ {
418
+ type: 'text',
419
+ text: JSON.stringify(textResults, null, 2)
420
+ }
421
+ ];
422
+ // Add proper MCP image content for each image result
423
+ for (const result of results) {
424
+ if (result.contentType === 'image' && result.document.contentId) {
425
+ try {
426
+ const imageData = await this.searchEngine.getContent(result.document.contentId, 'base64');
427
+ const mimeType = getMimeTypeFromPath(result.document.source);
428
+ responseContent.push({
429
+ type: 'image',
430
+ data: imageData,
431
+ mimeType: mimeType,
432
+ annotations: {
433
+ audience: ['user'],
434
+ priority: 0.8,
435
+ title: result.document.title,
436
+ source: result.document.source
437
+ }
438
+ });
439
+ }
440
+ catch (error) {
441
+ // If image retrieval fails, log but don't fail the entire search
442
+ console.error(`Failed to retrieve image for ${result.document.source}:`, error);
443
+ }
444
+ }
445
+ }
415
446
  return {
416
- content: [
417
- {
418
- type: 'text',
419
- text: JSON.stringify(formattedResults, null, 2),
420
- },
421
- ],
447
+ content: responseContent
422
448
  };
423
449
  }
424
450
  catch (error) {
@@ -549,7 +575,7 @@ class RagLiteMCPServer {
549
575
  if (mode === 'text') {
550
576
  throw new Error('Reranking strategy parameter is only supported in multimodal mode');
551
577
  }
552
- const validStrategies = ['text-derived', 'metadata', 'hybrid', 'disabled'];
578
+ const validStrategies = ['text-derived', 'disabled'];
553
579
  if (!validStrategies.includes(args.rerank_strategy)) {
554
580
  throw new Error(`Invalid reranking strategy: ${args.rerank_strategy}. Supported strategies: ${validStrategies.join(', ')}`);
555
581
  }
@@ -746,7 +772,7 @@ class RagLiteMCPServer {
746
772
  reject(new Error(`Failed to download image: HTTP ${redirectResponse.statusCode}`));
747
773
  return;
748
774
  }
749
- const fileStream = require('fs').createWriteStream(tempFilePath);
775
+ const fileStream = createWriteStream(tempFilePath);
750
776
  redirectResponse.pipe(fileStream);
751
777
  fileStream.on('finish', () => {
752
778
  fileStream.close();
@@ -761,7 +787,7 @@ class RagLiteMCPServer {
761
787
  return;
762
788
  }
763
789
  else {
764
- const fileStream = require('fs').createWriteStream(tempFilePath);
790
+ const fileStream = createWriteStream(tempFilePath);
765
791
  response.pipe(fileStream);
766
792
  fileStream.on('finish', () => {
767
793
  fileStream.close();
@@ -916,8 +942,8 @@ class RagLiteMCPServer {
916
942
  // Create ingestion pipeline with force rebuild using factory
917
943
  const pipeline = await IngestionFactory.create(config.db_file, config.index_file, { forceRebuild: true });
918
944
  try {
919
- // Get all documents from database and re-ingest them
920
- const db = await openDatabase(config.db_file);
945
+ // Get all documents from database and re-ingest them - use shared connection
946
+ const db = await DatabaseConnectionManager.getConnection(config.db_file);
921
947
  try {
922
948
  const documents = await db.all('SELECT DISTINCT source FROM documents ORDER BY source');
923
949
  if (documents.length === 0) {
@@ -971,7 +997,8 @@ class RagLiteMCPServer {
971
997
  };
972
998
  }
973
999
  finally {
974
- await db.close();
1000
+ // Release instead of close - keeps connection alive for reuse
1001
+ await DatabaseConnectionManager.releaseConnection(config.db_file);
975
1002
  }
976
1003
  }
977
1004
  finally {
@@ -1009,7 +1036,7 @@ class RagLiteMCPServer {
1009
1036
  // Check model compatibility if database exists
1010
1037
  if (stats.database_exists) {
1011
1038
  try {
1012
- const db = await openDatabase(config.db_file);
1039
+ const db = await DatabaseConnectionManager.getConnection(config.db_file);
1013
1040
  try {
1014
1041
  const systemInfo = await getSystemInfo(db);
1015
1042
  if (systemInfo && systemInfo.modelName && systemInfo.modelDimensions) {
@@ -1040,7 +1067,8 @@ class RagLiteMCPServer {
1040
1067
  stats.total_chunks = chunkCount?.count || 0;
1041
1068
  }
1042
1069
  finally {
1043
- await db.close();
1070
+ // Release instead of close - keeps connection alive for reuse
1071
+ await DatabaseConnectionManager.releaseConnection(config.db_file);
1044
1072
  }
1045
1073
  }
1046
1074
  catch (error) {
@@ -1221,48 +1249,61 @@ class RagLiteMCPServer {
1221
1249
  const startTime = Date.now();
1222
1250
  const results = await this.searchEngine.search(args.query, searchOptions);
1223
1251
  const searchTime = Date.now() - startTime;
1224
- // Format results for MCP response with content type information and image data
1225
- const formattedResults = {
1252
+ // Format results for MCP response with proper image content support
1253
+ const textResults = {
1226
1254
  query: args.query,
1227
1255
  content_type_filter: args.content_type || 'all',
1228
1256
  results_count: results.length,
1229
1257
  search_time_ms: searchTime,
1230
- results: await Promise.all(results.map(async (result, index) => {
1231
- const formattedResult = {
1232
- rank: index + 1,
1233
- score: Math.round(result.score * 100) / 100,
1234
- content_type: result.contentType,
1235
- document: {
1236
- id: result.document.id,
1237
- title: result.document.title,
1238
- source: result.document.source,
1239
- content_type: result.document.contentType
1240
- },
1241
- text: result.content,
1242
- metadata: result.metadata
1243
- };
1244
- // For image content, include base64-encoded image data for MCP clients
1245
- if (result.contentType === 'image' && result.document.contentId) {
1246
- try {
1247
- const imageData = await this.searchEngine.getContent(result.document.contentId, 'base64');
1248
- formattedResult.image_data = imageData;
1249
- formattedResult.image_format = 'base64';
1250
- }
1251
- catch (error) {
1252
- // If image retrieval fails, include error but don't fail the entire search
1253
- formattedResult.image_error = error instanceof Error ? error.message : 'Failed to retrieve image';
1254
- }
1255
- }
1256
- return formattedResult;
1258
+ results: results.map((result, index) => ({
1259
+ rank: index + 1,
1260
+ score: Math.round(result.score * 100) / 100,
1261
+ content_type: result.contentType,
1262
+ document: {
1263
+ id: result.document.id,
1264
+ title: result.document.title,
1265
+ source: result.document.source,
1266
+ content_type: result.document.contentType
1267
+ },
1268
+ text: result.content,
1269
+ metadata: result.metadata,
1270
+ // Reference to image content if applicable
1271
+ has_image: result.contentType === 'image' && !!result.document.contentId
1257
1272
  }))
1258
1273
  };
1274
+ // Build MCP response content array
1275
+ const responseContent = [
1276
+ {
1277
+ type: 'text',
1278
+ text: JSON.stringify(textResults, null, 2)
1279
+ }
1280
+ ];
1281
+ // Add proper MCP image content for each image result
1282
+ for (const result of results) {
1283
+ if (result.contentType === 'image' && result.document.contentId) {
1284
+ try {
1285
+ const imageData = await this.searchEngine.getContent(result.document.contentId, 'base64');
1286
+ const mimeType = getMimeTypeFromPath(result.document.source);
1287
+ responseContent.push({
1288
+ type: 'image',
1289
+ data: imageData,
1290
+ mimeType: mimeType,
1291
+ annotations: {
1292
+ audience: ['user'],
1293
+ priority: 0.8,
1294
+ title: result.document.title,
1295
+ source: result.document.source
1296
+ }
1297
+ });
1298
+ }
1299
+ catch (error) {
1300
+ // If image retrieval fails, log but don't fail the entire search
1301
+ console.error(`Failed to retrieve image for ${result.document.source}:`, error);
1302
+ }
1303
+ }
1304
+ }
1259
1305
  return {
1260
- content: [
1261
- {
1262
- type: 'text',
1263
- text: JSON.stringify(formattedResults, null, 2),
1264
- },
1265
- ],
1306
+ content: responseContent
1266
1307
  };
1267
1308
  }
1268
1309
  catch (error) {
@@ -1416,23 +1457,6 @@ class RagLiteMCPServer {
1416
1457
  strategyInfo.accuracy = 'high';
1417
1458
  strategyInfo.use_cases = ['Mixed content with images', 'Visual documentation', 'Diagrams and charts'];
1418
1459
  break;
1419
- case 'metadata':
1420
- strategyInfo.description = 'Uses file metadata, filenames, and content properties for scoring without model inference';
1421
- strategyInfo.requirements = ['None - uses file system metadata only'];
1422
- strategyInfo.supported_content_types = ['text', 'image', 'pdf', 'docx'];
1423
- strategyInfo.performance_impact = 'low';
1424
- strategyInfo.accuracy = 'medium';
1425
- strategyInfo.use_cases = ['Fast retrieval', 'Filename-based search', 'Content type filtering'];
1426
- break;
1427
- case 'hybrid':
1428
- strategyInfo.description = 'Combines multiple reranking signals (semantic + metadata) with configurable weights';
1429
- strategyInfo.requirements = ['Text-derived reranker', 'Metadata reranker'];
1430
- strategyInfo.supported_content_types = ['text', 'image', 'pdf', 'docx'];
1431
- strategyInfo.performance_impact = 'high';
1432
- strategyInfo.accuracy = 'very high';
1433
- strategyInfo.use_cases = ['Best overall accuracy', 'Complex multimodal collections', 'Production systems'];
1434
- strategyInfo.default_weights = { semantic: 0.7, metadata: 0.3 };
1435
- break;
1436
1460
  case 'disabled':
1437
1461
  strategyInfo.description = 'No reranking applied - results ordered by vector similarity scores only';
1438
1462
  strategyInfo.requirements = ['None'];
@@ -1453,8 +1477,8 @@ class RagLiteMCPServer {
1453
1477
  strategies_by_mode: strategiesByMode,
1454
1478
  recommendations: {
1455
1479
  text_mode: 'Use cross-encoder for best accuracy, disabled for best performance',
1456
- multimodal_mode: 'Use hybrid for best accuracy, text-derived for good balance, metadata for fast retrieval',
1457
- development: 'Start with disabled or metadata for fast iteration, upgrade to cross-encoder/text-derived for production'
1480
+ multimodal_mode: 'Use text-derived for best accuracy, disabled for best performance',
1481
+ development: 'Start with disabled for fast iteration, upgrade to cross-encoder/text-derived for production'
1458
1482
  }
1459
1483
  };
1460
1484
  return {
@@ -1500,19 +1524,19 @@ class RagLiteMCPServer {
1500
1524
  };
1501
1525
  // Add content breakdown if requested
1502
1526
  if (args.include_content_breakdown) {
1503
- const db = await openDatabase(config.db_file);
1527
+ const db = await DatabaseConnectionManager.getConnection(config.db_file);
1504
1528
  try {
1505
1529
  // Get document count by content type
1506
- const docsByType = await db.all(`
1507
- SELECT content_type, COUNT(*) as count
1508
- FROM documents
1509
- GROUP BY content_type
1530
+ const docsByType = await db.all(`
1531
+ SELECT content_type, COUNT(*) as count
1532
+ FROM documents
1533
+ GROUP BY content_type
1510
1534
  `);
1511
1535
  // Get chunk count by content type
1512
- const chunksByType = await db.all(`
1513
- SELECT content_type, COUNT(*) as count
1514
- FROM chunks
1515
- GROUP BY content_type
1536
+ const chunksByType = await db.all(`
1537
+ SELECT content_type, COUNT(*) as count
1538
+ FROM chunks
1539
+ GROUP BY content_type
1516
1540
  `);
1517
1541
  enhancedStats.content_breakdown = {
1518
1542
  documents_by_type: docsByType.reduce((acc, row) => {
@@ -1526,7 +1550,8 @@ class RagLiteMCPServer {
1526
1550
  };
1527
1551
  }
1528
1552
  finally {
1529
- await db.close();
1553
+ // Release instead of close - keeps connection alive for reuse
1554
+ await DatabaseConnectionManager.releaseConnection(config.db_file);
1530
1555
  }
1531
1556
  }
1532
1557
  // Add performance metrics if requested
@@ -1600,6 +1625,8 @@ class RagLiteMCPServer {
1600
1625
  this.isSearchEngineInitialized = true;
1601
1626
  }
1602
1627
  catch (error) {
1628
+ console.error('❌ MCP Server: Search engine initialization failed');
1629
+ console.error(`❌ Error: ${error instanceof Error ? error.message : String(error)}`);
1603
1630
  // Check if this is a mode detection error
1604
1631
  if (error instanceof Error && error.message.includes('mode detection')) {
1605
1632
  console.error('⚠️ MCP Server: Mode detection failed, falling back to text mode');
@@ -1612,7 +1639,6 @@ class RagLiteMCPServer {
1612
1639
  throw error;
1613
1640
  }
1614
1641
  // For other initialization errors, provide a generic wrapper
1615
- console.error('❌ MCP Server: Search engine initialization failed');
1616
1642
  throw new Error(`Failed to initialize search engine: ${error instanceof Error ? error.message : 'Unknown error'}`);
1617
1643
  }
1618
1644
  }
@@ -1635,8 +1661,8 @@ class RagLiteMCPServer {
1635
1661
  const { ModeDetectionService } = await import('./core/mode-detection-service.js');
1636
1662
  const modeService = new ModeDetectionService(config.db_file);
1637
1663
  const systemInfo = await modeService.detectMode();
1638
- // Check if database has any images
1639
- const db = await openDatabase(config.db_file);
1664
+ // Check if database has any images - use shared connection
1665
+ const db = await DatabaseConnectionManager.getConnection(config.db_file);
1640
1666
  let hasImages = false;
1641
1667
  let documentCount = 0;
1642
1668
  try {
@@ -1646,7 +1672,8 @@ class RagLiteMCPServer {
1646
1672
  documentCount = docCount?.count || 0;
1647
1673
  }
1648
1674
  finally {
1649
- await db.close();
1675
+ // Release instead of close - keeps connection alive for reuse
1676
+ await DatabaseConnectionManager.releaseConnection(config.db_file);
1650
1677
  }
1651
1678
  return {
1652
1679
  mode: systemInfo.mode,
@@ -338,76 +338,73 @@ export class CLIPEmbedder extends BaseUniversalEmbedder {
338
338
  if (!this.textModel || !this.tokenizer) {
339
339
  throw new Error('CLIP text model or tokenizer not initialized');
340
340
  }
341
- try {
342
- // Use the validated CLIPTextModelWithProjection approach (no pixel_values errors)
343
- // Tokenize text with CLIP's requirements
344
- // The tokenizer handles truncation at 77 TOKENS (not characters)
345
- const tokens = await this.tokenizer(processedText, {
346
- padding: true,
347
- truncation: true,
348
- max_length: 77, // CLIP's text sequence length limit (77 tokens)
349
- return_tensors: 'pt'
350
- });
351
- // Log token information for debugging (only in development)
352
- if (process.env.NODE_ENV === 'development') {
353
- const tokenIds = tokens.input_ids?.data || [];
354
- const actualTokenCount = Array.from(tokenIds).filter((id) => id !== 0).length;
355
- if (actualTokenCount >= 77) {
356
- console.warn(`Text truncated by tokenizer: "${processedText.substring(0, 50)}..." (truncated to 77 tokens)`);
357
- }
358
- }
359
- // Generate text embedding using CLIPTextModelWithProjection
360
- const output = await this.textModel(tokens);
361
- // Extract embedding from text_embeds (no pixel_values dependency)
362
- const embedding = new Float32Array(output.text_embeds.data);
363
- // Validate embedding dimensions and values
364
- if (embedding.length !== this.dimensions) {
365
- throw new Error(`CLIP embedding dimension mismatch: expected ${this.dimensions}, got ${embedding.length}`);
366
- }
367
- // Validate that all values are finite numbers
368
- const invalidValues = Array.from(embedding).filter(val => !isFinite(val) || isNaN(val));
369
- if (invalidValues.length > 0) {
370
- throw new Error(`CLIP embedding contains ${invalidValues.length} invalid values`);
371
- }
372
- // Validate embedding quality - should not be all zeros
373
- const nonZeroValues = Array.from(embedding).filter(val => Math.abs(val) > 1e-8);
374
- if (nonZeroValues.length === 0) {
375
- throw new Error('CLIP embedding is all zeros');
376
- }
377
- // Calculate embedding magnitude before normalization for quality assessment
378
- const magnitudeBeforeNorm = Math.sqrt(Array.from(embedding).reduce((sum, val) => sum + val * val, 0));
379
- if (magnitudeBeforeNorm < 1e-6) {
380
- throw new Error(`CLIP embedding has critically low magnitude: ${magnitudeBeforeNorm.toExponential(3)}`);
381
- }
382
- // Apply L2-normalization (CLIP models are trained with normalized embeddings)
383
- this.normalizeEmbedding(embedding);
384
- // Verify normalization was successful
385
- const magnitudeAfterNorm = Math.sqrt(Array.from(embedding).reduce((sum, val) => sum + val * val, 0));
386
- if (Math.abs(magnitudeAfterNorm - 1.0) > 0.01) {
387
- console.warn(`Warning: Embedding normalization may be imprecise (magnitude: ${magnitudeAfterNorm.toFixed(6)})`);
341
+ // Use the validated CLIPTextModelWithProjection approach (no pixel_values errors)
342
+ // Tokenize text with CLIP's requirements
343
+ // The tokenizer handles truncation at 77 TOKENS (not characters)
344
+ const tokens = await this.tokenizer(processedText, {
345
+ padding: true,
346
+ truncation: true,
347
+ max_length: 77, // CLIP's text sequence length limit (77 tokens)
348
+ return_tensors: 'pt'
349
+ });
350
+ // Log token information for debugging (only in development)
351
+ if (process.env.NODE_ENV === 'development') {
352
+ const tokenIds = tokens.input_ids?.data || [];
353
+ const actualTokenCount = Array.from(tokenIds).filter((id) => id !== 0).length;
354
+ if (actualTokenCount >= 77) {
355
+ console.warn(`Text truncated by tokenizer: "${processedText.substring(0, 50)}..." (truncated to 77 tokens)`);
356
+ }
357
+ }
358
+ // Generate text embedding using CLIPTextModelWithProjection
359
+ const output = await this.textModel(tokens);
360
+ // Extract embedding from text_embeds (no pixel_values dependency)
361
+ const embedding = new Float32Array(output.text_embeds.data);
362
+ // Validate embedding dimensions and values
363
+ if (embedding.length !== this.dimensions) {
364
+ throw new Error(`CLIP embedding dimension mismatch: expected ${this.dimensions}, got ${embedding.length}`);
365
+ }
366
+ // Validate that all values are finite numbers
367
+ const invalidValues = Array.from(embedding).filter(val => !isFinite(val) || isNaN(val));
368
+ if (invalidValues.length > 0) {
369
+ throw new Error(`CLIP embedding contains ${invalidValues.length} invalid values`);
370
+ }
371
+ // Validate embedding quality - should not be all zeros
372
+ const nonZeroValues = Array.from(embedding).filter(val => Math.abs(val) > 1e-8);
373
+ if (nonZeroValues.length === 0) {
374
+ throw new Error('CLIP embedding is all zeros');
375
+ }
376
+ // Calculate embedding magnitude before normalization for quality assessment
377
+ const magnitudeBeforeNorm = Math.sqrt(Array.from(embedding).reduce((sum, val) => sum + val * val, 0));
378
+ if (magnitudeBeforeNorm < 1e-6) {
379
+ throw new Error(`CLIP embedding has critically low magnitude: ${magnitudeBeforeNorm.toExponential(3)}`);
380
+ }
381
+ // Apply L2-normalization (CLIP models are trained with normalized embeddings)
382
+ this.normalizeEmbedding(embedding);
383
+ // Verify normalization was successful
384
+ const magnitudeAfterNorm = Math.sqrt(Array.from(embedding).reduce((sum, val) => sum + val * val, 0));
385
+ if (Math.abs(magnitudeAfterNorm - 1.0) > 0.01) {
386
+ console.warn(`Warning: Embedding normalization may be imprecise (magnitude: ${magnitudeAfterNorm.toFixed(6)})`);
387
+ }
388
+ // Log text embedding generation
389
+ console.log(`[CLIP] Generated text embedding for: "${processedText.substring(0, 30)}${processedText.length > 30 ? '...' : ''}"`);
390
+ // Generate unique embedding ID
391
+ const embeddingId = this.generateEmbeddingId(processedText, 'text');
392
+ return {
393
+ embedding_id: embeddingId,
394
+ vector: embedding,
395
+ contentType: 'text',
396
+ metadata: {
397
+ originalText: text,
398
+ processedText: processedText,
399
+ textLength: processedText.length,
400
+ embeddingMagnitudeBeforeNorm: magnitudeBeforeNorm,
401
+ embeddingMagnitudeAfterNorm: magnitudeAfterNorm,
402
+ normalized: true,
403
+ modelName: this.modelName,
404
+ modelType: this.modelType,
405
+ dimensions: this.dimensions
388
406
  }
389
- // Generate unique embedding ID
390
- const embeddingId = this.generateEmbeddingId(processedText, 'text');
391
- return {
392
- embedding_id: embeddingId,
393
- vector: embedding,
394
- contentType: 'text',
395
- metadata: {
396
- originalText: text,
397
- processedText: processedText,
398
- textLength: processedText.length,
399
- embeddingMagnitudeBeforeNorm: magnitudeBeforeNorm,
400
- embeddingMagnitudeAfterNorm: magnitudeAfterNorm,
401
- normalized: true,
402
- modelName: this.modelName,
403
- modelType: this.modelType,
404
- dimensions: this.dimensions
405
- }
406
- };
407
- }
408
- catch (error) {
409
- throw error;
410
- }
407
+ };
411
408
  }
412
409
  // =============================================================================
413
410
  // IMAGE EMBEDDING METHODS
@@ -602,9 +599,11 @@ export class CLIPEmbedder extends BaseUniversalEmbedder {
602
599
  const absolutePath = path.resolve(imagePath);
603
600
  // Try to use Sharp for better Node.js support
604
601
  try {
605
- const sharp = await import('sharp');
602
+ const sharpModule = await import('sharp');
603
+ const sharp = sharpModule.default;
604
+ sharp.concurrency(2);
606
605
  // Use Sharp to load and get raw pixel data
607
- const { data, info } = await sharp.default(absolutePath)
606
+ const { data, info } = await sharp(absolutePath)
608
607
  .resize(variant.imageSize, variant.imageSize, {
609
608
  fit: 'cover',
610
609
  position: 'center'