npm - @soulcraft/brainy - Versions diffs - 6.5.0 → 6.6.0 - Mend

@soulcraft/brainy 6.5.0 → 6.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28)

package/assets/models/all-MiniLM-L6-v2-q8/config.json +25 -0
package/assets/models/all-MiniLM-L6-v2-q8/model.onnx +0 -0
package/assets/models/all-MiniLM-L6-v2-q8/tokenizer.json +30686 -0
package/assets/models/all-MiniLM-L6-v2-q8/vocab.json +1 -0
package/dist/critical/model-guardian.d.ts +5 -22
package/dist/critical/model-guardian.js +38 -210
package/dist/embeddings/EmbeddingManager.d.ts +7 -17
package/dist/embeddings/EmbeddingManager.js +28 -136
package/dist/embeddings/wasm/AssetLoader.d.ts +67 -0
package/dist/embeddings/wasm/AssetLoader.js +238 -0
package/dist/embeddings/wasm/EmbeddingPostProcessor.d.ts +60 -0
package/dist/embeddings/wasm/EmbeddingPostProcessor.js +123 -0
package/dist/embeddings/wasm/ONNXInferenceEngine.d.ts +55 -0
package/dist/embeddings/wasm/ONNXInferenceEngine.js +154 -0
package/dist/embeddings/wasm/WASMEmbeddingEngine.d.ts +82 -0
package/dist/embeddings/wasm/WASMEmbeddingEngine.js +231 -0
package/dist/embeddings/wasm/WordPieceTokenizer.d.ts +71 -0
package/dist/embeddings/wasm/WordPieceTokenizer.js +264 -0
package/dist/embeddings/wasm/index.d.ts +13 -0
package/dist/embeddings/wasm/index.js +15 -0
package/dist/embeddings/wasm/types.d.ts +114 -0
package/dist/embeddings/wasm/types.js +25 -0
package/dist/setup.d.ts +11 -11
package/dist/setup.js +17 -31
package/dist/utils/embedding.d.ts +45 -62
package/dist/utils/embedding.js +61 -440
package/package.json +10 -3
package/scripts/download-model.cjs +175 -0

package/dist/critical/model-guardian.d.ts CHANGED

@@ -5,15 +5,14 @@
  * Without the exact model, users CANNOT access their data
  *
  * Requirements:
- * 1. Model MUST be Xenova/all-MiniLM-L6-v2 (never changes)
- * 2. Model MUST be available at runtime
+ * 1. Model MUST be all-MiniLM-L6-v2-q8 (bundled in package)
+ * 2. Model MUST be available at runtime (embedded in npm package)
  * 3. Model MUST produce consistent 384-dim embeddings
  * 4. System MUST fail fast if model unavailable in production
  */
 export declare class ModelGuardian {
     private static instance;
     private isVerified;
-    private modelPath;
     private lastVerification;
     private constructor();
     static getInstance(): ModelGuardian;
@@ -23,34 +22,18 @@ export declare class ModelGuardian {
      */
     ensureCriticalModel(): Promise<void>;
     /**
-     * Verify the local model files exist and are correct
+     * Verify the bundled WASM model works correctly
      */
-    private verifyLocalModel;
-    /**
-     * Compute SHA256 hash of a file
-     */
-    private computeFileHash;
-    /**
-     * Download model from a fallback source
-     */
-    private downloadFromSource;
-    /**
-     * Configure transformers.js to use verified local model
-     */
-    private configureTransformers;
-    /**
-     * Detect where models should be stored
-     */
-    private detectModelPath;
+    private verifyBundledModel;
     /**
      * Get model status for diagnostics
      */
     getStatus(): Promise<{
         verified: boolean;
-        path: string;
         lastVerification: Date | null;
         modelName: string;
         dimensions: number;
+        bundled: boolean;
     }>;
     /**
      * Force re-verification (for testing)

package/dist/critical/model-guardian.js CHANGED

@@ -5,51 +5,24 @@
  * Without the exact model, users CANNOT access their data
  *
  * Requirements:
- * 1. Model MUST be Xenova/all-MiniLM-L6-v2 (never changes)
- * 2. Model MUST be available at runtime
+ * 1. Model MUST be all-MiniLM-L6-v2-q8 (bundled in package)
+ * 2. Model MUST be available at runtime (embedded in npm package)
  * 3. Model MUST produce consistent 384-dim embeddings
  * 4. System MUST fail fast if model unavailable in production
  */
-import { env } from '@huggingface/transformers';
+import { WASMEmbeddingEngine } from '../embeddings/wasm/index.js';
 // CRITICAL: These values MUST NEVER CHANGE
 const CRITICAL_MODEL_CONFIG = {
-    modelName: 'Xenova/all-MiniLM-L6-v2',
-    modelHash: {
-        // SHA256 of model.onnx - computed from actual model
-        'onnx/model.onnx': 'add_actual_hash_here',
-        'tokenizer.json': 'add_actual_hash_here'
-    },
-    modelSize: {
-        'onnx/model.onnx': 90387606, // Exact size in bytes (updated to match actual file)
-        'tokenizer.json': 711661
-    },
+    modelName: 'all-MiniLM-L6-v2-q8',
     embeddingDimensions: 384,
-    fallbackSources: [
-        // Primary: Our Google Cloud Storage CDN (we control this, fastest)
-        {
-            name: 'Soulcraft CDN (Primary)',
-            url: 'https://models.soulcraft.com/models/all-MiniLM-L6-v2.tar.gz',
-            type: 'tarball'
-        },
-        // Secondary: GitHub releases backup
-        {
-            name: 'GitHub Backup',
-            url: 'https://github.com/soulcraftlabs/brainy-models/releases/download/v1.0.0/all-MiniLM-L6-v2.tar.gz',
-            type: 'tarball'
-        },
-        // Tertiary: Hugging Face (original source)
-        {
-            name: 'Hugging Face',
-            url: 'huggingface',
-            type: 'transformers'
-        }
-    ]
+    // Model is bundled in package - no external downloads needed
+    bundled: true
 };
 export class ModelGuardian {
     constructor() {
         this.isVerified = false;
         this.lastVerification = null;
-        this.modelPath = this.detectModelPath();
+        // Model is bundled - no path detection needed
     }
     static getInstance() {
         if (!ModelGuardian.instance) {
@@ -62,200 +35,55 @@ export class ModelGuardian {
      * This MUST be called before any embedding operations
      */
     async ensureCriticalModel() {
-        console.log('DEBUG: ensureCriticalModel called');
-        console.log('🛡️ MODEL GUARDIAN: Verifying critical model availability...');
-        console.log(`🚀 Debug: Model path: ${this.modelPath}`);
-        console.log(`🚀 Debug: Already verified: ${this.isVerified}`);
         // Check if already verified in this session
         if (this.isVerified && this.lastVerification) {
             const hoursSinceVerification = (Date.now() - this.lastVerification.getTime()) / (1000 * 60 * 60);
             if (hoursSinceVerification < 24) {
-                console.log('✅ Model previously verified in this session');
                 return;
             }
         }
-        // Step 1: Check if model exists locally
-        console.log('🔍 Debug: Calling verifyLocalModel()');
-        const modelExists = await this.verifyLocalModel();
-        if (modelExists) {
-            console.log('✅ Critical model verified locally');
+        // Verify the bundled WASM model works
+        const modelWorks = await this.verifyBundledModel();
+        if (modelWorks) {
             this.isVerified = true;
             this.lastVerification = new Date();
-            this.configureTransformers();
             return;
         }
-        // Step 2: In production, FAIL FAST (Node.js only)
-        if (typeof window === 'undefined' && process.env.NODE_ENV === 'production' && !process.env.BRAINY_ALLOW_RUNTIME_DOWNLOAD) {
-            throw new Error('🚨 CRITICAL FAILURE: Transformer model not found in production!\n' +
-                'The model is REQUIRED for Brainy to function.\n' +
-                'Users CANNOT access their data without it.\n' +
-                'Solution: Run "npm run download-models" during build stage.');
-        }
-        // Step 3: Attempt to download from fallback sources
-        console.warn('⚠️ Model not found locally, attempting download...');
-        for (const source of CRITICAL_MODEL_CONFIG.fallbackSources) {
-            try {
-                console.log(`📥 Trying ${source.name}...`);
-                await this.downloadFromSource(source);
-                // Verify the download
-                if (await this.verifyLocalModel()) {
-                    console.log(`✅ Successfully downloaded from ${source.name}`);
-                    this.isVerified = true;
-                    this.lastVerification = new Date();
-                    this.configureTransformers();
-                    return;
-                }
-            }
-            catch (error) {
-                console.warn(`❌ ${source.name} failed:`, error.message);
-            }
-        }
-        // Step 4: CRITICAL FAILURE
-        throw new Error('🚨 CRITICAL FAILURE: Cannot obtain transformer model!\n' +
-            'Tried all fallback sources.\n' +
-            'Brainy CANNOT function without the model.\n' +
-            'Users CANNOT access their data.\n' +
-            'Please check network connectivity or pre-download models.');
+        // CRITICAL FAILURE
+        throw new Error('🚨 CRITICAL FAILURE: Bundled transformer model not working!\n' +
+            'The model is REQUIRED for Brainy to function.\n' +
+            'Users CANNOT access their data without it.\n' +
+            'This indicates a package installation issue.');
     }
     /**
-     * Verify the local model files exist and are correct
+     * Verify the bundled WASM model works correctly
      */
-    async verifyLocalModel() {
-        // Browser doesn't have local file access
-        if (typeof window !== 'undefined') {
-            console.log('⚠️ Model verification skipped in browser environment');
-            return false;
-        }
-        // Dynamically import Node.js modules
-        const fs = await import('node:fs');
-        const fsPromises = await import('node:fs/promises');
-        const path = await import('node:path');
-        const modelBasePath = path.join(this.modelPath, ...CRITICAL_MODEL_CONFIG.modelName.split('/'));
-        console.log(`🔍 Debug: Checking model at path: ${modelBasePath}`);
-        console.log(`🔍 Debug: Model path components: ${this.modelPath} + ${CRITICAL_MODEL_CONFIG.modelName.split('/')}`);
-        // Check critical files
-        const criticalFiles = [
-            'onnx/model.onnx',
-            'tokenizer.json',
-            'config.json'
-        ];
-        for (const file of criticalFiles) {
-            const filePath = path.join(modelBasePath, file);
-            console.log(`🔍 Debug: Checking file: ${filePath}`);
-            if (!fs.existsSync(filePath)) {
-                console.log(`❌ Missing critical file: ${file} at ${filePath}`);
+    async verifyBundledModel() {
+        try {
+            const engine = WASMEmbeddingEngine.getInstance();
+            // Initialize the engine (loads bundled model)
+            await engine.initialize();
+            // Test embedding generation
+            const testEmbedding = await engine.embed('test verification');
+            // Verify dimensions
+            if (testEmbedding.length !== CRITICAL_MODEL_CONFIG.embeddingDimensions) {
+                console.error(`❌ CRITICAL: Model dimension mismatch!\n` +
+                    `Expected: ${CRITICAL_MODEL_CONFIG.embeddingDimensions}\n` +
+                    `Got: ${testEmbedding.length}`);
                 return false;
             }
-            // Verify size for critical files
-            if (CRITICAL_MODEL_CONFIG.modelSize[file]) {
-                const stats = await fsPromises.stat(filePath);
-                const expectedSize = CRITICAL_MODEL_CONFIG.modelSize[file];
-                if (Math.abs(stats.size - expectedSize) > 1000) { // Allow 1KB variance
-                    console.error(`❌ CRITICAL: Model file size mismatch!\n` +
-                        `File: ${file}\n` +
-                        `Expected: ${expectedSize} bytes\n` +
-                        `Actual: ${stats.size} bytes\n` +
-                        `This indicates model corruption or version mismatch!`);
-                    return false;
-                }
-            }
-            // SHA256 verification for ultimate security
-            if (CRITICAL_MODEL_CONFIG.modelHash && CRITICAL_MODEL_CONFIG.modelHash[file]) {
-                const hash = await this.computeFileHash(filePath);
-                if (hash !== CRITICAL_MODEL_CONFIG.modelHash[file]) {
-                    console.error(`❌ CRITICAL: Model hash mismatch for ${file}!\n` +
-                        `Expected: ${CRITICAL_MODEL_CONFIG.modelHash[file]}\n` +
-                        `Got: ${hash}\n` +
-                        `This indicates model tampering or corruption!`);
-                    return false;
-                }
+            // Verify normalization (should be unit length)
+            const norm = Math.sqrt(testEmbedding.reduce((sum, v) => sum + v * v, 0));
+            if (Math.abs(norm - 1.0) > 0.01) {
+                console.error(`❌ CRITICAL: Embeddings not normalized! Norm: ${norm}`);
+                return false;
             }
-        }
-        return true;
-    }
-    /**
-     * Compute SHA256 hash of a file
-     */
-    async computeFileHash(filePath) {
-        try {
-            const { readFile } = await import('node:fs/promises');
-            const { createHash } = await import('node:crypto');
-            const fileBuffer = await readFile(filePath);
-            const hash = createHash('sha256').update(fileBuffer).digest('hex');
-            return hash;
+            return true;
         }
         catch (error) {
-            console.error(`Failed to compute hash for ${filePath}:`, error);
-            return '';
-        }
-    }
-    /**
-     * Download model from a fallback source
-     */
-    async downloadFromSource(source) {
-        if (source.type === 'transformers') {
-            // Use transformers.js native download
-            const { pipeline } = await import('@huggingface/transformers');
-            env.cacheDir = this.modelPath;
-            env.allowRemoteModels = true;
-            const extractor = await pipeline('feature-extraction', CRITICAL_MODEL_CONFIG.modelName);
-            // Test the model
-            const test = await extractor('test', { pooling: 'mean', normalize: true });
-            if (test.data.length !== CRITICAL_MODEL_CONFIG.embeddingDimensions) {
-                throw new Error(`CRITICAL: Model dimension mismatch! ` +
-                    `Expected ${CRITICAL_MODEL_CONFIG.embeddingDimensions}, ` +
-                    `got ${test.data.length}`);
-            }
-        }
-        else if (source.type === 'tarball') {
-            // Tarball extraction would require additional dependencies
-            // Skip this source and try next fallback
-            console.warn(`⚠️ Tarball extraction not available for ${source.name}. Trying next source...`);
-            return; // Will continue to next source in the loop
-        }
-    }
-    /**
-     * Configure transformers.js to use verified local model
-     */
-    configureTransformers() {
-        env.localModelPath = this.modelPath;
-        env.allowRemoteModels = false; // Force local only after verification
-        console.log('🔒 Transformers configured to use verified local model');
-    }
-    /**
-     * Detect where models should be stored
-     */
-    detectModelPath() {
-        // Browser always uses default path
-        if (typeof window !== 'undefined') {
-            return './models';
-        }
-        // Use require for synchronous access in Node.js
-        try {
-            const fs = require('node:fs');
-            const path = require('node:path');
-            const candidates = [
-                process.env.BRAINY_MODELS_PATH,
-                './models',
-                path.join(process.cwd(), 'models'),
-                path.join(process.env.HOME || '', '.brainy', 'models'),
-                '/opt/models', // Lambda/container path
-                env.cacheDir
-            ];
-            for (const candidatePath of candidates) {
-                if (candidatePath && fs.existsSync(candidatePath)) {
-                    const modelPath = path.join(candidatePath, ...CRITICAL_MODEL_CONFIG.modelName.split('/'));
-                    if (fs.existsSync(path.join(modelPath, 'onnx', 'model.onnx'))) {
-                        return candidatePath; // Return the models directory, not its parent
-                    }
-                }
-            }
-        }
-        catch (e) {
-            // If Node.js modules not available, return default
+            console.error('❌ Model verification failed:', error);
+            return false;
         }
-        // Default
-        return './models';
     }
     /**
      * Get model status for diagnostics
@@ -263,10 +91,10 @@ export class ModelGuardian {
     async getStatus() {
         return {
             verified: this.isVerified,
-            path: this.modelPath,
             lastVerification: this.lastVerification,
             modelName: CRITICAL_MODEL_CONFIG.modelName,
-            dimensions: CRITICAL_MODEL_CONFIG.embeddingDimensions
+            dimensions: CRITICAL_MODEL_CONFIG.embeddingDimensions,
+            bundled: CRITICAL_MODEL_CONFIG.bundled
         };
     }
     /**

package/dist/embeddings/EmbeddingManager.d.ts CHANGED

@@ -2,18 +2,14 @@
  * Unified Embedding Manager
  *
  * THE single source of truth for all embedding operations in Brainy.
- * Combines model management, precision configuration, and embedding generation
- * into one clean, maintainable class.
+ * Uses direct ONNX WASM inference for universal compatibility.
  *
  * Features:
  * - Singleton pattern ensures ONE model instance
- * - Automatic Q8 (default) or FP32 precision
- * - Model downloading and caching
- * - Thread-safe initialization
+ * - Direct ONNX WASM (no transformers.js dependency)
+ * - Bundled model (no runtime downloads)
+ * - Works everywhere: Node.js, Bun, Bun --compile, browsers
  * - Memory monitoring
- *
- * This replaces: SingletonModelManager, TransformerEmbedding, ModelPrecisionManager,
- * hybridModelManager, universalMemoryManager, and more.
  */
 import { Vector, EmbeddingFunction } from '../coreTypes.js';
 export type ModelPrecision = 'q8' | 'fp32';
@@ -27,9 +23,11 @@ interface EmbeddingStats {
 }
 /**
  * Unified Embedding Manager - Clean, simple, reliable
+ *
+ * Now powered by direct ONNX WASM for universal compatibility.
  */
 export declare class EmbeddingManager {
-    private model;
+    private engine;
     private precision;
     private modelName;
     private initialized;
@@ -61,14 +59,6 @@ export declare class EmbeddingManager {
      * Get embedding function for compatibility
      */
     getEmbeddingFunction(): EmbeddingFunction;
-    /**
-     * Get models directory path
-     * Note: In browser environments, returns a simple default path
-     * In Node.js, checks multiple locations for the models directory
-     */
-    private getModelsPath;
-    private modelsPathCache;
-    private resolveModelsPathSync;
     /**
      * Get memory usage in MB
      */