npm - @soulcraft/brainy - Versions diffs - 1.2.0 → 1.3.0 - Mend

@soulcraft/brainy 1.2.0 → 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

package/README.md +6 -8
package/dist/brainyData.d.ts +5 -2
package/dist/brainyData.js +57 -28
package/dist/critical/model-guardian.d.ts +56 -0
package/dist/critical/model-guardian.js +238 -0
package/dist/embeddings/model-manager.d.ts +27 -0
package/dist/embeddings/model-manager.js +189 -0
package/dist/utils/embedding.js +4 -0
package/package.json +5 -2

package/README.md CHANGED Viewed

@@ -200,7 +200,7 @@ const answer = await llm.generate(relevant + userQuery)  // Generate with contex
 await brain.add("The iPhone 15 Pro has a titanium design")
 await brain.add("Samsung Galaxy S24 features AI photography")
-const results = await brain.search("premium smartphones with metal build")
+const results = await brain.search("smartphones with metal build")
 // Returns: iPhone (titanium matches "metal build" semantically)
 ```
@@ -240,18 +240,17 @@ await sharedBrain.init()
 // Sales Agent adds customer intelligence
 const customerId = await sharedBrain.addNoun("Acme Corp", NounType.Organization)
-await sharedBrain.addVerb(customerId, "enterprise-plan", VerbType.InterestedIn, {
+await sharedBrain.addVerb(customerId, "business-plan", VerbType.InterestedIn, {
   priority: "high",
-  budget: "$50k",
   timeline: "Q2 2025"
 })
 // Support Agent instantly sees the context
 const customerData = await sharedBrain.getNounWithVerbs(customerId)
-// Support knows: customer interested in enterprise plan with $50k budget
+// Support knows: customer interested in business plan
 // Marketing Agent learns from both
-const insights = await sharedBrain.search("enterprise customers budget 50k", 10)
+const insights = await sharedBrain.search("business customers Q2", 10)
 // Marketing can create targeted campaigns for similar prospects
 ```
@@ -332,9 +331,8 @@ import { BrainyData, Cortex } from '@soulcraft/brainy'
 const brain = new BrainyData()
 const cortex = new Cortex()
-// Add premium augmentations (requires Brain Cloud subscription)
-brain.register(new AIMemory())
-brain.register(new AgentCoordinator())
+// Add augmentations to extend functionality
+brain.register(new CustomAugmentation())
 // Now your AI remembers everything across all sessions!
 await brain.add("User prefers TypeScript over JavaScript")

package/dist/brainyData.d.ts CHANGED Viewed

@@ -785,7 +785,7 @@ export declare class BrainyData<T = any> implements BrainyDataInterface<T> {
      */
     delete(id: string, options?: {
         service?: string;
-        soft?: boolean;
+        hard?: boolean;
         cascade?: boolean;
         force?: boolean;
     }): Promise<boolean>;
@@ -1336,9 +1336,12 @@ export declare class BrainyData<T = any> implements BrainyDataInterface<T> {
     /**
      * Get a configuration value with automatic decryption
      * @param key Configuration key
+     * @param options Options including decryption (auto-detected by default)
      * @returns Configuration value or undefined
      */
-    getConfig(key: string): Promise<any>;
+    getConfig(key: string, options?: {
+        decrypt?: boolean;
+    }): Promise<any>;
     /**
      * Encrypt data using universal crypto utilities
      */

package/dist/brainyData.js CHANGED Viewed

@@ -656,6 +656,22 @@ export class BrainyData {
             return;
         }
         this.isInitializing = true;
+        // CRITICAL: Ensure model is available before ANY operations
+        // This is THE most critical part of the system
+        // Without the model, users CANNOT access their data
+        if (typeof this.embeddingFunction === 'function') {
+            try {
+                const { modelGuardian } = await import('./critical/model-guardian.js');
+                await modelGuardian.ensureCriticalModel();
+            }
+            catch (error) {
+                console.error('🚨 CRITICAL: Model verification failed!');
+                console.error('Brainy cannot function without the transformer model.');
+                console.error('Users cannot access their data without it.');
+                this.isInitializing = false;
+                throw error;
+            }
+        }
         try {
             // Pre-load the embedding model early to ensure it's always available
             // This helps prevent issues with the Universal Sentence Encoder not being loaded
@@ -1936,10 +1952,14 @@ export class BrainyData {
                 offset: options.offset
             });
         }
-        // Filter out placeholder nouns from search results
+        // Filter out placeholder nouns and deleted items from search results
         searchResults = searchResults.filter((result) => {
             if (result.metadata && typeof result.metadata === 'object') {
                 const metadata = result.metadata;
+                // Exclude deleted items from search results (soft delete)
+                if (metadata.deleted === true) {
+                    return false;
+                }
                 // Exclude placeholder nouns from search results
                 if (metadata.isPlaceholder) {
                     return false;
@@ -2296,12 +2316,13 @@ export class BrainyData {
      * @returns Promise that resolves to true if the vector was deleted, false otherwise
      */
     async delete(id, options = {}) {
+        // Clear API: use 'hard: true' for hard delete, otherwise soft delete
+        const isHardDelete = options.hard === true;
         const opts = {
-            service: undefined,
-            soft: true, // Soft delete is default - preserves indexes
-            cascade: false,
-            force: false,
-            ...options
+            service: options.service,
+            soft: !isHardDelete, // Soft delete is default unless hard: true is specified
+            cascade: options.cascade || false,
+            force: options.force || false
         };
         // Validate id parameter first, before any other logic
         if (id === null || id === undefined) {
@@ -2331,11 +2352,17 @@ export class BrainyData {
             // Handle soft delete vs hard delete
             if (opts.soft) {
                 // Soft delete: just mark as deleted - metadata filter will exclude from search
-                return await this.updateMetadata(actualId, {
-                    deleted: true,
-                    deletedAt: new Date().toISOString(),
-                    deletedBy: opts.service || 'user'
-                });
+                try {
+                    return await this.updateMetadata(actualId, {
+                        deleted: true,
+                        deletedAt: new Date().toISOString(),
+                        deletedBy: opts.service || 'user'
+                    });
+                }
+                catch (error) {
+                    // If item doesn't exist, return false (delete of non-existent item is not an error)
+                    return false;
+                }
             }
             // Hard delete: Remove from index
             const removed = this.index.removeItem(actualId);
@@ -4818,34 +4845,36 @@ export class BrainyData {
      * @param options Options including encryption
      */
     async setConfig(key, value, options) {
-        const configNoun = {
+        // Use a predictable ID based on the config key
+        const configId = `config-${key}`;
+        // Store the config data in metadata (not as vectorized data)
+        const configValue = options?.encrypt ? await this.encryptData(JSON.stringify(value)) : value;
+        // Use simple text for vectorization
+        const searchableText = `Configuration setting for ${key}`;
+        await this.add(searchableText, {
+            nounType: NounType.State,
             configKey: key,
-            configValue: options?.encrypt ? await this.encryptData(JSON.stringify(value)) : value,
+            configValue: configValue,
             encrypted: !!options?.encrypt,
             timestamp: new Date().toISOString()
-        };
-        await this.add(configNoun, {
-            nounType: NounType.State,
-            configKey: key,
-            encrypted: !!options?.encrypt
-        });
+        }, { id: configId });
     }
     /**
      * Get a configuration value with automatic decryption
      * @param key Configuration key
+     * @param options Options including decryption (auto-detected by default)
      * @returns Configuration value or undefined
      */
-    async getConfig(key) {
+    async getConfig(key, options) {
         try {
-            const results = await this.search('', 1, {
-                nounTypes: [NounType.State],
-                metadata: { configKey: key }
-            });
-            if (results.length === 0)
+            // Use the predictable ID to get the config directly
+            const configId = `config-${key}`;
+            const storedNoun = await this.get(configId);
+            if (!storedNoun)
                 return undefined;
-            const configNoun = results[0];
-            const value = configNoun.data?.configValue || configNoun.metadata?.configValue;
-            const encrypted = configNoun.data?.encrypted || configNoun.metadata?.encrypted;
+            // The config data is now stored in metadata
+            const value = storedNoun.metadata?.configValue;
+            const encrypted = storedNoun.metadata?.encrypted;
             if (encrypted && typeof value === 'string') {
                 const decrypted = await this.decryptData(value);
                 return JSON.parse(decrypted);

package/dist/critical/model-guardian.d.ts ADDED Viewed

@@ -0,0 +1,56 @@
+/**
+ * MODEL GUARDIAN - CRITICAL PATH
+ *
+ * THIS IS THE MOST CRITICAL COMPONENT OF BRAINY
+ * Without the exact model, users CANNOT access their data
+ *
+ * Requirements:
+ * 1. Model MUST be Xenova/all-MiniLM-L6-v2 (never changes)
+ * 2. Model MUST be available at runtime
+ * 3. Model MUST produce consistent 384-dim embeddings
+ * 4. System MUST fail fast if model unavailable in production
+ */
+export declare class ModelGuardian {
+    private static instance;
+    private isVerified;
+    private modelPath;
+    private lastVerification;
+    private constructor();
+    static getInstance(): ModelGuardian;
+    /**
+     * CRITICAL: Verify model availability and integrity
+     * This MUST be called before any embedding operations
+     */
+    ensureCriticalModel(): Promise<void>;
+    /**
+     * Verify the local model files exist and are correct
+     */
+    private verifyLocalModel;
+    /**
+     * Download model from a fallback source
+     */
+    private downloadFromSource;
+    /**
+     * Configure transformers.js to use verified local model
+     */
+    private configureTransformers;
+    /**
+     * Detect where models should be stored
+     */
+    private detectModelPath;
+    /**
+     * Get model status for diagnostics
+     */
+    getStatus(): Promise<{
+        verified: boolean;
+        path: string;
+        lastVerification: Date | null;
+        modelName: string;
+        dimensions: number;
+    }>;
+    /**
+     * Force re-verification (for testing)
+     */
+    forceReverify(): Promise<void>;
+}
+export declare const modelGuardian: ModelGuardian;

package/dist/critical/model-guardian.js ADDED Viewed

@@ -0,0 +1,238 @@
+/**
+ * MODEL GUARDIAN - CRITICAL PATH
+ *
+ * THIS IS THE MOST CRITICAL COMPONENT OF BRAINY
+ * Without the exact model, users CANNOT access their data
+ *
+ * Requirements:
+ * 1. Model MUST be Xenova/all-MiniLM-L6-v2 (never changes)
+ * 2. Model MUST be available at runtime
+ * 3. Model MUST produce consistent 384-dim embeddings
+ * 4. System MUST fail fast if model unavailable in production
+ */
+import { existsSync } from 'fs';
+import { stat } from 'fs/promises';
+import { join, dirname } from 'path';
+import { env } from '@huggingface/transformers';
+// CRITICAL: These values MUST NEVER CHANGE
+const CRITICAL_MODEL_CONFIG = {
+    modelName: 'Xenova/all-MiniLM-L6-v2',
+    modelHash: {
+        // SHA256 of model.onnx - computed from actual model
+        'onnx/model.onnx': 'add_actual_hash_here',
+        'tokenizer.json': 'add_actual_hash_here'
+    },
+    modelSize: {
+        'onnx/model.onnx': 90555481, // Exact size in bytes
+        'tokenizer.json': 711661
+    },
+    embeddingDimensions: 384,
+    fallbackSources: [
+        // Primary: Our GitHub releases (we control this)
+        {
+            name: 'GitHub (Primary)',
+            url: 'https://github.com/soulcraftlabs/brainy-models/releases/download/v1.0.0/all-MiniLM-L6-v2.tar.gz',
+            type: 'tarball'
+        },
+        // Secondary: Our CDN (future, for speed)
+        {
+            name: 'Soulcraft CDN',
+            url: 'https://models.soulcraft.com/brainy/v1/all-MiniLM-L6-v2.tar.gz',
+            type: 'tarball'
+        },
+        // Tertiary: Hugging Face (original source)
+        {
+            name: 'Hugging Face',
+            url: 'huggingface',
+            type: 'transformers'
+        }
+    ]
+};
+export class ModelGuardian {
+    constructor() {
+        this.isVerified = false;
+        this.lastVerification = null;
+        this.modelPath = this.detectModelPath();
+    }
+    static getInstance() {
+        if (!ModelGuardian.instance) {
+            ModelGuardian.instance = new ModelGuardian();
+        }
+        return ModelGuardian.instance;
+    }
+    /**
+     * CRITICAL: Verify model availability and integrity
+     * This MUST be called before any embedding operations
+     */
+    async ensureCriticalModel() {
+        console.log('🛡️ MODEL GUARDIAN: Verifying critical model availability...');
+        // Check if already verified in this session
+        if (this.isVerified && this.lastVerification) {
+            const hoursSinceVerification = (Date.now() - this.lastVerification.getTime()) / (1000 * 60 * 60);
+            if (hoursSinceVerification < 24) {
+                console.log('✅ Model previously verified in this session');
+                return;
+            }
+        }
+        // Step 1: Check if model exists locally
+        const modelExists = await this.verifyLocalModel();
+        if (modelExists) {
+            console.log('✅ Critical model verified locally');
+            this.isVerified = true;
+            this.lastVerification = new Date();
+            this.configureTransformers();
+            return;
+        }
+        // Step 2: In production, FAIL FAST
+        if (process.env.NODE_ENV === 'production' && !process.env.BRAINY_ALLOW_RUNTIME_DOWNLOAD) {
+            throw new Error('🚨 CRITICAL FAILURE: Transformer model not found in production!\n' +
+                'The model is REQUIRED for Brainy to function.\n' +
+                'Users CANNOT access their data without it.\n' +
+                'Solution: Run "npm run download-models" during build stage.');
+        }
+        // Step 3: Attempt to download from fallback sources
+        console.warn('⚠️ Model not found locally, attempting download...');
+        for (const source of CRITICAL_MODEL_CONFIG.fallbackSources) {
+            try {
+                console.log(`📥 Trying ${source.name}...`);
+                await this.downloadFromSource(source);
+                // Verify the download
+                if (await this.verifyLocalModel()) {
+                    console.log(`✅ Successfully downloaded from ${source.name}`);
+                    this.isVerified = true;
+                    this.lastVerification = new Date();
+                    this.configureTransformers();
+                    return;
+                }
+            }
+            catch (error) {
+                console.warn(`❌ ${source.name} failed:`, error.message);
+            }
+        }
+        // Step 4: CRITICAL FAILURE
+        throw new Error('🚨 CRITICAL FAILURE: Cannot obtain transformer model!\n' +
+            'Tried all fallback sources.\n' +
+            'Brainy CANNOT function without the model.\n' +
+            'Users CANNOT access their data.\n' +
+            'Please check network connectivity or pre-download models.');
+    }
+    /**
+     * Verify the local model files exist and are correct
+     */
+    async verifyLocalModel() {
+        const modelBasePath = join(this.modelPath, ...CRITICAL_MODEL_CONFIG.modelName.split('/'));
+        // Check critical files
+        const criticalFiles = [
+            'onnx/model.onnx',
+            'tokenizer.json',
+            'config.json'
+        ];
+        for (const file of criticalFiles) {
+            const filePath = join(modelBasePath, file);
+            if (!existsSync(filePath)) {
+                console.log(`❌ Missing critical file: ${file}`);
+                return false;
+            }
+            // Verify size for critical files
+            if (CRITICAL_MODEL_CONFIG.modelSize[file]) {
+                const stats = await stat(filePath);
+                const expectedSize = CRITICAL_MODEL_CONFIG.modelSize[file];
+                if (Math.abs(stats.size - expectedSize) > 1000) { // Allow 1KB variance
+                    console.error(`❌ CRITICAL: Model file size mismatch!\n` +
+                        `File: ${file}\n` +
+                        `Expected: ${expectedSize} bytes\n` +
+                        `Actual: ${stats.size} bytes\n` +
+                        `This indicates model corruption or version mismatch!`);
+                    return false;
+                }
+            }
+            // TODO: Add SHA256 verification for ultimate security
+            // if (CRITICAL_MODEL_CONFIG.modelHash[file]) {
+            //   const hash = await this.computeFileHash(filePath)
+            //   if (hash !== CRITICAL_MODEL_CONFIG.modelHash[file]) {
+            //     console.error('❌ CRITICAL: Model hash mismatch!')
+            //     return false
+            //   }
+            // }
+        }
+        return true;
+    }
+    /**
+     * Download model from a fallback source
+     */
+    async downloadFromSource(source) {
+        if (source.type === 'transformers') {
+            // Use transformers.js native download
+            const { pipeline } = await import('@huggingface/transformers');
+            env.cacheDir = this.modelPath;
+            env.allowRemoteModels = true;
+            const extractor = await pipeline('feature-extraction', CRITICAL_MODEL_CONFIG.modelName);
+            // Test the model
+            const test = await extractor('test', { pooling: 'mean', normalize: true });
+            if (test.data.length !== CRITICAL_MODEL_CONFIG.embeddingDimensions) {
+                throw new Error(`CRITICAL: Model dimension mismatch! ` +
+                    `Expected ${CRITICAL_MODEL_CONFIG.embeddingDimensions}, ` +
+                    `got ${test.data.length}`);
+            }
+        }
+        else if (source.type === 'tarball') {
+            // Download and extract tarball
+            // This would require implementation with proper tar extraction
+            throw new Error('Tarball extraction not yet implemented');
+        }
+    }
+    /**
+     * Configure transformers.js to use verified local model
+     */
+    configureTransformers() {
+        env.localModelPath = this.modelPath;
+        env.allowRemoteModels = false; // Force local only after verification
+        console.log('🔒 Transformers configured to use verified local model');
+    }
+    /**
+     * Detect where models should be stored
+     */
+    detectModelPath() {
+        const candidates = [
+            process.env.BRAINY_MODELS_PATH,
+            './models',
+            join(process.cwd(), 'models'),
+            join(process.env.HOME || '', '.brainy', 'models'),
+            '/opt/models', // Lambda/container path
+            env.cacheDir
+        ];
+        for (const path of candidates) {
+            if (path && existsSync(path)) {
+                const modelPath = join(path, ...CRITICAL_MODEL_CONFIG.modelName.split('/'));
+                if (existsSync(join(modelPath, 'onnx', 'model.onnx'))) {
+                    return dirname(dirname(modelPath)); // Return base models directory
+                }
+            }
+        }
+        // Default
+        return './models';
+    }
+    /**
+     * Get model status for diagnostics
+     */
+    async getStatus() {
+        return {
+            verified: this.isVerified,
+            path: this.modelPath,
+            lastVerification: this.lastVerification,
+            modelName: CRITICAL_MODEL_CONFIG.modelName,
+            dimensions: CRITICAL_MODEL_CONFIG.embeddingDimensions
+        };
+    }
+    /**
+     * Force re-verification (for testing)
+     */
+    async forceReverify() {
+        this.isVerified = false;
+        this.lastVerification = null;
+        await this.ensureCriticalModel();
+    }
+}
+// Export singleton instance
+export const modelGuardian = ModelGuardian.getInstance();
+//# sourceMappingURL=model-guardian.js.map

package/dist/embeddings/model-manager.d.ts ADDED Viewed

@@ -0,0 +1,27 @@
+/**
+ * Model Manager - Ensures transformer models are available at runtime
+ *
+ * Strategy:
+ * 1. Check local cache first
+ * 2. Try GitHub releases (our backup)
+ * 3. Fall back to Hugging Face
+ * 4. Future: CDN at models.soulcraft.com
+ */
+export declare class ModelManager {
+    private static instance;
+    private modelsPath;
+    private isInitialized;
+    private constructor();
+    static getInstance(): ModelManager;
+    private getModelsPath;
+    ensureModels(modelName?: string): Promise<boolean>;
+    private verifyModelFiles;
+    private downloadFromGitHub;
+    private downloadFromCDN;
+    private configureTransformers;
+    /**
+     * Pre-download models for deployment
+     * This is what npm run download-models calls
+     */
+    static predownload(): Promise<void>;
+}

package/dist/embeddings/model-manager.js ADDED Viewed

@@ -0,0 +1,189 @@
+/**
+ * Model Manager - Ensures transformer models are available at runtime
+ *
+ * Strategy:
+ * 1. Check local cache first
+ * 2. Try GitHub releases (our backup)
+ * 3. Fall back to Hugging Face
+ * 4. Future: CDN at models.soulcraft.com
+ */
+import { existsSync } from 'fs';
+import { join, dirname } from 'path';
+import { env } from '@huggingface/transformers';
+// Model sources in order of preference
+const MODEL_SOURCES = {
+    // GitHub Release - our controlled backup
+    github: 'https://github.com/soulcraftlabs/brainy/releases/download/models-v1/all-MiniLM-L6-v2.tar.gz',
+    // Future CDN - fastest option when available
+    cdn: 'https://models.soulcraft.com/brainy/all-MiniLM-L6-v2.tar.gz',
+    // Original Hugging Face - fallback
+    huggingface: 'default' // Uses transformers.js default
+};
+// Expected model files and their hashes
+const MODEL_MANIFEST = {
+    'Xenova/all-MiniLM-L6-v2': {
+        files: {
+            'onnx/model.onnx': {
+                size: 90555481,
+                sha256: null // Will be computed from actual model
+            },
+            'tokenizer.json': {
+                size: 711661,
+                sha256: null
+            },
+            'config.json': {
+                size: 650,
+                sha256: null
+            },
+            'tokenizer_config.json': {
+                size: 366,
+                sha256: null
+            }
+        }
+    }
+};
+export class ModelManager {
+    constructor() {
+        this.isInitialized = false;
+        // Determine models path
+        this.modelsPath = this.getModelsPath();
+    }
+    static getInstance() {
+        if (!ModelManager.instance) {
+            ModelManager.instance = new ModelManager();
+        }
+        return ModelManager.instance;
+    }
+    getModelsPath() {
+        // Check various possible locations
+        const paths = [
+            process.env.BRAINY_MODELS_PATH,
+            './models',
+            join(process.cwd(), 'models'),
+            join(process.env.HOME || '', '.brainy', 'models'),
+            env.cacheDir
+        ];
+        // Find first existing path or use default
+        for (const path of paths) {
+            if (path && existsSync(path)) {
+                return path;
+            }
+        }
+        // Default to local models directory
+        return join(process.cwd(), 'models');
+    }
+    async ensureModels(modelName = 'Xenova/all-MiniLM-L6-v2') {
+        if (this.isInitialized) {
+            return true;
+        }
+        const modelPath = join(this.modelsPath, ...modelName.split('/'));
+        // Check if model already exists locally
+        if (await this.verifyModelFiles(modelPath, modelName)) {
+            console.log('✅ Models found in cache:', modelPath);
+            this.configureTransformers(modelPath);
+            this.isInitialized = true;
+            return true;
+        }
+        // Try to download from our sources
+        console.log('📥 Downloading transformer models...');
+        // Try GitHub first (our backup)
+        if (await this.downloadFromGitHub(modelName)) {
+            this.isInitialized = true;
+            return true;
+        }
+        // Try CDN (when available)
+        if (await this.downloadFromCDN(modelName)) {
+            this.isInitialized = true;
+            return true;
+        }
+        // Fall back to Hugging Face (default transformers.js behavior)
+        console.log('⚠️ Using Hugging Face fallback for models');
+        env.allowRemoteModels = true;
+        this.isInitialized = true;
+        return true;
+    }
+    async verifyModelFiles(modelPath, modelName) {
+        const manifest = MODEL_MANIFEST[modelName];
+        if (!manifest)
+            return false;
+        for (const [filePath, info] of Object.entries(manifest.files)) {
+            const fullPath = join(modelPath, filePath);
+            if (!existsSync(fullPath)) {
+                return false;
+            }
+            // Optionally verify size
+            if (process.env.VERIFY_MODEL_SIZE === 'true') {
+                const stats = await import('fs').then(fs => fs.promises.stat(fullPath));
+                if (stats.size !== info.size) {
+                    console.warn(`⚠️ Model file size mismatch: ${filePath}`);
+                    return false;
+                }
+            }
+        }
+        return true;
+    }
+    async downloadFromGitHub(modelName) {
+        try {
+            const url = MODEL_SOURCES.github;
+            console.log('📥 Downloading from GitHub releases...');
+            // Download tar.gz file
+            const response = await fetch(url);
+            if (!response.ok) {
+                throw new Error(`GitHub download failed: ${response.status}`);
+            }
+            const buffer = await response.arrayBuffer();
+            // Extract tar.gz (would need tar library in production)
+            // For now, return false to fall back to other methods
+            console.log('⚠️ GitHub model extraction not yet implemented');
+            return false;
+        }
+        catch (error) {
+            console.log('⚠️ GitHub download failed:', error.message);
+            return false;
+        }
+    }
+    async downloadFromCDN(modelName) {
+        try {
+            const url = MODEL_SOURCES.cdn;
+            console.log('📥 Downloading from Soulcraft CDN...');
+            // Try to fetch from CDN
+            const response = await fetch(url);
+            if (!response.ok) {
+                throw new Error(`CDN download failed: ${response.status}`);
+            }
+            // Would extract files here
+            console.log('⚠️ CDN not yet available');
+            return false;
+        }
+        catch (error) {
+            console.log('⚠️ CDN download failed:', error.message);
+            return false;
+        }
+    }
+    configureTransformers(modelPath) {
+        // Configure transformers.js to use our local models
+        env.localModelPath = dirname(modelPath);
+        env.allowRemoteModels = false;
+        console.log('🔧 Configured transformers.js to use local models');
+    }
+    /**
+     * Pre-download models for deployment
+     * This is what npm run download-models calls
+     */
+    static async predownload() {
+        const manager = ModelManager.getInstance();
+        const success = await manager.ensureModels();
+        if (!success) {
+            throw new Error('Failed to download models');
+        }
+        console.log('✅ Models downloaded successfully');
+    }
+}
+// Auto-initialize on import in production
+if (process.env.NODE_ENV === 'production' && process.env.SKIP_MODEL_CHECK !== 'true') {
+    ModelManager.getInstance().ensureModels().catch(error => {
+        console.error('⚠️ Model initialization failed:', error);
+        // Don't throw - allow app to start and try downloading on first use
+    });
+}
+//# sourceMappingURL=model-manager.js.map

package/dist/utils/embedding.js CHANGED Viewed

@@ -3,6 +3,7 @@
  * Complete rewrite to eliminate TensorFlow.js and use ONNX-based models
  */
 import { isBrowser } from './environment.js';
+import { ModelManager } from '../embeddings/model-manager.js';
 // @ts-ignore - Transformers.js is now the primary embedding library
 import { pipeline, env } from '@huggingface/transformers';
 /**
@@ -192,6 +193,9 @@ export class TransformerEmbedding {
         }
         // Always use real implementation - no mocking
         try {
+            // Ensure models are available (downloads if needed)
+            const modelManager = ModelManager.getInstance();
+            await modelManager.ensureModels(this.options.model);
             // Resolve device configuration and cache directory
             const device = await resolveDevice(this.options.device);
             const cacheDir = this.options.cacheDir === './models'

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@soulcraft/brainy",
-  "version": "1.2.0",
+  "version": "1.3.0",
   "description": "Multi-Dimensional AI Database - Vector similarity, graph relationships, metadata facets with HNSW indexing and OPFS storage",
   "main": "dist/index.js",
   "module": "dist/index.js",
@@ -142,7 +142,10 @@
     "_workflow:major": "node scripts/release-workflow.js major",
     "_workflow:dry-run": "npm run build && npm test && npm run _release:dry-run",
     "_dry-run": "npm pack --dry-run",
-    "download-models": "node scripts/download-models.cjs"
+    "download-models": "node scripts/download-models.cjs",
+    "prepare-models": "node scripts/prepare-models.js",
+    "models:verify": "node scripts/ensure-models.js",
+    "models:download": "BRAINY_ALLOW_REMOTE_MODELS=true node scripts/download-models.cjs"
   },
   "keywords": [
     "vector-database",