npm - monomind - Versions diffs - 1.10.56 → 1.11.0 - Mend

monomind 1.10.56 → 1.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (247) hide show

package/packages/@monomind/cli/dist/src/ruvector/lora-adapter.js DELETED Viewed

@@ -1,455 +0,0 @@
-/**
- * LoRA (Low-Rank Adaptation) Implementation
- *
- * Enables efficient fine-tuning by decomposing weight updates into low-rank matrices.
- * Dramatically reduces memory requirements while maintaining adaptation quality.
- *
- * Features:
- * - Rank decomposition (r << d) for memory efficiency
- * - Additive weight updates: W' = W + BA (where B ∈ R^{d×r}, A ∈ R^{r×k})
- * - Support for multiple adaptation heads
- * - Persistence to .swarm/lora-weights.json
- *
- * Memory savings:
- * - Original: d × k parameters
- * - LoRA: r × (d + k) parameters
- * - For d=384, k=384, r=8: 786,432 → 6,144 (128x reduction)
- *
- * @module lora-adapter
- */
-import { existsSync, mkdirSync, readFileSync, writeFileSync } from 'fs';
-import { dirname, join } from 'path';
-// ============================================================================
-// Types & Constants
-// ============================================================================
-/**
- * Default LoRA rank (determines memory/quality tradeoff)
- */
-export const DEFAULT_RANK = 8;
-/**
- * Input dimension (384 from ONNX MiniLM-L6-v2)
- */
-export const INPUT_DIM = 384;
-/**
- * Default output dimension (same as input for adapter)
- */
-export const OUTPUT_DIM = 384;
-/**
- * Default alpha scaling factor
- */
-export const DEFAULT_ALPHA = 16;
-// ============================================================================
-// Default Configuration
-// ============================================================================
-const DEFAULT_CONFIG = {
-    rank: DEFAULT_RANK,
-    alpha: DEFAULT_ALPHA,
-    inputDim: INPUT_DIM,
-    outputDim: OUTPUT_DIM,
-    learningRate: 0.001,
-    weightsPath: join(process.cwd(), '.swarm', 'lora-weights.json'),
-    enableDropout: true,
-    dropoutProb: 0.1,
-    autoSaveInterval: 50,
-};
-// ============================================================================
-// LoRA Adapter Class
-// ============================================================================
-/**
- * Low-Rank Adaptation module for efficient embedding fine-tuning
- */
-export class LoRAAdapter {
-    config;
-    weights;
-    totalAdaptations = 0;
-    totalUpdates = 0;
-    adaptationNormSum = 0;
-    lastUpdate = null;
-    updatesSinceLastSave = 0;
-    constructor(config) {
-        this.config = { ...DEFAULT_CONFIG, ...config };
-        this.weights = this.initializeWeights();
-    }
-    /**
-     * Initialize weights with Kaiming/He initialization
-     */
-    initializeWeights() {
-        const { rank, inputDim, outputDim, alpha } = this.config;
-        // A: rank × inputDim, initialized with Kaiming normal
-        const A = new Float32Array(rank * inputDim);
-        const stdA = Math.sqrt(2.0 / inputDim);
-        for (let i = 0; i < A.length; i++) {
-            A[i] = this.gaussianRandom() * stdA;
-        }
-        // B: outputDim × rank, initialized to zero (standard LoRA init)
-        const B = new Float32Array(outputDim * rank);
-        // B starts at zero so initial adaptation is zero
-        return {
-            A,
-            B,
-            scaling: alpha / rank,
-        };
-    }
-    /**
-     * Box-Muller transform for Gaussian random numbers
-     */
-    gaussianRandom() {
-        let u = 0, v = 0;
-        while (u === 0)
-            u = Math.random();
-        while (v === 0)
-            v = Math.random();
-        return Math.sqrt(-2.0 * Math.log(u)) * Math.cos(2.0 * Math.PI * v);
-    }
-    /**
-     * Initialize adapter and load persisted weights
-     */
-    async initialize() {
-        const loaded = this.loadWeights();
-        return { success: true, weightsLoaded: loaded };
-    }
-    /**
-     * Apply LoRA adaptation to an embedding
-     * output = input + scaling * (B @ A @ input)
-     */
-    adapt(input) {
-        const startTime = performance.now();
-        const { rank, inputDim, outputDim } = this.config;
-        const { A, B, scaling } = this.weights;
-        // Step 1: Compute A @ input (rank-dimensional)
-        const hidden = new Float32Array(rank);
-        for (let r = 0; r < rank; r++) {
-            let sum = 0;
-            const rowOffset = r * inputDim;
-            // Unroll by 4 for SIMD-friendly access
-            let i = 0;
-            for (; i + 3 < inputDim; i += 4) {
-                sum += A[rowOffset + i] * input[i];
-                sum += A[rowOffset + i + 1] * input[i + 1];
-                sum += A[rowOffset + i + 2] * input[i + 2];
-                sum += A[rowOffset + i + 3] * input[i + 3];
-            }
-            for (; i < inputDim; i++) {
-                sum += A[rowOffset + i] * input[i];
-            }
-            hidden[r] = sum;
-        }
-        // Optional dropout (during training inference, skip)
-        // In LoRA inference, we don't apply dropout
-        // Step 2: Compute B @ hidden (outputDim-dimensional)
-        const delta = new Float32Array(outputDim);
-        for (let o = 0; o < outputDim; o++) {
-            let sum = 0;
-            const rowOffset = o * rank;
-            for (let r = 0; r < rank; r++) {
-                sum += B[rowOffset + r] * hidden[r];
-            }
-            delta[o] = sum * scaling;
-        }
-        // Step 3: Add adaptation to input
-        const adapted = new Float32Array(outputDim);
-        let adaptationNorm = 0;
-        for (let i = 0; i < outputDim; i++) {
-            adapted[i] = input[i] + delta[i];
-            adaptationNorm += delta[i] * delta[i];
-        }
-        adaptationNorm = Math.sqrt(adaptationNorm);
-        // Update stats
-        this.totalAdaptations++;
-        this.adaptationNormSum += adaptationNorm;
-        const timeMs = performance.now() - startTime;
-        return { adapted, adaptationNorm, timeMs };
-    }
-    /**
-     * Train the adapter with a gradient signal
-     * Uses simplified update: A += lr * hidden^T @ grad, B += lr * grad @ hidden^T
-     */
-    train(input, gradOutput, reward = 1.0) {
-        const { rank, inputDim, outputDim, learningRate } = this.config;
-        const { A, B, scaling } = this.weights;
-        // Forward pass to get hidden states
-        const hidden = new Float32Array(rank);
-        for (let r = 0; r < rank; r++) {
-            let sum = 0;
-            const rowOffset = r * inputDim;
-            for (let i = 0; i < inputDim; i++) {
-                sum += A[rowOffset + i] * input[i];
-            }
-            hidden[r] = sum;
-        }
-        // Compute gradient for B: grad_B = gradOutput @ hidden^T
-        const scaledLr = learningRate * reward * scaling;
-        for (let o = 0; o < outputDim; o++) {
-            const rowOffset = o * rank;
-            for (let r = 0; r < rank; r++) {
-                B[rowOffset + r] += scaledLr * gradOutput[o] * hidden[r];
-            }
-        }
-        // Compute gradient for hidden: grad_hidden = B^T @ gradOutput
-        const gradHidden = new Float32Array(rank);
-        for (let r = 0; r < rank; r++) {
-            let sum = 0;
-            for (let o = 0; o < outputDim; o++) {
-                sum += B[o * rank + r] * gradOutput[o];
-            }
-            gradHidden[r] = sum;
-        }
-        // Compute gradient for A: grad_A = gradHidden @ input^T
-        for (let r = 0; r < rank; r++) {
-            const rowOffset = r * inputDim;
-            for (let i = 0; i < inputDim; i++) {
-                A[rowOffset + i] += scaledLr * gradHidden[r] * input[i];
-            }
-        }
-        // Compute loss (L2 norm of gradient)
-        let loss = 0;
-        for (let i = 0; i < gradOutput.length; i++) {
-            loss += gradOutput[i] * gradOutput[i];
-        }
-        loss = Math.sqrt(loss);
-        // Update counters
-        this.totalUpdates++;
-        this.lastUpdate = Date.now();
-        this.updatesSinceLastSave++;
-        // Auto-save if needed
-        if (this.updatesSinceLastSave >= this.config.autoSaveInterval) {
-            this.saveWeights();
-            this.updatesSinceLastSave = 0;
-        }
-        return { updated: true, loss };
-    }
-    /**
-     * Merge LoRA weights into base weights (for deployment)
-     * Returns: W' = W + scaling * B @ A
-     */
-    merge(baseWeights) {
-        const { rank, inputDim, outputDim } = this.config;
-        const { A, B, scaling } = this.weights;
-        // Compute BA product
-        const merged = new Float32Array(baseWeights);
-        for (let o = 0; o < outputDim; o++) {
-            for (let i = 0; i < inputDim; i++) {
-                let sum = 0;
-                for (let r = 0; r < rank; r++) {
-                    sum += B[o * rank + r] * A[r * inputDim + i];
-                }
-                merged[o * inputDim + i] += scaling * sum;
-            }
-        }
-        return merged;
-    }
-    /**
-     * Get current statistics
-     */
-    getStats() {
-        const { rank, inputDim, outputDim } = this.config;
-        const originalParams = inputDim * outputDim;
-        const loraParams = rank * (inputDim + outputDim);
-        return {
-            totalAdaptations: this.totalAdaptations,
-            totalUpdates: this.totalUpdates,
-            rank: this.config.rank,
-            compressionRatio: originalParams / loraParams,
-            avgAdaptationNorm: this.totalAdaptations > 0
-                ? this.adaptationNormSum / this.totalAdaptations
-                : 0,
-            lastUpdate: this.lastUpdate,
-        };
-    }
-    /**
-     * Reset adapter to initial state
-     */
-    reset() {
-        this.weights = this.initializeWeights();
-        this.totalAdaptations = 0;
-        this.totalUpdates = 0;
-        this.adaptationNormSum = 0;
-        this.lastUpdate = null;
-        this.updatesSinceLastSave = 0;
-    }
-    /**
-     * Save weights to disk
-     */
-    saveWeights() {
-        try {
-            const dir = dirname(this.config.weightsPath);
-            if (!existsSync(dir)) {
-                mkdirSync(dir, { recursive: true });
-            }
-            const data = {
-                version: 1,
-                config: {
-                    rank: this.config.rank,
-                    alpha: this.config.alpha,
-                    inputDim: this.config.inputDim,
-                    outputDim: this.config.outputDim,
-                },
-                weights: {
-                    A: Array.from(this.weights.A),
-                    B: Array.from(this.weights.B),
-                    scaling: this.weights.scaling,
-                },
-                stats: {
-                    totalAdaptations: this.totalAdaptations,
-                    totalUpdates: this.totalUpdates,
-                    adaptationNormSum: this.adaptationNormSum,
-                    lastUpdate: this.lastUpdate,
-                },
-                savedAt: new Date().toISOString(),
-            };
-            writeFileSync(this.config.weightsPath, JSON.stringify(data, null, 2));
-            return true;
-        }
-        catch {
-            return false;
-        }
-    }
-    /**
-     * Load weights from disk
-     */
-    loadWeights() {
-        try {
-            if (!existsSync(this.config.weightsPath)) {
-                return false;
-            }
-            const content = readFileSync(this.config.weightsPath, 'utf-8');
-            const data = JSON.parse(content);
-            if (data.version !== 1) {
-                return false;
-            }
-            // Verify dimensions match
-            const { rank, inputDim, outputDim } = data.config;
-            if (rank !== this.config.rank ||
-                inputDim !== this.config.inputDim ||
-                outputDim !== this.config.outputDim) {
-                return false;
-            }
-            // Load weights
-            this.weights = {
-                A: new Float32Array(data.weights.A),
-                B: new Float32Array(data.weights.B),
-                scaling: data.weights.scaling,
-            };
-            // Load stats
-            this.totalAdaptations = data.stats.totalAdaptations || 0;
-            this.totalUpdates = data.stats.totalUpdates || 0;
-            this.adaptationNormSum = data.stats.adaptationNormSum || 0;
-            this.lastUpdate = data.stats.lastUpdate || null;
-            return true;
-        }
-        catch {
-            return false;
-        }
-    }
-    /**
-     * Export weights as JSON
-     */
-    exportWeights() {
-        return {
-            A: Array.from(this.weights.A),
-            B: Array.from(this.weights.B),
-            scaling: this.weights.scaling,
-            config: {
-                rank: this.config.rank,
-                alpha: this.config.alpha,
-                inputDim: this.config.inputDim,
-                outputDim: this.config.outputDim,
-            },
-        };
-    }
-    /**
-     * Import weights from JSON
-     */
-    importWeights(data) {
-        try {
-            const { rank, inputDim, outputDim } = this.config;
-            if (data.A.length !== rank * inputDim ||
-                data.B.length !== outputDim * rank) {
-                return false;
-            }
-            this.weights = {
-                A: new Float32Array(data.A),
-                B: new Float32Array(data.B),
-                scaling: data.scaling,
-            };
-            return true;
-        }
-        catch {
-            return false;
-        }
-    }
-}
-// ============================================================================
-// Singleton & Factory Functions
-// ============================================================================
-let loraInstance = null;
-let initPromise = null;
-/**
- * Get or create singleton LoRA adapter instance
- */
-export async function getLoRAAdapter() {
-    if (loraInstance) {
-        return loraInstance;
-    }
-    if (initPromise) {
-        return initPromise;
-    }
-    initPromise = (async () => {
-        const adapter = new LoRAAdapter();
-        await adapter.initialize();
-        loraInstance = adapter;
-        return adapter;
-    })();
-    return initPromise;
-}
-/**
- * Reset singleton instance (for testing)
- */
-export function resetLoRAAdapter() {
-    if (loraInstance) {
-        loraInstance.reset();
-    }
-    loraInstance = null;
-    initPromise = null;
-}
-/**
- * Create new LoRA adapter instance (factory)
- */
-export function createLoRAAdapter(config) {
-    return new LoRAAdapter(config);
-}
-/**
- * Quick adaptation (convenience function)
- */
-export async function adaptEmbedding(input) {
-    const adapter = await getLoRAAdapter();
-    return adapter.adapt(input);
-}
-/**
- * Quick training (convenience function)
- */
-export async function trainLoRA(input, gradOutput, reward) {
-    const adapter = await getLoRAAdapter();
-    return adapter.train(input, gradOutput, reward);
-}
-/**
- * Get LoRA statistics (convenience function)
- */
-export async function getLoRAStats() {
-    const adapter = await getLoRAAdapter();
-    return adapter.getStats();
-}
-export default {
-    LoRAAdapter,
-    getLoRAAdapter,
-    resetLoRAAdapter,
-    createLoRAAdapter,
-    adaptEmbedding,
-    trainLoRA,
-    getLoRAStats,
-    DEFAULT_RANK,
-    DEFAULT_ALPHA,
-    INPUT_DIM,
-    OUTPUT_DIM,
-};
-//# sourceMappingURL=lora-adapter.js.map

package/packages/@monomind/cli/dist/src/ruvector/model-router.d.ts DELETED Viewed

@@ -1,222 +0,0 @@
-/**
- * Intelligent Model Router using Tiny Dancer
- *
- * Dynamically routes requests to optimal Claude model (haiku/sonnet/opus)
- * based on task complexity, confidence scores, and historical performance.
- *
- * Features:
- * - FastGRNN-based routing decisions (<100μs)
- * - Uncertainty quantification for model escalation
- * - Circuit breaker for failover
- * - Online learning from routing outcomes
- * - Complexity scoring via embeddings
- *
- * Routing Strategy:
- * - Haiku: High confidence, low complexity (fast, cheap)
- * - Sonnet: Medium confidence, moderate complexity (balanced)
- * - Opus: Low confidence, high complexity (most capable)
- *
- * @module model-router
- */
-/**
- * Available Claude models for routing
- */
-export type ClaudeModel = 'haiku' | 'sonnet' | 'opus' | 'inherit';
-/**
- * Model capabilities and characteristics
- */
-export declare const MODEL_CAPABILITIES: Record<ClaudeModel, {
-    maxComplexity: number;
-    costMultiplier: number;
-    speedMultiplier: number;
-    description: string;
-}>;
-/**
- * Complexity indicators for task classification
- */
-export declare const COMPLEXITY_INDICATORS: {
-    high: string[];
-    medium: string[];
-    low: string[];
-};
-/**
- * Model router configuration
- */
-export interface ModelRouterConfig {
-    /** Confidence threshold for model selection (default: 0.85) */
-    confidenceThreshold: number;
-    /** Maximum uncertainty before escalating (default: 0.15) */
-    maxUncertainty: number;
-    /** Enable circuit breaker (default: true) */
-    enableCircuitBreaker: boolean;
-    /** Failures before circuit opens (default: 5) */
-    circuitBreakerThreshold: number;
-    /** Path for router state persistence */
-    statePath: string;
-    /** Auto-save interval in decisions (default: 20) */
-    autoSaveInterval: number;
-    /** Enable cost optimization (default: true) */
-    enableCostOptimization: boolean;
-    /** Prefer faster models when confidence is high (default: true) */
-    preferSpeed: boolean;
-}
-/**
- * Routing decision result
- */
-export interface ModelRoutingResult {
-    /** Selected model */
-    model: ClaudeModel;
-    /** Confidence in the decision (0-1) */
-    confidence: number;
-    /** Uncertainty estimate (0-1) */
-    uncertainty: number;
-    /** Computed complexity score (0-1) */
-    complexity: number;
-    /** Reasoning for the selection */
-    reasoning: string;
-    /** Alternative models considered */
-    alternatives: Array<{
-        model: ClaudeModel;
-        score: number;
-    }>;
-    /** Inference time in microseconds */
-    inferenceTimeUs: number;
-    /** Estimated cost multiplier */
-    costMultiplier: number;
-}
-/**
- * Complexity analysis result
- */
-export interface ComplexityAnalysis {
-    /** Overall complexity score (0-1) */
-    score: number;
-    /** Indicators found */
-    indicators: {
-        high: string[];
-        medium: string[];
-        low: string[];
-    };
-    /** Feature breakdown */
-    features: {
-        lexicalComplexity: number;
-        semanticDepth: number;
-        taskScope: number;
-        uncertaintyLevel: number;
-    };
-}
-/**
- * Intelligent Model Router using complexity-based routing
- */
-export declare class ModelRouter {
-    private config;
-    private state;
-    private decisionCount;
-    private consecutiveFailures;
-    constructor(config?: Partial<ModelRouterConfig>);
-    /**
-     * Route a task to the optimal model
-     */
-    route(task: string, embedding?: number[]): Promise<ModelRoutingResult>;
-    /**
-     * Analyze task complexity
-     */
-    analyzeComplexity(task: string, embedding?: number[]): ComplexityAnalysis;
-    /**
-     * Compute lexical complexity from text features
-     */
-    private computeLexicalComplexity;
-    /**
-     * Compute semantic depth from indicators and embedding
-     */
-    private computeSemanticDepth;
-    /**
-     * Compute task scope from content analysis
-     */
-    private computeTaskScope;
-    /**
-     * Compute uncertainty level from task phrasing
-     */
-    private computeUncertaintyLevel;
-    /**
-     * Compute scores for each model
-     */
-    private computeModelScores;
-    /**
-     * Apply circuit breaker adjustments
-     */
-    private applyCircuitBreaker;
-    /**
-     * Select the best model from scores
-     */
-    private selectModel;
-    /**
-     * Build human-readable reasoning
-     */
-    private buildReasoning;
-    /**
-     * Track routing decision for learning
-     */
-    private trackDecision;
-    /**
-     * Record outcome for learning
-     */
-    recordOutcome(task: string, model: ClaudeModel, outcome: 'success' | 'failure' | 'escalated', complexity?: number): void;
-    /**
-     * Get router statistics
-     */
-    getStats(): {
-        totalDecisions: number;
-        modelDistribution: Record<ClaudeModel, number>;
-        avgComplexity: number;
-        avgConfidence: number;
-        circuitBreakerTrips: number;
-        consecutiveFailures: Record<ClaudeModel, number>;
-    };
-    /**
-     * Load state from disk
-     */
-    private loadState;
-    /**
-     * Save state to disk
-     */
-    private saveState;
-    /**
-     * Reset router state
-     */
-    reset(): void;
-}
-/**
- * Get or create the singleton ModelRouter instance.
- * Throws if called with a config that differs from the one used to create
- * the existing instance — silent config mismatch causes hard-to-debug routing bugs.
- */
-export declare function getModelRouter(config?: Partial<ModelRouterConfig>): ModelRouter;
-/**
- * Reset the singleton instance
- */
-export declare function resetModelRouter(): void;
-/**
- * Create a new ModelRouter instance (non-singleton)
- */
-export declare function createModelRouter(config?: Partial<ModelRouterConfig>): ModelRouter;
-/**
- * Quick route function for common use case
- */
-export declare function routeToModel(task: string): Promise<ClaudeModel>;
-/**
- * Route with full result
- */
-export declare function routeToModelFull(task: string, embedding?: number[]): Promise<ModelRoutingResult>;
-/**
- * Analyze task complexity without routing
- */
-export declare function analyzeTaskComplexity(task: string): ComplexityAnalysis;
-/**
- * Get model router statistics
- */
-export declare function getModelRouterStats(): ReturnType<ModelRouter['getStats']>;
-/**
- * Record routing outcome for learning
- */
-export declare function recordModelOutcome(task: string, model: ClaudeModel, outcome: 'success' | 'failure' | 'escalated'): void;
-//# sourceMappingURL=model-router.d.ts.map