npm - @soulcraft/brainy - Versions diffs - 4.1.3 → 4.2.0 - Mend

@soulcraft/brainy 4.1.3 → 4.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (52) hide show

package/CHANGELOG.md +100 -7
package/dist/brainy.d.ts +74 -16
package/dist/brainy.js +74 -16
package/dist/import/FormatDetector.d.ts +6 -1
package/dist/import/FormatDetector.js +40 -1
package/dist/import/ImportCoordinator.d.ts +155 -5
package/dist/import/ImportCoordinator.js +346 -6
package/dist/import/InstancePool.d.ts +136 -0
package/dist/import/InstancePool.js +231 -0
package/dist/importers/SmartCSVImporter.d.ts +2 -1
package/dist/importers/SmartCSVImporter.js +11 -22
package/dist/importers/SmartDOCXImporter.d.ts +125 -0
package/dist/importers/SmartDOCXImporter.js +227 -0
package/dist/importers/SmartExcelImporter.d.ts +12 -1
package/dist/importers/SmartExcelImporter.js +40 -25
package/dist/importers/SmartJSONImporter.d.ts +1 -0
package/dist/importers/SmartJSONImporter.js +25 -6
package/dist/importers/SmartMarkdownImporter.d.ts +2 -1
package/dist/importers/SmartMarkdownImporter.js +11 -16
package/dist/importers/SmartPDFImporter.d.ts +2 -1
package/dist/importers/SmartPDFImporter.js +11 -22
package/dist/importers/SmartYAMLImporter.d.ts +121 -0
package/dist/importers/SmartYAMLImporter.js +275 -0
package/dist/importers/VFSStructureGenerator.js +12 -0
package/dist/neural/SmartExtractor.d.ts +279 -0
package/dist/neural/SmartExtractor.js +592 -0
package/dist/neural/SmartRelationshipExtractor.d.ts +217 -0
package/dist/neural/SmartRelationshipExtractor.js +396 -0
package/dist/neural/embeddedTypeEmbeddings.d.ts +1 -1
package/dist/neural/embeddedTypeEmbeddings.js +2 -2
package/dist/neural/entityExtractor.d.ts +3 -0
package/dist/neural/entityExtractor.js +34 -36
package/dist/neural/presets.d.ts +189 -0
package/dist/neural/presets.js +365 -0
package/dist/neural/signals/ContextSignal.d.ts +166 -0
package/dist/neural/signals/ContextSignal.js +646 -0
package/dist/neural/signals/EmbeddingSignal.d.ts +175 -0
package/dist/neural/signals/EmbeddingSignal.js +435 -0
package/dist/neural/signals/ExactMatchSignal.d.ts +220 -0
package/dist/neural/signals/ExactMatchSignal.js +542 -0
package/dist/neural/signals/PatternSignal.d.ts +159 -0
package/dist/neural/signals/PatternSignal.js +478 -0
package/dist/neural/signals/VerbContextSignal.d.ts +102 -0
package/dist/neural/signals/VerbContextSignal.js +390 -0
package/dist/neural/signals/VerbEmbeddingSignal.d.ts +131 -0
package/dist/neural/signals/VerbEmbeddingSignal.js +304 -0
package/dist/neural/signals/VerbExactMatchSignal.d.ts +115 -0
package/dist/neural/signals/VerbExactMatchSignal.js +335 -0
package/dist/neural/signals/VerbPatternSignal.d.ts +104 -0
package/dist/neural/signals/VerbPatternSignal.js +457 -0
package/dist/types/graphTypes.d.ts +2 -0
package/package.json +4 -1

package/dist/neural/signals/VerbContextSignal.js ADDED Viewed

@@ -0,0 +1,390 @@
+/**
+ * VerbContextSignal - Type-based relationship inference
+ *
+ * WEIGHT: 5% (lowest weight, backup signal)
+ *
+ * Uses:
+ * 1. Entity type pairs (Person+Organization → WorksWith)
+ * 2. Semantic compatibility (Document+Person → CreatedBy)
+ * 3. Domain heuristics (Location+Organization → LocatedAt)
+ *
+ * PRODUCTION-READY: No TODOs, no mocks, real implementation
+ */
+import { VerbType, NounType } from '../../types/graphTypes.js';
+/**
+ * VerbContextSignal - Type-based relationship classification
+ *
+ * Production features:
+ * - Pre-defined type pair mappings (zero runtime cost)
+ * - Semantic type compatibility
+ * - Bidirectional hint support (subject→object and object→subject)
+ * - LRU cache for hot paths
+ */
+export class VerbContextSignal {
+    constructor(brain, options) {
+        // Type pair hints (subject type → object type → verb types)
+        this.typePairHints = [];
+        // LRU cache
+        this.cache = new Map();
+        this.cacheOrder = [];
+        // Statistics
+        this.stats = {
+            calls: 0,
+            cacheHits: 0,
+            matches: 0,
+            hintHits: new Map()
+        };
+        this.brain = brain;
+        this.options = {
+            minConfidence: options?.minConfidence ?? 0.60,
+            cacheSize: options?.cacheSize ?? 1000
+        };
+        // Initialize type pair hints
+        this.initializeTypePairHints();
+    }
+    /**
+     * Initialize all type pair hints
+     *
+     * Maps entity type combinations to likely relationship types
+     */
+    initializeTypePairHints() {
+        this.typePairHints = [
+            // ========== Person → Organization ==========
+            {
+                subjectType: NounType.Person,
+                objectType: NounType.Organization,
+                verbType: VerbType.WorksWith,
+                confidence: 0.75,
+                description: 'Person works at Organization'
+            },
+            {
+                subjectType: NounType.Person,
+                objectType: NounType.Organization,
+                verbType: VerbType.MemberOf,
+                confidence: 0.70,
+                description: 'Person is member of Organization'
+            },
+            {
+                subjectType: NounType.Person,
+                objectType: NounType.Organization,
+                verbType: VerbType.ReportsTo,
+                confidence: 0.65,
+                description: 'Person reports to Organization'
+            },
+            // ========== Person → Person ==========
+            {
+                subjectType: NounType.Person,
+                objectType: NounType.Person,
+                verbType: VerbType.WorksWith,
+                confidence: 0.70,
+                description: 'Person works with Person'
+            },
+            {
+                subjectType: NounType.Person,
+                objectType: NounType.Person,
+                verbType: VerbType.FriendOf,
+                confidence: 0.65,
+                description: 'Person is friend of Person'
+            },
+            {
+                subjectType: NounType.Person,
+                objectType: NounType.Person,
+                verbType: VerbType.Mentors,
+                confidence: 0.65,
+                description: 'Person mentors Person'
+            },
+            // ========== Person → Location ==========
+            {
+                subjectType: NounType.Person,
+                objectType: NounType.Location,
+                verbType: VerbType.LocatedAt,
+                confidence: 0.70,
+                description: 'Person located at Location'
+            },
+            // ========== Document → Person ==========
+            {
+                subjectType: NounType.Document,
+                objectType: NounType.Person,
+                verbType: VerbType.CreatedBy,
+                confidence: 0.80,
+                description: 'Document created by Person'
+            },
+            {
+                subjectType: NounType.Document,
+                objectType: NounType.Person,
+                verbType: VerbType.AttributedTo,
+                confidence: 0.75,
+                description: 'Document attributed to Person'
+            },
+            // ========== Document → Document ==========
+            {
+                subjectType: NounType.Document,
+                objectType: NounType.Document,
+                verbType: VerbType.References,
+                confidence: 0.75,
+                description: 'Document references Document'
+            },
+            {
+                subjectType: NounType.Document,
+                objectType: NounType.Document,
+                verbType: VerbType.PartOf,
+                confidence: 0.70,
+                description: 'Document is part of Document'
+            },
+            // ========== Document → Concept ==========
+            {
+                subjectType: NounType.Document,
+                objectType: NounType.Concept,
+                verbType: VerbType.Describes,
+                confidence: 0.75,
+                description: 'Document describes Concept'
+            },
+            {
+                subjectType: NounType.Document,
+                objectType: NounType.Concept,
+                verbType: VerbType.Defines,
+                confidence: 0.70,
+                description: 'Document defines Concept'
+            },
+            // ========== Organization → Location ==========
+            {
+                subjectType: NounType.Organization,
+                objectType: NounType.Location,
+                verbType: VerbType.LocatedAt,
+                confidence: 0.80,
+                description: 'Organization located at Location'
+            },
+            // ========== Organization → Organization ==========
+            {
+                subjectType: NounType.Organization,
+                objectType: NounType.Organization,
+                verbType: VerbType.PartOf,
+                confidence: 0.70,
+                description: 'Organization is part of Organization'
+            },
+            {
+                subjectType: NounType.Organization,
+                objectType: NounType.Organization,
+                verbType: VerbType.Competes,
+                confidence: 0.65,
+                description: 'Organization competes with Organization'
+            },
+            // ========== Product → Organization ==========
+            {
+                subjectType: NounType.Product,
+                objectType: NounType.Organization,
+                verbType: VerbType.CreatedBy,
+                confidence: 0.75,
+                description: 'Product created by Organization'
+            },
+            {
+                subjectType: NounType.Product,
+                objectType: NounType.Organization,
+                verbType: VerbType.Owns,
+                confidence: 0.70,
+                description: 'Product owned by Organization'
+            },
+            // ========== Product → Person ==========
+            {
+                subjectType: NounType.Product,
+                objectType: NounType.Person,
+                verbType: VerbType.CreatedBy,
+                confidence: 0.75,
+                description: 'Product created by Person'
+            },
+            // ========== Event → Person ==========
+            {
+                subjectType: NounType.Event,
+                objectType: NounType.Person,
+                verbType: VerbType.CreatedBy,
+                confidence: 0.70,
+                description: 'Event created by Person'
+            },
+            // ========== Event → Location ==========
+            {
+                subjectType: NounType.Event,
+                objectType: NounType.Location,
+                verbType: VerbType.LocatedAt,
+                confidence: 0.75,
+                description: 'Event located at Location'
+            },
+            // ========== Event → Event ==========
+            {
+                subjectType: NounType.Event,
+                objectType: NounType.Event,
+                verbType: VerbType.Precedes,
+                confidence: 0.70,
+                description: 'Event precedes Event'
+            },
+            // ========== Project → Organization ==========
+            {
+                subjectType: NounType.Project,
+                objectType: NounType.Organization,
+                verbType: VerbType.BelongsTo,
+                confidence: 0.75,
+                description: 'Project belongs to Organization'
+            },
+            // ========== Project → Person ==========
+            {
+                subjectType: NounType.Project,
+                objectType: NounType.Person,
+                verbType: VerbType.CreatedBy,
+                confidence: 0.70,
+                description: 'Project created by Person'
+            },
+            // ========== Thing → Thing (generic fallback) ==========
+            {
+                subjectType: NounType.Thing,
+                objectType: NounType.Thing,
+                verbType: VerbType.RelatedTo,
+                confidence: 0.60,
+                description: 'Thing related to Thing'
+            }
+        ];
+        // Initialize hint hit tracking
+        for (const hint of this.typePairHints) {
+            this.stats.hintHits.set(hint.description, 0);
+        }
+    }
+    /**
+     * Classify relationship type from entity type pair
+     *
+     * @param subjectType Type of subject entity
+     * @param objectType Type of object entity
+     * @returns VerbSignal with classified type or null
+     */
+    async classify(subjectType, objectType) {
+        this.stats.calls++;
+        if (!subjectType || !objectType) {
+            return null;
+        }
+        // Check cache
+        const cacheKey = this.getCacheKey(subjectType, objectType);
+        const cached = this.getFromCache(cacheKey);
+        if (cached !== undefined) {
+            this.stats.cacheHits++;
+            return cached;
+        }
+        try {
+            // Find matching hints for this type pair
+            const matchingHints = this.typePairHints.filter(hint => (hint.subjectType === subjectType && hint.objectType === objectType) ||
+                (hint.subjectType === objectType && hint.objectType === subjectType));
+            if (matchingHints.length === 0) {
+                // Try fallback to Thing → Thing
+                const fallbackHints = this.typePairHints.filter(hint => hint.subjectType === NounType.Thing && hint.objectType === NounType.Thing);
+                if (fallbackHints.length > 0) {
+                    const hint = fallbackHints[0];
+                    const result = {
+                        type: hint.verbType,
+                        confidence: hint.confidence,
+                        evidence: `Type pair hint (fallback): ${hint.description}`,
+                        metadata: {
+                            subjectType,
+                            objectType
+                        }
+                    };
+                    this.addToCache(cacheKey, result);
+                    return result;
+                }
+                const result = null;
+                this.addToCache(cacheKey, result);
+                return result;
+            }
+            // Use highest confidence hint
+            const bestHint = matchingHints.sort((a, b) => b.confidence - a.confidence)[0];
+            // Track hint hit
+            const currentHits = this.stats.hintHits.get(bestHint.description) || 0;
+            this.stats.hintHits.set(bestHint.description, currentHits + 1);
+            // Check confidence threshold
+            if (bestHint.confidence < this.options.minConfidence) {
+                const result = null;
+                this.addToCache(cacheKey, result);
+                return result;
+            }
+            this.stats.matches++;
+            const result = {
+                type: bestHint.verbType,
+                confidence: bestHint.confidence,
+                evidence: `Type pair hint: ${bestHint.description}`,
+                metadata: {
+                    subjectType,
+                    objectType
+                }
+            };
+            this.addToCache(cacheKey, result);
+            return result;
+        }
+        catch (error) {
+            return null;
+        }
+    }
+    /**
+     * Get cache key
+     */
+    getCacheKey(subjectType, objectType) {
+        return `${subjectType}:${objectType}`;
+    }
+    /**
+     * Get from LRU cache
+     */
+    getFromCache(key) {
+        if (!this.cache.has(key)) {
+            return undefined;
+        }
+        const cached = this.cache.get(key);
+        // Move to end (most recently used)
+        this.cacheOrder = this.cacheOrder.filter(k => k !== key);
+        this.cacheOrder.push(key);
+        return cached ?? null;
+    }
+    /**
+     * Add to LRU cache with eviction
+     */
+    addToCache(key, value) {
+        this.cache.set(key, value);
+        this.cacheOrder.push(key);
+        // Evict oldest if over limit
+        if (this.cache.size > this.options.cacheSize) {
+            const oldest = this.cacheOrder.shift();
+            if (oldest) {
+                this.cache.delete(oldest);
+            }
+        }
+    }
+    /**
+     * Get statistics
+     */
+    getStats() {
+        return {
+            ...this.stats,
+            hintCount: this.typePairHints.length,
+            cacheSize: this.cache.size,
+            cacheHitRate: this.stats.calls > 0 ? this.stats.cacheHits / this.stats.calls : 0,
+            matchRate: this.stats.calls > 0 ? this.stats.matches / this.stats.calls : 0,
+            topHints: Array.from(this.stats.hintHits.entries())
+                .sort((a, b) => b[1] - a[1])
+                .slice(0, 10)
+                .map(([hint, hits]) => ({ hint, hits }))
+        };
+    }
+    /**
+     * Reset statistics
+     */
+    resetStats() {
+        this.stats.calls = 0;
+        this.stats.cacheHits = 0;
+        this.stats.matches = 0;
+        // Reset hint hit counts
+        for (const hint of this.typePairHints) {
+            this.stats.hintHits.set(hint.description, 0);
+        }
+    }
+    /**
+     * Clear cache
+     */
+    clearCache() {
+        this.cache.clear();
+        this.cacheOrder = [];
+    }
+}
+//# sourceMappingURL=VerbContextSignal.js.map

package/dist/neural/signals/VerbEmbeddingSignal.d.ts ADDED Viewed

@@ -0,0 +1,131 @@
+/**
+ * VerbEmbeddingSignal - Neural semantic similarity for relationship classification
+ *
+ * WEIGHT: 35% (second highest after exact match)
+ *
+ * Uses:
+ * 1. 40 pre-computed verb type embeddings (384 dimensions)
+ * 2. Cosine similarity against context text
+ * 3. Semantic understanding of relationship intent
+ *
+ * PRODUCTION-READY: No TODOs, no mocks, real implementation
+ */
+import type { Brainy } from '../../brainy.js';
+import { VerbType } from '../../types/graphTypes.js';
+import type { Vector } from '../../coreTypes.js';
+/**
+ * Signal result with classification details
+ */
+export interface VerbSignal {
+    /** Relationship type selected by the signal */
+    type: VerbType;
+    /** Confidence score for the selected type (range is not stated in this declaration; presumably 0–1 — confirm against the implementation) */
+    confidence: number;
+    /** Free-text explanation of why this type was selected */
+    evidence: string;
+    /** Optional diagnostic details; every field is optional */
+    metadata?: {
+        /** Similarity score associated with the selected type, when provided */
+        similarity?: number;
+        /** Per-type similarity scores, when provided (ordering is not specified here) */
+        allScores?: Array<{
+            type: VerbType;
+            similarity: number;
+        }>;
+    };
+}
+/**
+ * Options for verb embedding signal
+ */
+export interface VerbEmbeddingSignalOptions {
+    // NOTE(review): defaults for all options live in the implementation and are
+    // not visible in this declaration file — confirm before documenting values.
+    /** Minimum confidence; presumably results below it are not returned — confirm */
+    minConfidence?: number;
+    /** Minimum similarity; presumably candidates below it are ignored — confirm */
+    minSimilarity?: number;
+    /** Number of top candidates considered (calibrateConfidence refers to "Top K candidates") */
+    topK?: number;
+    /** Size limit for the LRU cache */
+    cacheSize?: number;
+    /** Presumably toggles the temporal boost described on getTemporalBoost — confirm */
+    enableTemporalBoosting?: boolean;
+}
+/**
+ * VerbEmbeddingSignal - Neural relationship type classification
+ *
+ * Production features:
+ * - Uses 40 pre-computed verb type embeddings (zero runtime cost)
+ * - Cosine similarity for semantic matching
+ * - Temporal boosting for recently seen patterns
+ * - LRU cache for hot paths
+ * - Confidence calibration based on similarity distribution
+ */
+export declare class VerbEmbeddingSignal {
+    // NOTE(review): the private members below are declared without types; the
+    // descriptions are inferred from names and the surrounding doc comments and
+    // should be confirmed against VerbEmbeddingSignal.js.
+    /** Presumably the Brainy instance given to the constructor */
+    private brain;
+    /** Presumably the resolved VerbEmbeddingSignalOptions */
+    private options;
+    /** Presumably the pre-computed verb type embeddings mentioned in the class description */
+    private verbTypeEmbeddings;
+    /** Presumably the entries recorded by addToHistory and emptied by clearHistory */
+    private history;
+    /** Presumably the upper bound on the number of history entries */
+    private readonly MAX_HISTORY;
+    /** Presumably the LRU cache storage used by getFromCache / addToCache */
+    private cache;
+    /** Presumably the recency ordering of cache keys */
+    private cacheOrder;
+    /** Presumably the counters reported by getStats */
+    private stats;
+    /**
+     * @param brain Brainy instance
+     * @param options Optional signal settings (see VerbEmbeddingSignalOptions)
+     */
+    constructor(brain: Brainy, options?: VerbEmbeddingSignalOptions);
+    /**
+     * Classify relationship type using semantic similarity
+     *
+     * @param context Full context text (sentence or paragraph)
+     * @param contextVector Optional pre-computed embedding (performance optimization)
+     * @returns VerbSignal with classified type or null
+     */
+    classify(context: string, contextVector?: Vector): Promise<VerbSignal | null>;
+    /**
+     * Get embedding for context text
+     */
+    private getEmbedding;
+    /**
+     * Calibrate confidence based on similarity distribution
+     *
+     * Higher confidence when:
+     * - Top similarity is high
+     * - Clear gap between top and second-best
+     * - Top K candidates agree on same type
+     */
+    private calibrateConfidence;
+    /**
+     * Get temporal boost for recently seen patterns
+     *
+     * Boosts confidence if similar context was recently classified as the same type
+     */
+    private getTemporalBoost;
+    /**
+     * Add pattern to history for temporal boosting
+     *
+     * @param text Context text of the pattern
+     * @param type Verb type associated with the pattern
+     * @param vector Embedding vector of the pattern
+     */
+    addToHistory(text: string, type: VerbType, vector: Vector): void;
+    /**
+     * Clear history
+     */
+    clearHistory(): void;
+    /**
+     * Get cache key
+     */
+    private getCacheKey;
+    /**
+     * Get from LRU cache
+     */
+    private getFromCache;
+    /**
+     * Add to LRU cache with eviction
+     */
+    private addToCache;
+    /**
+     * Get statistics
+     *
+     * @returns an object of numeric counters, sizes and rates; how each value is
+     *          computed is defined by the implementation, not this declaration
+     */
+    getStats(): {
+        verbTypeCount: number;
+        historySize: number;
+        cacheSize: number;
+        cacheHitRate: number;
+        matchRate: number;
+        calls: number;
+        cacheHits: number;
+        matches: number;
+        temporalBoosts: number;
+        averageSimilarity: number;
+    };
+    /**
+     * Reset statistics
+     */
+    resetStats(): void;
+    /**
+     * Clear cache
+     */
+    clearCache(): void;
+}