npm - cozo-memory - Versions diffs - 1.1.3 → 1.1.4 - Mend

cozo-memory 1.1.3 → 1.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15)

package/README.md +330 -4
package/dist/adaptive-retrieval.js +520 -0
package/dist/dynamic-fusion.js +602 -0
package/dist/index.js +386 -6
package/dist/logical-edges-service.js +316 -0
package/dist/multi-hop-vector-pivot.js +390 -0
package/dist/temporal-embedding-service.js +313 -0
package/dist/test-adaptive-integration.js +84 -0
package/dist/test-adaptive-retrieval.js +135 -0
package/dist/test-dynamic-fusion.js +231 -0
package/dist/test-logical-edges.js +282 -0
package/dist/test-multi-hop-vector-pivot-v2.js +239 -0
package/dist/test-multi-hop-vector-pivot.js +240 -0
package/dist/test-temporal-embeddings.js +123 -0
package/package.json +1 -1

package/dist/index.js CHANGED Viewed

@@ -16,6 +16,8 @@ const fs_1 = __importDefault(require("fs"));
 const pdf_mjs_1 = require("pdfjs-dist/legacy/build/pdf.mjs");
 const hybrid_search_1 = require("./hybrid-search");
 const inference_engine_1 = require("./inference-engine");
+const dynamic_fusion_1 = require("./dynamic-fusion");
+const adaptive_retrieval_1 = require("./adaptive-retrieval");
 exports.DB_PATH = path_1.default.resolve(__dirname, "..", "memory_db.cozo");
 const DB_ENGINE = process.env.DB_ENGINE || "sqlite"; // "sqlite" or "rocksdb"
 exports.USER_ENTITY_ID = "global_user_profile";
@@ -26,6 +28,8 @@ class MemoryServer {
     mcp;
     embeddingService;
     hybridSearch;
+    dynamicFusion;
+    adaptiveRetrieval;
     inferenceEngine;
     initPromise;
     compactionLocks = new Set();
@@ -76,6 +80,8 @@ class MemoryServer {
         console.error(`[DB] Using backend: ${DB_ENGINE}, path: ${fullDbPath}`);
         this.embeddingService = new embedding_service_1.EmbeddingService();
         this.hybridSearch = new hybrid_search_1.HybridSearch(this.db, this.embeddingService);
+        this.dynamicFusion = new dynamic_fusion_1.DynamicFusionSearch(this.db, this.embeddingService);
+        this.adaptiveRetrieval = new adaptive_retrieval_1.AdaptiveGraphRetrieval(this.db, this.embeddingService);
         this.inferenceEngine = new inference_engine_1.InferenceEngine(this.db, this.embeddingService);
         this.mcp = new fastmcp_1.FastMCP({
             name: "cozo-memory-server",
@@ -2383,6 +2389,215 @@ Format MUST start with "ExecutiveSummary: " followed by the consolidated content
             return { error: "Deletion failed", message: error.message };
         }
     }
+    /**
+     * Memory Defragmentation
+     * Reorganizes memory structure by:
+     * 1. Detecting near-duplicate observations of the same entity (cosine similarity of
+     *    their stored embeddings) and removing the redundant copies
+     * 2. Connecting fragmented knowledge islands (small connected components) to the
+     *    most similar entity outside the island
+     * 3. Removing orphaned entities (no observations or relations)
+     *
+     * Inspired by Letta MemFS defragmentation
+     *
+     * @param {object} args
+     * @param {boolean} [args.confirm] - Falsy: analyse only and return a dry-run report.
+     * @param {number} [args.similarity_threshold] - Minimum cosine similarity for duplicates (default 0.95).
+     * @param {number} [args.min_island_size] - Largest component size still treated as an island (default 3).
+     * @returns {Promise<object>} `dry_run` or `completed` report with `statistics`; on an
+     *   unexpected failure `{ error, message }` is returned instead of throwing.
+     */
+    async defragMemory(args) {
+        await this.initPromise;
+        const startTime = Date.now();
+        try {
+            console.error(`[Defrag] Starting memory defragmentation (confirm=${args.confirm})`);
+            // `||` is deliberate: a 0 threshold/size is treated as "not provided", so a zero
+            // threshold can never classify every observation pair as a duplicate.
+            const similarity_threshold = args.similarity_threshold || 0.95; // High threshold for near-duplicates
+            const min_island_size = args.min_island_size || 3; // Components up to this size count as islands
+            const stats = {
+                duplicates_found: 0,
+                duplicates_merged: 0,
+                islands_found: 0,
+                islands_connected: 0,
+                orphans_found: 0,
+                orphans_removed: 0,
+            };
+            // Step 1: Find duplicate observations using semantic similarity
+            console.error(`[Defrag] Step 1: Detecting duplicate observations (threshold=${similarity_threshold})`);
+            const allObs = await this.db.run(`
+        ?[id, entity_id, text, embedding] := *observation{id, entity_id, text, embedding, @ "NOW"}
+      `);
+            // Group by owning entity: the same fact stored on two different entities is not a
+            // duplicate, and deleting one copy would silently drop knowledge about that entity.
+            const obsByEntity = new Map();
+            for (const row of allObs.rows) {
+                const embedding = row[3];
+                if (!embedding || embedding.length === 0)
+                    continue;
+                const ownerId = String(row[1]);
+                if (!obsByEntity.has(ownerId))
+                    obsByEntity.set(ownerId, []);
+                obsByEntity.get(ownerId).push({ id: String(row[0]), embedding });
+            }
+            // Each entry is [kept id, redundant id, similarity]
+            const duplicatePairs = [];
+            // Ids already marked redundant: they are neither removed twice nor used as the
+            // "kept" side of a later pair, so a kept observation always survives.
+            const redundantIds = new Set();
+            for (const group of obsByEntity.values()) {
+                for (let i = 0; i < group.length; i++) {
+                    if (redundantIds.has(group[i].id))
+                        continue;
+                    for (let j = i + 1; j < group.length; j++) {
+                        if (redundantIds.has(group[j].id))
+                            continue;
+                        const similarity = this.cosineSimilarity(group[i].embedding, group[j].embedding);
+                        if (similarity >= similarity_threshold) {
+                            duplicatePairs.push([group[i].id, group[j].id, similarity]);
+                            redundantIds.add(group[j].id);
+                        }
+                    }
+                }
+            }
+            stats.duplicates_found = duplicatePairs.length;
+            console.error(`[Defrag] Found ${stats.duplicates_found} duplicate observation pairs`);
+            // Step 2: Find fragmented knowledge islands (small connected components)
+            console.error(`[Defrag] Step 2: Detecting fragmented knowledge islands`);
+            const components = await this.recomputeConnectedComponents();
+            const smallIslands = Object.entries(components.components || {})
+                .filter(([_, entities]) => entities.length > 0 && entities.length <= min_island_size)
+                .map(([compId, entities]) => ({ compId, entities: entities, size: entities.length }));
+            stats.islands_found = smallIslands.length;
+            console.error(`[Defrag] Found ${stats.islands_found} small knowledge islands (size <= ${min_island_size})`);
+            // Step 3: Find orphaned entities (no observations, no relations)
+            console.error(`[Defrag] Step 3: Detecting orphaned entities`);
+            const allEntities = await this.db.run(`
+        ?[id, name, type] := *entity{id, name, type, @ "NOW"}, id != "global_user_profile"
+      `);
+            // One relationship query instead of two lookups per entity
+            const relEndpoints = await this.db.run(`
+        ?[from_id, to_id] := *relationship{from_id, to_id, @ "NOW"}
+      `);
+            // Every entity id that owns a current observation or is an endpoint of a current relation
+            const referencedIds = new Set(allObs.rows.map((row) => String(row[1])));
+            for (const row of relEndpoints.rows) {
+                referencedIds.add(String(row[0]));
+                referencedIds.add(String(row[1]));
+            }
+            const orphanedEntities = {
+                rows: allEntities.rows.filter((row) => !referencedIds.has(String(row[0])))
+            };
+            stats.orphans_found = orphanedEntities.rows.length;
+            console.error(`[Defrag] Found ${stats.orphans_found} orphaned entities`);
+            // If not confirmed, return dry-run results
+            if (!args.confirm) {
+                return {
+                    status: "dry_run",
+                    message: "Defragmentation analysis complete. Set confirm=true to execute.",
+                    statistics: stats,
+                    preview: {
+                        duplicate_samples: duplicatePairs.slice(0, 5).map(([id1, id2, sim]) => ({
+                            observation_id_1: id1,
+                            observation_id_2: id2,
+                            similarity: sim
+                        })),
+                        island_samples: smallIslands.slice(0, 5),
+                        orphan_samples: orphanedEntities.rows.slice(0, 5).map((r) => ({
+                            id: String(r[0]),
+                            name: String(r[1]),
+                            type: String(r[2])
+                        }))
+                    }
+                };
+            }
+            // Execute defragmentation
+            console.error(`[Defrag] Executing defragmentation...`);
+            // Merge duplicates: keep the first observation of each pair, delete the second
+            for (const [, id2] of duplicatePairs) {
+                try {
+                    await this.db.run(`
+            ?[id, created_at] := *observation{id, created_at}, id = $id2
+            :rm observation {id, created_at}
+          `, { id2 });
+                    stats.duplicates_merged++;
+                }
+                catch (e) {
+                    console.error(`[Defrag] Failed to merge duplicate ${id2}:`, e.message);
+                }
+            }
+            // Connect islands: Create semantic relations to main graph
+            for (const island of smallIslands) {
+                try {
+                    // NOTE(review): members are assumed to be objects with an `id` field; plain
+                    // id values are accepted as well - confirm against recomputeConnectedComponents.
+                    const islandEntityIds = island.entities.map((e) => String(e?.id ?? e));
+                    const islandMembers = new Set(islandEntityIds);
+                    // The nearest neighbours of an entity are usually itself and its island
+                    // mates, so request enough hits for at least one to lie outside the island.
+                    const neighbourCount = islandMembers.size + 1;
+                    const efSearch = Math.max(100, neighbourCount);
+                    for (const entityId of islandEntityIds) {
+                        const entityData = await this.db.run(`
+              ?[embedding] := *entity{id: $id, embedding, @ "NOW"}
+            `, { id: entityId });
+                        if (entityData.rows.length === 0)
+                            continue;
+                        const embedding = entityData.rows[0][0];
+                        if (!embedding || embedding.length === 0)
+                            continue;
+                        // Nearest entities by embedding distance; island members are filtered below
+                        const similarEntities = await this.db.run(`
+              ?[target_id, dist] := ~entity:semantic { id: target_id | query: $emb, k: ${neighbourCount}, ef: ${efSearch}, bind_distance: dist },
+                                     target_id != $id
+            `, { emb: embedding, id: entityId });
+                        const outsideCandidates = similarEntities.rows
+                            .map((row) => ({ targetId: String(row[0]), distance: Number(row[1]) }))
+                            .filter((candidate) => !islandMembers.has(candidate.targetId))
+                            .sort((x, y) => x.distance - y.distance);
+                        if (outsideCandidates.length === 0)
+                            continue;
+                        const { targetId, distance } = outsideCandidates[0];
+                        // presumably a cosine distance, so 1 - distance is a similarity - verify index config
+                        const similarity = 1 - distance;
+                        // Create bridge relation
+                        if (similarity >= 0.7) {
+                            const relation = await this.createRelation({
+                                from_id: entityId,
+                                to_id: targetId,
+                                relation_type: "semantically_related",
+                                strength: similarity,
+                                metadata: { created_by: "defrag", reason: "island_connection" }
+                            });
+                            // Do not count a connection when an error object is returned instead of thrown
+                            if (relation?.error) {
+                                console.error(`[Defrag] Failed to connect island ${island.compId}:`, relation.message || relation.error);
+                                continue;
+                            }
+                            stats.islands_connected++;
+                            break; // One connection per island is enough
+                        }
+                    }
+                }
+                catch (e) {
+                    console.error(`[Defrag] Failed to connect island ${island.compId}:`, e.message);
+                }
+            }
+            // Remove orphaned entities
+            for (const row of orphanedEntities.rows) {
+                try {
+                    const entityId = String(row[0]);
+                    const removal = await this.deleteEntity({ entity_id: entityId });
+                    // A returned error object means nothing was removed, so it must not be counted
+                    if (removal?.error) {
+                        console.error(`[Defrag] Failed to remove orphan ${row[0]}:`, removal.message || removal.error);
+                        continue;
+                    }
+                    stats.orphans_removed++;
+                }
+                catch (e) {
+                    console.error(`[Defrag] Failed to remove orphan ${row[0]}:`, e.message);
+                }
+            }
+            this.trackOperation('defrag', startTime);
+            return {
+                status: "completed",
+                message: `Defragmentation complete: ${stats.duplicates_merged} duplicates merged, ${stats.islands_connected} islands connected, ${stats.orphans_removed} orphans removed`,
+                statistics: stats,
+                duration_ms: Date.now() - startTime
+            };
+        }
+        catch (error) {
+            console.error("[Defrag] Error during defragmentation:", error);
+            this.trackError('defrag');
+            return { error: "Defragmentation failed", message: error.message };
+        }
+    }
+    /**
+     * Cosine similarity of two numeric vectors.
+     * Yields 0 when the vectors differ in length or when either has zero magnitude.
+     *
+     * @param {ArrayLike<number>} a - First vector.
+     * @param {ArrayLike<number>} b - Second vector.
+     * @returns {number} dot(a, b) / (|a| * |b|), or 0 in the cases above.
+     */
+    cosineSimilarity(a, b) {
+        const size = a.length;
+        if (size !== b.length) {
+            return 0;
+        }
+        let dot = 0;
+        let sumSqA = 0;
+        let sumSqB = 0;
+        let idx = 0;
+        while (idx < size) {
+            const x = a[idx];
+            const y = b[idx];
+            dot += x * y;
+            sumSqA += x * x;
+            sumSqB += y * y;
+            idx++;
+        }
+        const hasZeroVector = sumSqA === 0 || sumSqB === 0;
+        if (hasZeroVector) {
+            return 0;
+        }
+        return dot / (Math.sqrt(sumSqA) * Math.sqrt(sumSqB));
+    }
     async invalidateObservation(args) {
         await this.initPromise;
         const startTime = Date.now();
@@ -3183,13 +3398,56 @@ Validation: Invalid syntax or missing columns in inference rules will result in
                 session_id: zod_1.z.string().optional().describe("Prioritize results from this session"),
                 task_id: zod_1.z.string().optional().describe("Prioritize results from this task"),
             }),
+            zod_1.z.object({
+                action: zod_1.z.literal("dynamic_fusion"),
+                query: zod_1.z.string().describe("Search query"),
+                config: zod_1.z.object({
+                    vector: zod_1.z.object({
+                        enabled: zod_1.z.boolean().optional().default(true),
+                        weight: zod_1.z.number().min(0).max(1).optional().default(0.4),
+                        topK: zod_1.z.number().optional().default(20),
+                        efSearch: zod_1.z.number().optional().default(100),
+                    }).optional(),
+                    sparse: zod_1.z.object({
+                        enabled: zod_1.z.boolean().optional().default(true),
+                        weight: zod_1.z.number().min(0).max(1).optional().default(0.3),
+                        topK: zod_1.z.number().optional().default(20),
+                        minScore: zod_1.z.number().optional().default(0.1),
+                    }).optional(),
+                    fts: zod_1.z.object({
+                        enabled: zod_1.z.boolean().optional().default(true),
+                        weight: zod_1.z.number().min(0).max(1).optional().default(0.2),
+                        topK: zod_1.z.number().optional().default(20),
+                        fuzzy: zod_1.z.boolean().optional().default(true),
+                    }).optional(),
+                    graph: zod_1.z.object({
+                        enabled: zod_1.z.boolean().optional().default(true),
+                        weight: zod_1.z.number().min(0).max(1).optional().default(0.1),
+                        maxDepth: zod_1.z.number().min(1).max(3).optional().default(2),
+                        maxResults: zod_1.z.number().optional().default(20),
+                        relationTypes: zod_1.z.array(zod_1.z.string()).optional(),
+                    }).optional(),
+                    fusion: zod_1.z.object({
+                        strategy: zod_1.z.enum(['rrf', 'weighted_sum', 'max', 'adaptive']).optional().default('rrf'),
+                        rrfK: zod_1.z.number().optional().default(60),
+                        minScore: zod_1.z.number().optional().default(0.0),
+                        deduplication: zod_1.z.boolean().optional().default(true),
+                    }).optional(),
+                }).optional().describe("Dynamic fusion configuration (all paths optional)"),
+                limit: zod_1.z.number().optional().default(10).describe("Maximum number of results to return"),
+            }),
+            zod_1.z.object({
+                action: zod_1.z.literal("adaptive_retrieval"),
+                query: zod_1.z.string().describe("Search query for adaptive retrieval"),
+                limit: zod_1.z.number().optional().default(10).describe("Maximum number of results"),
+            }),
         ]);
         const QueryMemoryParameters = zod_1.z.object({
             action: zod_1.z
-                .enum(["search", "advancedSearch", "context", "entity_details", "history", "graph_rag", "graph_walking", "agentic_search"])
+                .enum(["search", "advancedSearch", "context", "entity_details", "history", "graph_rag", "graph_walking", "agentic_search", "dynamic_fusion", "adaptive_retrieval"])
                 .describe("Action (determines which fields are required)"),
-            query: zod_1.z.string().optional().describe("Required for search/advancedSearch/context/graph_rag/graph_walking/agentic_search"),
-            limit: zod_1.z.number().optional().describe("Only for search/advancedSearch/graph_rag/graph_walking"),
+            query: zod_1.z.string().optional().describe("Required for search/advancedSearch/context/graph_rag/graph_walking/agentic_search/dynamic_fusion/adaptive_retrieval"),
+            limit: zod_1.z.number().optional().describe("Only for search/advancedSearch/graph_rag/graph_walking/dynamic_fusion/adaptive_retrieval"),
             session_id: zod_1.z.string().optional().describe("Optional session ID for context boosting"),
             task_id: zod_1.z.string().optional().describe("Optional task ID for context boosting"),
             filters: zod_1.z.any().optional().describe("Only for advancedSearch"),
@@ -3205,6 +3463,7 @@ Validation: Invalid syntax or missing columns in inference rules will result in
             max_depth: zod_1.z.number().optional().describe("Only for graph_rag/graph_walking: Maximum expansion depth"),
             start_entity_id: zod_1.z.string().optional().describe("Only for graph_walking: Start entity"),
             rerank: zod_1.z.boolean().optional().describe("Only for search/advancedSearch/agentic_search: Enable Cross-Encoder reranking"),
+            config: zod_1.z.any().optional().describe("Only for dynamic_fusion: Fusion configuration object"),
         });
         this.mcp.addTool({
             name: "query_memory",
@@ -3220,8 +3479,10 @@ Supported actions:
 - 'graph_rag': Graph-based reasoning (Hybrid RAG). Finds semantic vector seeds first, then expands via graph traversals. Ideal for multi-hop reasoning. Params: { query: string, max_depth?: number, limit?: number }.
 - 'graph_walking': Recursive semantic graph search. Starts at vector seeds or an entity and follows relationships to other semantically relevant entities. Params: { query: string, start_entity_id?: string, max_depth?: number, limit?: number }.
 - 'agentic_search': Auto-Routing Search. Uses local LLM to analyze intent and routes the query automatically to the best strategy (Vector, Graph, or Community Summaries). Params: { query: string, limit?: number }.
+- 'adaptive_retrieval': GraphRAG-R1 inspired adaptive retrieval with Progressive Retrieval Attenuation (PRA) and Cost-Aware F1 (CAF) scoring. Automatically selects optimal strategy based on query complexity and historical performance. Params: { query: string, limit?: number }.
+- 'dynamic_fusion': Advanced multi-path fusion search combining Vector (HNSW), Sparse (keyword), FTS (full-text), and Graph traversal with configurable weights and strategies. Params: { query: string, config?: { vector?, sparse?, fts?, graph?, fusion? }, limit?: number }. Each path can be enabled/disabled and weighted independently. Fusion strategies: 'rrf' (Reciprocal Rank Fusion), 'weighted_sum', 'max', 'adaptive'. Returns results with path contribution details and performance stats.
-Notes: 'agentic_search' is the most powerful and adaptable, 'context' is ideal for exploratory questions. 'search' and 'advancedSearch' are better for targeted fact retrieval.`,
+Notes: 'adaptive_retrieval' learns from usage and optimizes over time. 'dynamic_fusion' provides the most control and transparency over retrieval paths. 'agentic_search' is the most adaptive. 'context' is ideal for exploratory questions. 'search' and 'advancedSearch' are better for targeted fact retrieval.`,
             parameters: QueryMemoryParameters,
             execute: async (args) => {
                 await this.initPromise;
@@ -3392,6 +3653,101 @@ Notes: 'agentic_search' is the most powerful and adaptable, 'context' is ideal f
                     });
                     return JSON.stringify(results);
                 }
+                // 'dynamic_fusion': run the multi-path fusion search and return a JSON string with
+                // the limited results, timing stats and the effective path/strategy metadata.
+                if (input.action === "dynamic_fusion") {
+                    const startTime = Date.now();
+                    if (!input.query || input.query.trim().length === 0) {
+                        return JSON.stringify({ error: "Search query must not be empty." });
+                    }
+                    try {
+                        // Diagnostics go to stderr like the rest of this file; on a stdio MCP
+                        // server stdout carries protocol messages and must stay clean.
+                        console.error('[query_memory] Dynamic Fusion search:', {
+                            query: input.query,
+                            config: input.config ? 'custom' : 'default',
+                            limit: input.limit
+                        });
+                        // Execute dynamic fusion search
+                        const { results, stats } = await this.dynamicFusion.search(input.query, input.config || {});
+                        // Apply limit
+                        const limitedResults = results.slice(0, input.limit || 10);
+                        const response = {
+                            results: limitedResults,
+                            stats: {
+                                ...stats,
+                                totalTime: Date.now() - startTime,
+                                resultsReturned: limitedResults.length,
+                                resultsTotal: results.length
+                            },
+                            metadata: {
+                                query: input.query,
+                                fusionStrategy: input.config?.fusion?.strategy || 'rrf',
+                                // A path is reported as enabled unless it was explicitly set to false
+                                enabledPaths: {
+                                    vector: input.config?.vector?.enabled !== false,
+                                    sparse: input.config?.sparse?.enabled !== false,
+                                    fts: input.config?.fts?.enabled !== false,
+                                    graph: input.config?.graph?.enabled !== false
+                                }
+                            }
+                        };
+                        console.error('[query_memory] Dynamic Fusion completed:', {
+                            resultsReturned: limitedResults.length,
+                            totalTime: response.stats.totalTime,
+                            pathContributions: stats.pathContributions
+                        });
+                        return JSON.stringify(response);
+                    }
+                    catch (error) {
+                        console.error('[query_memory] Dynamic Fusion error:', error);
+                        return JSON.stringify({
+                            error: "Dynamic fusion search failed",
+                            details: error.message
+                        });
+                    }
+                }
+                // 'adaptive_retrieval': delegate to the adaptive retriever and return a JSON string
+                // with its results plus the strategy, call count, latency and CAF score it reports.
+                if (input.action === "adaptive_retrieval") {
+                    const startTime = Date.now();
+                    if (!input.query || input.query.trim().length === 0) {
+                        return JSON.stringify({ error: "Search query must not be empty." });
+                    }
+                    try {
+                        // Diagnostics go to stderr like the rest of this file; on a stdio MCP
+                        // server stdout carries protocol messages and must stay clean.
+                        console.error('[query_memory] Adaptive Retrieval search:', {
+                            query: input.query,
+                            limit: input.limit
+                        });
+                        // Execute adaptive retrieval
+                        const result = await this.adaptiveRetrieval.retrieve(input.query, input.limit || 10);
+                        const response = {
+                            results: result.results,
+                            metadata: {
+                                query: input.query,
+                                strategy: result.strategy,
+                                retrievalCount: result.retrievalCount,
+                                latency: result.latency,
+                                cafScore: result.cafScore,
+                                totalTime: Date.now() - startTime
+                            },
+                            performance: {
+                                strategyUsed: result.strategy,
+                                retrievalCalls: result.retrievalCount,
+                                costAwareF1: result.cafScore,
+                                latencyMs: result.latency
+                            }
+                        };
+                        console.error('[query_memory] Adaptive Retrieval completed:', {
+                            strategy: result.strategy,
+                            resultsReturned: result.results.length,
+                            retrievalCount: result.retrievalCount,
+                            cafScore: result.cafScore?.toFixed(3),
+                            totalTime: response.metadata.totalTime
+                        });
+                        return JSON.stringify(response);
+                    }
+                    catch (error) {
+                        console.error('[query_memory] Adaptive Retrieval error:', error);
+                        return JSON.stringify({
+                            error: "Adaptive retrieval search failed",
+                            details: error.message
+                        });
+                    }
+                }
                 if (input.action === "graph_rag") {
                     if (!input.query || input.query.trim().length === 0) {
                         return JSON.stringify({ error: "Search query must not be empty." });
@@ -3865,6 +4221,12 @@ Supported actions:
                 min_entity_degree: zod_1.z.number().min(0).max(100).optional().default(2),
                 model: zod_1.z.string().optional().default("demyagent-4b-i1:Q6_K"),
             }),
+            zod_1.z.object({
+                action: zod_1.z.literal("defrag"),
+                confirm: zod_1.z.boolean().describe("Must be true to confirm defragmentation"),
+                similarity_threshold: zod_1.z.number().min(0.8).max(1.0).optional().default(0.95).describe("Similarity threshold for duplicate detection (0.8-1.0)"),
+                min_island_size: zod_1.z.number().min(1).max(10).optional().default(3).describe("Maximum size of knowledge islands to connect"),
+            }),
             zod_1.z.object({
                 action: zod_1.z.literal("reflect"),
                 entity_id: zod_1.z.string().optional().describe("Optional entity ID for targeted reflection"),
@@ -3889,7 +4251,7 @@ Supported actions:
         ]);
         const ManageSystemParameters = zod_1.z.object({
             action: zod_1.z
-                .enum(["health", "metrics", "export_memory", "import_memory", "snapshot_create", "snapshot_list", "snapshot_diff", "cleanup", "reflect", "clear_memory", "summarize_communities", "compact"])
+                .enum(["health", "metrics", "export_memory", "import_memory", "snapshot_create", "snapshot_list", "snapshot_diff", "cleanup", "defrag", "reflect", "clear_memory", "summarize_communities", "compact"])
                 .describe("Action (determines which fields are required)"),
             format: zod_1.z.enum(["json", "markdown", "obsidian"]).optional().describe("Export format (for export_memory)"),
             includeMetadata: zod_1.z.boolean().optional().describe("Include metadata (for export_memory)"),
@@ -3904,10 +4266,12 @@ Supported actions:
             snapshot_id_a: zod_1.z.string().optional().describe("Required for snapshot_diff"),
             snapshot_id_b: zod_1.z.string().optional().describe("Required for snapshot_diff"),
             metadata: MetadataSchema.optional().describe("Optional for snapshot_create"),
-            confirm: zod_1.z.boolean().optional().describe("Required for cleanup/clear_memory and must be true"),
+            confirm: zod_1.z.boolean().optional().describe("Required for cleanup/defrag/clear_memory and must be true"),
             older_than_days: zod_1.z.number().optional().describe("Optional for cleanup"),
             max_observations: zod_1.z.number().optional().describe("Optional for cleanup"),
             min_entity_degree: zod_1.z.number().optional().describe("Optional for cleanup"),
+            similarity_threshold: zod_1.z.number().optional().describe("Optional for defrag (0.8-1.0, default 0.95)"),
+            min_island_size: zod_1.z.number().optional().describe("Optional for defrag (1-10, default 3)"),
             model: zod_1.z.string().optional().describe("Optional for cleanup/reflect/summarize_communities"),
             entity_id: zod_1.z.string().optional().describe("Optional for reflect"),
             min_community_size: zod_1.z.number().optional().describe("Optional for summarize_communities"),
@@ -3934,6 +4298,9 @@ Supported actions:
 - 'cleanup': Janitor service for consolidation. Params: { confirm: boolean, older_than_days?: number, max_observations?: number, min_entity_degree?: number, model?: string }.
   * With confirm=false: Dry-Run (shows candidates).
   * With confirm=true: Merges old/isolated fragments using LLM (Executive Summary) and removes noise.
+- 'defrag': Memory defragmentation. Reorganizes memory structure by detecting/merging duplicates, connecting fragmented knowledge islands, and removing orphaned entities. Params: { confirm: boolean, similarity_threshold?: number (0.8-1.0, default 0.95), min_island_size?: number (1-10, default 3) }.
+  * With confirm=false: Dry-Run (shows analysis and candidates).
+  * With confirm=true: Executes defragmentation and returns statistics.
 - 'reflect': Reflection service. Analyzes memory for contradictions and insights. Params: { entity_id?: string, model?: string }.
 - 'clear_memory': Resets the entire database. Params: { confirm: boolean (must be true) }.
 - 'summarize_communities': Hierarchical GraphRAG. Generates summaries for entity clusters. Params: { model?: string, min_community_size?: number }.`,
@@ -4124,6 +4491,19 @@ Supported actions:
                         return JSON.stringify({ error: error.message || "Error during cleanup" });
                     }
                 }
+                // 'defrag': forward the request to defragMemory and serialize its report;
+                // a thrown error is turned into a JSON error payload.
+                if (input.action === "defrag") {
+                    try {
+                        const { confirm, similarity_threshold, min_island_size } = input;
+                        const defragReport = await this.defragMemory({
+                            confirm: Boolean(confirm),
+                            similarity_threshold,
+                            min_island_size,
+                        });
+                        return JSON.stringify(defragReport);
+                    }
+                    catch (error) {
+                        const failure = { error: error.message || "Error during defragmentation" };
+                        return JSON.stringify(failure);
+                    }
+                }
                 if (input.action === "reflect") {
                     try {
                         const result = await this.reflectMemory({