npm - cccmemory - Versions diffs - 1.9.0 → 2.0.1 - Mend

cccmemory 1.9.0 → 2.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (72) hide show

package/README.md +96 -50
package/dist/chunking/ChunkingConfig.d.ts +63 -0
package/dist/chunking/ChunkingConfig.d.ts.map +1 -0
package/dist/chunking/ChunkingConfig.js +44 -0
package/dist/chunking/ChunkingConfig.js.map +1 -0
package/dist/chunking/TextChunker.d.ts +59 -0
package/dist/chunking/TextChunker.d.ts.map +1 -0
package/dist/chunking/TextChunker.js +130 -0
package/dist/chunking/TextChunker.js.map +1 -0
package/dist/chunking/index.d.ts +9 -0
package/dist/chunking/index.d.ts.map +1 -0
package/dist/chunking/index.js +8 -0
package/dist/chunking/index.js.map +1 -0
package/dist/chunking/strategies/SentenceChunker.d.ts +19 -0
package/dist/chunking/strategies/SentenceChunker.d.ts.map +1 -0
package/dist/chunking/strategies/SentenceChunker.js +251 -0
package/dist/chunking/strategies/SentenceChunker.js.map +1 -0
package/dist/chunking/strategies/SlidingWindowChunker.d.ts +10 -0
package/dist/chunking/strategies/SlidingWindowChunker.d.ts.map +1 -0
package/dist/chunking/strategies/SlidingWindowChunker.js +133 -0
package/dist/chunking/strategies/SlidingWindowChunker.js.map +1 -0
package/dist/embeddings/VectorStore.d.ts +78 -3
package/dist/embeddings/VectorStore.d.ts.map +1 -1
package/dist/embeddings/VectorStore.js +352 -21
package/dist/embeddings/VectorStore.js.map +1 -1
package/dist/mcp-server.d.ts +5 -0
package/dist/mcp-server.d.ts.map +1 -1
package/dist/mcp-server.js +79 -11
package/dist/mcp-server.js.map +1 -1
package/dist/parsers/ExtractionValidator.d.ts +84 -0
package/dist/parsers/ExtractionValidator.d.ts.map +1 -0
package/dist/parsers/ExtractionValidator.js +296 -0
package/dist/parsers/ExtractionValidator.js.map +1 -0
package/dist/search/HybridReranker.d.ts +80 -0
package/dist/search/HybridReranker.d.ts.map +1 -0
package/dist/search/HybridReranker.js +146 -0
package/dist/search/HybridReranker.js.map +1 -0
package/dist/search/QueryExpander.d.ts +53 -0
package/dist/search/QueryExpander.d.ts.map +1 -0
package/dist/search/QueryExpander.js +178 -0
package/dist/search/QueryExpander.js.map +1 -0
package/dist/search/ResultAggregator.d.ts +70 -0
package/dist/search/ResultAggregator.d.ts.map +1 -0
package/dist/search/ResultAggregator.js +155 -0
package/dist/search/ResultAggregator.js.map +1 -0
package/dist/search/SemanticSearch.d.ts +25 -1
package/dist/search/SemanticSearch.d.ts.map +1 -1
package/dist/search/SemanticSearch.js +264 -53
package/dist/search/SemanticSearch.js.map +1 -1
package/dist/search/SnippetGenerator.d.ts +81 -0
package/dist/search/SnippetGenerator.d.ts.map +1 -0
package/dist/search/SnippetGenerator.js +268 -0
package/dist/search/SnippetGenerator.js.map +1 -0
package/dist/search/index.d.ts +15 -0
package/dist/search/index.d.ts.map +1 -0
package/dist/search/index.js +10 -0
package/dist/search/index.js.map +1 -0
package/dist/storage/migrations.d.ts +3 -2
package/dist/storage/migrations.d.ts.map +1 -1
package/dist/storage/migrations.js +235 -13
package/dist/storage/migrations.js.map +1 -1
package/dist/tools/ToolDefinitions.d.ts +786 -0
package/dist/tools/ToolDefinitions.d.ts.map +1 -1
package/dist/tools/ToolDefinitions.js +758 -1
package/dist/tools/ToolDefinitions.js.map +1 -1
package/dist/tools/ToolHandlers.d.ts +96 -21
package/dist/tools/ToolHandlers.d.ts.map +1 -1
package/dist/tools/ToolHandlers.js +1926 -127
package/dist/tools/ToolHandlers.js.map +1 -1
package/dist/types/ToolTypes.d.ts +495 -18
package/dist/types/ToolTypes.d.ts.map +1 -1
package/package.json +1 -1

package/README.md CHANGED Viewed

@@ -4,76 +4,51 @@ An MCP server that gives Claude long-term memory by indexing conversation histor
 ---
-## ⚠️ Breaking Changes in v1.8.0
+## What's New in v2.0
-**This package has been renamed from `claude-conversation-memory-mcp` to `cccmemory`.**
+Version 2.0 brings major improvements to search quality and accuracy:
-If you were using the old package, follow these migration steps:
+- **Smart Chunking** - Long messages are now split at sentence boundaries, ensuring full content is searchable (previously truncated at 512 tokens)
+- **Hybrid Search** - Combines semantic search with full-text search using Reciprocal Rank Fusion (RRF) for better ranking
+- **Dynamic Thresholds** - Similarity thresholds adjust based on query length for better precision
+- **Improved Snippets** - Search results highlight matching terms in context
+- **Extraction Validation** - Reduces false positives in decision/mistake detection
+- **Query Expansion** - Optional synonym expansion for broader recall (disabled by default)
-### 1. Uninstall the old package
-```bash
-npm uninstall -g claude-conversation-memory-mcp
-```
-### 2. Install the new package
-```bash
-npm install -g cccmemory
-```
-### 3. Update your MCP configuration
-**Claude Desktop** (`~/Library/Application Support/Claude/claude_desktop_config.json`):
-```json
-{
-  "mcpServers": {
-    "cccmemory": {
-      "command": "npx",
-      "args": ["-y", "cccmemory"]
-    }
-  }
-}
-```
+---
-**Claude Code** (`~/.claude.json`):
-```json
-{
-  "mcpServers": {
-    "cccmemory": {
-      "command": "npx",
-      "args": ["-y", "cccmemory"]
-    }
-  }
-}
-```
+<details>
+<summary><strong>⚠️ Breaking Changes in v1.8.0</strong> (click to expand)</summary>
-**Codex** (`~/.codex/config.toml`):
-```toml
-[mcp_servers.cccmemory]
-command = "npx"
-args = ["-y", "cccmemory"]
-```
+**This package was renamed from `claude-conversation-memory-mcp` to `cccmemory`.**
-### 4. Database migration (automatic)
+If upgrading from the old package:
-Your conversation history is preserved. The database files are automatically migrated:
-- `.claude-conversations-memory.db` → `.cccmemory.db`
-- `.codex-conversations-memory.db` → `.cccmemory.db`
+1. Uninstall old package: `npm uninstall -g claude-conversation-memory-mcp`
+2. Install new package: `npm install -g cccmemory`
+3. Update MCP config to use `cccmemory` command
+4. Database migration is automatic (`.claude-conversations-memory.db` → `.cccmemory.db`)
-No manual action required - the migration happens on first run.
+</details>
 ---
 ## Features
 - **Search conversations** - Natural language search across your chat history
+- **Smart chunking** - Long messages fully indexed without truncation
+- **Hybrid search** - Combines vector + keyword search with RRF re-ranking
 - **Track decisions** - Remember why you made technical choices
 - **Prevent mistakes** - Learn from past errors
 - **Git integration** - Link conversations to commits
 - **Cross-project search** - Search across all your projects globally
 - **Project migration** - Keep history when renaming/moving projects
 - **Semantic search** - Uses Transformers.js embeddings (bundled, works offline)
+- **Working memory** - Store and recall facts, decisions, and context across sessions
+- **Session handoff** - Seamless context transfer between conversations
+- **Tag management** - Organize memories, decisions, and patterns with tags
+- **Memory quality** - Track confidence, importance, and verification status
+- **Database maintenance** - Find duplicates, clean stale data, health reports
 ## Installation
@@ -249,6 +224,19 @@ Config:
 Set `OPENAI_API_KEY` environment variable.
 </details>
+### Search Configuration (Optional)
+Tune search behavior with environment variables:
+| Variable | Default | Description |
+|----------|---------|-------------|
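+| `CCCMEMORY_CHUNKING_ENABLED` | `true` | Enable smart chunking for long messages |
+| `CCCMEMORY_CHUNKING_STRATEGY` | `sentence` | Chunking strategy: `sentence`, `sliding_window`, or `paragraph` (currently handled the same as `sentence`) |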
+| `CCCMEMORY_CHUNK_SIZE` | `450` | Target chunk size in tokens |
+| `CCCMEMORY_CHUNK_OVERLAP` | `0.1` | Overlap between chunks (0-1) |
+| `CCCMEMORY_RERANK_ENABLED` | `true` | Enable hybrid re-ranking (vector + FTS) |
+| `CCCMEMORY_RERANK_WEIGHT` | `0.7` | Vector weight in re-ranking (FTS gets 1-weight) |
+| `CCCMEMORY_QUERY_EXPANSION` | `false` | Enable synonym expansion for queries |
 ## MCP Tools
 ### Indexing
@@ -290,6 +278,64 @@ Set `OPENAI_API_KEY` environment variable.
 | `forget_by_topic` | Delete conversations by keyword |
 | `generate_documentation` | Generate docs from local code scan + conversations |
+### Working Memory
+| Tool | Description |
+|------|-------------|
+| `remember` | Store a fact, decision, or context with optional TTL |
+| `recall` | Retrieve a specific memory by key |
+| `recall_relevant` | Semantic search across stored memories |
+| `list_memory` | List all memories, optionally filtered by tags |
+| `forget` | Remove a memory by key |
+### Session Handoff
+| Tool | Description |
+|------|-------------|
+| `prepare_handoff` | Create handoff document for session transition |
+| `resume_from_handoff` | Resume work from a previous handoff |
+| `list_handoffs` | List available handoff documents |
+### Context Injection
+| Tool | Description |
+|------|-------------|
+| `get_startup_context` | Get relevant context at conversation start |
+| `inject_relevant_context` | Auto-inject context based on user message |
+### Tag Management
+| Tool | Description |
+|------|-------------|
+| `list_tags` | List all tags with usage statistics |
+| `search_by_tags` | Find items by tag (memories, decisions, patterns) |
+| `rename_tag` | Rename a tag across all items |
+| `merge_tags` | Merge multiple tags into one |
+| `delete_tag` | Delete a tag and unlink all items |
+| `tag_item` | Add tags to an item |
+| `untag_item` | Remove tags from an item |
+### Memory Quality
+| Tool | Description |
+|------|-------------|
+| `set_memory_confidence` | Set confidence level (uncertain/likely/confirmed/verified) |
+| `set_memory_importance` | Set importance level (low/normal/high/critical) |
+| `pin_memory` | Pin a memory to prevent cleanup |
+| `archive_memory` | Archive a memory with optional reason |
+| `unarchive_memory` | Restore an archived memory |
+| `search_memory_by_quality` | Search memories by confidence/importance |
+| `get_memory_stats` | Get memory statistics by confidence/importance |
+### Maintenance
+| Tool | Description |
+|------|-------------|
+| `get_storage_stats` | Database size and item counts |
+| `find_stale_items` | Find items not accessed recently |
+| `find_duplicates` | Find similar/duplicate items |
+| `merge_duplicates` | Merge duplicate items |
+| `cleanup_stale` | Archive or delete stale items |
+| `vacuum_database` | Reclaim disk space |
+| `cleanup_orphans` | Remove orphaned records |
+| `get_health_report` | Overall database health check |
+| `run_maintenance` | Run multiple maintenance tasks |
+| `get_maintenance_history` | View past maintenance operations |
 ### Session IDs
 `list_recent_sessions` returns **two identifiers**:

package/dist/chunking/ChunkingConfig.d.ts ADDED Viewed

@@ -0,0 +1,63 @@
+/**
+ * Chunking Configuration Types
+ * Defines configuration options for text chunking strategies
+ */
+export type ChunkingStrategy = "sentence" | "sliding_window" | "paragraph";
+export interface ChunkingConfig {
+    /** Enable or disable chunking (default: true; env override: CCCMEMORY_CHUNKING_ENABLED) */
+    enabled: boolean;
+    /** Chunking strategy to use (default: "sentence"; env override: CCCMEMORY_CHUNKING_STRATEGY) */
+    strategy: ChunkingStrategy;
+    /** Target chunk size in tokens (default: 450 for 512 limit with margin; env override: CCCMEMORY_CHUNK_SIZE) */
+    chunkSize: number;
+    /** Overlap between chunks as a fraction (default: 0.1 = 10%; env override: CCCMEMORY_CHUNK_OVERLAP, accepted when >= 0 and < 1) */
+    overlap: number;
+    /** Minimum chunk size in tokens - don't split smaller texts (default: 50) */
+    minChunkSize: number;
+    /** Maximum chunk size as hard limit (default: 500; presumably in tokens like chunkSize - confirm against the chunkers) */
+    maxChunkSize: number;
+    /** Characters per token estimate for prose (default: 4) */
+    charsPerTokenProse: number;
+    /** Characters per token estimate for code (default: 3.5) */
+    charsPerTokenCode: number;
+}
+export declare const DEFAULT_CHUNKING_CONFIG: ChunkingConfig;
+/**
+ * A single chunk produced by chunking a text
+ * (the full outcome of a chunking call is described by ChunkingResult)
+ */
+export interface TextChunk {
+    /** The chunk content */
+    content: string;
+    /** Index of this chunk within the source text (the first chunk has index 0) */
+    index: number;
+    /** Total number of chunks from the source text */
+    totalChunks: number;
+    /** Character offset where this chunk starts in the original text */
+    startOffset: number;
+    /** Character offset where this chunk ends in the original text (equals the text length for an unsplit text) */
+    endOffset: number;
+    /** Estimated token count for this chunk */
+    estimatedTokens: number;
+    /** Strategy used to create this chunk */
+    strategy: ChunkingStrategy;
+}
+/**
+ * Outcome of a chunking operation: the produced chunks plus metadata
+ * about the original text
+ */
+export interface ChunkingResult {
+    /** Length of the original text in characters (not the text itself) */
+    originalLength: number;
+    /** Whether the text was actually chunked or returned as-is */
+    wasChunked: boolean;
+    /** Chunks produced */
+    chunks: TextChunk[];
+    /** Strategy used */
+    strategy: ChunkingStrategy;
+    /** Estimated total tokens in original text */
+    estimatedTotalTokens: number;
+}
+/**
+ * Get chunking config from environment or defaults
+ *
+ * Starts from a copy of DEFAULT_CHUNKING_CONFIG and applies the
+ * CCCMEMORY_CHUNKING_ENABLED, CCCMEMORY_CHUNK_SIZE,
+ * CCCMEMORY_CHUNKING_STRATEGY and CCCMEMORY_CHUNK_OVERLAP environment
+ * variables. Size, strategy and overlap values that fail validation are
+ * ignored and the default is kept.
+ */
+export declare function getChunkingConfig(): ChunkingConfig;
+//# sourceMappingURL=ChunkingConfig.d.ts.map

package/dist/chunking/ChunkingConfig.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"ChunkingConfig.d.ts","sourceRoot":"","sources":["../../src/chunking/ChunkingConfig.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,MAAM,MAAM,gBAAgB,GAAG,UAAU,GAAG,gBAAgB,GAAG,WAAW,CAAC;AAE3E,MAAM,WAAW,cAAc;IAC7B,iDAAiD;IACjD,OAAO,EAAE,OAAO,CAAC;IAEjB,qDAAqD;IACrD,QAAQ,EAAE,gBAAgB,CAAC;IAE3B,2EAA2E;IAC3E,SAAS,EAAE,MAAM,CAAC;IAElB,gEAAgE;IAChE,OAAO,EAAE,MAAM,CAAC;IAEhB,6EAA6E;IAC7E,YAAY,EAAE,MAAM,CAAC;IAErB,sDAAsD;IACtD,YAAY,EAAE,MAAM,CAAC;IAErB,2DAA2D;IAC3D,kBAAkB,EAAE,MAAM,CAAC;IAE3B,4DAA4D;IAC5D,iBAAiB,EAAE,MAAM,CAAC;CAC3B;AAED,eAAO,MAAM,uBAAuB,EAAE,cASrC,CAAC;AAEF;;GAEG;AACH,MAAM,WAAW,SAAS;IACxB,wBAAwB;IACxB,OAAO,EAAE,MAAM,CAAC;IAEhB,iDAAiD;IACjD,KAAK,EAAE,MAAM,CAAC;IAEd,kDAAkD;IAClD,WAAW,EAAE,MAAM,CAAC;IAEpB,oEAAoE;IACpE,WAAW,EAAE,MAAM,CAAC;IAEpB,kEAAkE;IAClE,SAAS,EAAE,MAAM,CAAC;IAElB,2CAA2C;IAC3C,eAAe,EAAE,MAAM,CAAC;IAExB,yCAAyC;IACzC,QAAQ,EAAE,gBAAgB,CAAC;CAC5B;AAED;;GAEG;AACH,MAAM,WAAW,cAAc;IAC7B,qCAAqC;IACrC,cAAc,EAAE,MAAM,CAAC;IAEvB,8DAA8D;IAC9D,UAAU,EAAE,OAAO,CAAC;IAEpB,sBAAsB;IACtB,MAAM,EAAE,SAAS,EAAE,CAAC;IAEpB,oBAAoB;IACpB,QAAQ,EAAE,gBAAgB,CAAC;IAE3B,8CAA8C;IAC9C,oBAAoB,EAAE,MAAM,CAAC;CAC9B;AAED;;GAEG;AACH,wBAAgB,iBAAiB,IAAI,cAAc,CA8BlD"}

package/dist/chunking/ChunkingConfig.js ADDED Viewed

@@ -0,0 +1,44 @@
+/**
+ * Chunking Configuration Types
+ * Defines configuration options for text chunking strategies
+ *
+ * DEFAULT_CHUNKING_CONFIG holds the baseline values; getChunkingConfig()
+ * copies it before applying environment overrides, so this object itself
+ * is not modified by that function.
+ */
+export const DEFAULT_CHUNKING_CONFIG = {
+    enabled: true,
+    strategy: "sentence",
+    chunkSize: 450,
+    overlap: 0.1,
+    minChunkSize: 50,
+    maxChunkSize: 500,
+    charsPerTokenProse: 4,
+    charsPerTokenCode: 3.5,
+};
+/**
+ * Get chunking config from environment or defaults
+ */
+export function getChunkingConfig() {
+    const config = { ...DEFAULT_CHUNKING_CONFIG };
+    // Environment overrides
+    if (process.env.CCCMEMORY_CHUNKING_ENABLED !== undefined) {
+        config.enabled = process.env.CCCMEMORY_CHUNKING_ENABLED === "true";
+    }
+    if (process.env.CCCMEMORY_CHUNK_SIZE) {
+        const size = parseInt(process.env.CCCMEMORY_CHUNK_SIZE, 10);
+        if (!isNaN(size) && size > 0) {
+            config.chunkSize = size;
+        }
+    }
+    if (process.env.CCCMEMORY_CHUNKING_STRATEGY) {
+        const strategy = process.env.CCCMEMORY_CHUNKING_STRATEGY;
+        if (["sentence", "sliding_window", "paragraph"].includes(strategy)) {
+            config.strategy = strategy;
+        }
+    }
+    if (process.env.CCCMEMORY_CHUNK_OVERLAP) {
+        const overlap = parseFloat(process.env.CCCMEMORY_CHUNK_OVERLAP);
+        if (!isNaN(overlap) && overlap >= 0 && overlap < 1) {
+            config.overlap = overlap;
+        }
+    }
+    return config;
+}
+//# sourceMappingURL=ChunkingConfig.js.map

package/dist/chunking/ChunkingConfig.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"ChunkingConfig.js","sourceRoot":"","sources":["../../src/chunking/ChunkingConfig.ts"],"names":[],"mappings":"AAAA;;;GAGG;AA8BH,MAAM,CAAC,MAAM,uBAAuB,GAAmB;IACrD,OAAO,EAAE,IAAI;IACb,QAAQ,EAAE,UAAU;IACpB,SAAS,EAAE,GAAG;IACd,OAAO,EAAE,GAAG;IACZ,YAAY,EAAE,EAAE;IAChB,YAAY,EAAE,GAAG;IACjB,kBAAkB,EAAE,CAAC;IACrB,iBAAiB,EAAE,GAAG;CACvB,CAAC;AAgDF;;GAEG;AACH,MAAM,UAAU,iBAAiB;IAC/B,MAAM,MAAM,GAAG,EAAE,GAAG,uBAAuB,EAAE,CAAC;IAE9C,wBAAwB;IACxB,IAAI,OAAO,CAAC,GAAG,CAAC,0BAA0B,KAAK,SAAS,EAAE,CAAC;QACzD,MAAM,CAAC,OAAO,GAAG,OAAO,CAAC,GAAG,CAAC,0BAA0B,KAAK,MAAM,CAAC;IACrE,CAAC;IAED,IAAI,OAAO,CAAC,GAAG,CAAC,oBAAoB,EAAE,CAAC;QACrC,MAAM,IAAI,GAAG,QAAQ,CAAC,OAAO,CAAC,GAAG,CAAC,oBAAoB,EAAE,EAAE,CAAC,CAAC;QAC5D,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,IAAI,IAAI,GAAG,CAAC,EAAE,CAAC;YAC7B,MAAM,CAAC,SAAS,GAAG,IAAI,CAAC;QAC1B,CAAC;IACH,CAAC;IAED,IAAI,OAAO,CAAC,GAAG,CAAC,2BAA2B,EAAE,CAAC;QAC5C,MAAM,QAAQ,GAAG,OAAO,CAAC,GAAG,CAAC,2BAA+C,CAAC;QAC7E,IAAI,CAAC,UAAU,EAAE,gBAAgB,EAAE,WAAW,CAAC,CAAC,QAAQ,CAAC,QAAQ,CAAC,EAAE,CAAC;YACnE,MAAM,CAAC,QAAQ,GAAG,QAAQ,CAAC;QAC7B,CAAC;IACH,CAAC;IAED,IAAI,OAAO,CAAC,GAAG,CAAC,uBAAuB,EAAE,CAAC;QACxC,MAAM,OAAO,GAAG,UAAU,CAAC,OAAO,CAAC,GAAG,CAAC,uBAAuB,CAAC,CAAC;QAChE,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,IAAI,OAAO,IAAI,CAAC,IAAI,OAAO,GAAG,CAAC,EAAE,CAAC;YACnD,MAAM,CAAC,OAAO,GAAG,OAAO,CAAC;QAC3B,CAAC;IACH,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC"}

package/dist/chunking/TextChunker.d.ts ADDED Viewed

@@ -0,0 +1,59 @@
+/**
+ * Text Chunker Factory
+ * Provides unified interface for text chunking strategies
+ */
+import type { ChunkingConfig, ChunkingResult, TextChunk } from "./ChunkingConfig.js";
+/**
+ * Interface for chunking strategies
+ *
+ * NOTE: this interface shares its name with the `ChunkingStrategy` string
+ * union declared in ChunkingConfig; they are two distinct declarations.
+ * The module index re-exports the string union as `ChunkingStrategyType`.
+ */
+export interface ChunkingStrategy {
+    chunk(text: string, config: ChunkingConfig): ChunkingResult;
+}
+/**
+ * Text Chunker - Factory for creating and using chunking strategies
+ *
+ * The constructor merges configuration in increasing precedence:
+ * DEFAULT_CHUNKING_CONFIG, then the environment-derived values from
+ * getChunkingConfig(), then the optional `config` argument.
+ */
+export declare class TextChunker {
+    private config;
+    constructor(config?: Partial<ChunkingConfig>);
+    /**
+     * Get current configuration
+     *
+     * @returns A shallow copy of the chunker's configuration.
+     */
+    getConfig(): ChunkingConfig;
+    /**
+     * Check if text needs chunking based on estimated token count
+     *
+     * @returns false when chunking is disabled; otherwise true only when
+     * the estimated token count is strictly greater than `chunkSize`.
+     */
+    needsChunking(text: string): boolean;
+    /**
+     * Estimate token count for text using this chunker's configuration
+     */
+    estimateTokens(text: string): number;
+    /**
+     * Chunk text using configured strategy
+     *
+     * When chunking is disabled the whole text is returned as a single
+     * chunk with `wasChunked` set to false. The "paragraph" strategy
+     * currently uses the sentence chunker.
+     */
+    chunk(text: string): ChunkingResult;
+    /**
+     * Chunk multiple texts in batch
+     *
+     * @returns One ChunkingResult per input text, in input order.
+     */
+    chunkBatch(texts: string[]): ChunkingResult[];
+    /**
+     * Flatten chunks from multiple texts into a single array with source tracking
+     *
+     * Each returned chunk carries the `id` of the text it came from as
+     * `sourceId`.
+     */
+    chunkBatchFlat(texts: Array<{
+        id: string | number;
+        content: string;
+    }>): Array<TextChunk & {
+        sourceId: string | number;
+    }>;
+}
+/**
+ * Get or create global chunker instance
+ *
+ * When `config` is provided, a new TextChunker is returned on every call
+ * and the shared instance is neither used nor replaced. Without `config`,
+ * the shared instance is created on first use and then reused.
+ */
+export declare function getTextChunker(config?: Partial<ChunkingConfig>): TextChunker;
+/**
+ * Reset global chunker (useful for testing)
+ *
+ * The next getTextChunker() call without a config builds a new instance.
+ */
+export declare function resetTextChunker(): void;
+export type { ChunkingConfig, ChunkingResult, TextChunk };
+export { DEFAULT_CHUNKING_CONFIG, getChunkingConfig } from "./ChunkingConfig.js";
+export { estimateTokens } from "./strategies/SentenceChunker.js";
+//# sourceMappingURL=TextChunker.d.ts.map

package/dist/chunking/TextChunker.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"TextChunker.d.ts","sourceRoot":"","sources":["../../src/chunking/TextChunker.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,cAAc,EACd,cAAc,EACd,SAAS,EACV,MAAM,qBAAqB,CAAC;AAQ7B;;GAEG;AACH,MAAM,WAAW,gBAAgB;IAC/B,KAAK,CAAC,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,cAAc,GAAG,cAAc,CAAC;CAC7D;AAED;;GAEG;AACH,qBAAa,WAAW;IACtB,OAAO,CAAC,MAAM,CAAiB;gBAEnB,MAAM,CAAC,EAAE,OAAO,CAAC,cAAc,CAAC;IAU5C;;OAEG;IACH,SAAS,IAAI,cAAc;IAI3B;;OAEG;IACH,aAAa,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO;IASpC;;OAEG;IACH,cAAc,CAAC,IAAI,EAAE,MAAM,GAAG,MAAM;IAIpC;;OAEG;IACH,KAAK,CAAC,IAAI,EAAE,MAAM,GAAG,cAAc;IAyCnC;;OAEG;IACH,UAAU,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,cAAc,EAAE;IAI7C;;OAEG;IACH,cAAc,CACZ,KAAK,EAAE,KAAK,CAAC;QAAE,EAAE,EAAE,MAAM,GAAG,MAAM,CAAC;QAAC,OAAO,EAAE,MAAM,CAAA;KAAE,CAAC,GACrD,KAAK,CAAC,SAAS,GAAG;QAAE,QAAQ,EAAE,MAAM,GAAG,MAAM,CAAA;KAAE,CAAC;CAepD;AAOD;;GAEG;AACH,wBAAgB,cAAc,CAAC,MAAM,CAAC,EAAE,OAAO,CAAC,cAAc,CAAC,GAAG,WAAW,CAU5E;AAED;;GAEG;AACH,wBAAgB,gBAAgB,IAAI,IAAI,CAEvC;AAGD,YAAY,EAAE,cAAc,EAAE,cAAc,EAAE,SAAS,EAAE,CAAC;AAC1D,OAAO,EAAE,uBAAuB,EAAE,iBAAiB,EAAE,MAAM,qBAAqB,CAAC;AACjF,OAAO,EAAE,cAAc,EAAE,MAAM,iCAAiC,CAAC"}

package/dist/chunking/TextChunker.js ADDED Viewed

@@ -0,0 +1,130 @@
+/**
+ * Text Chunker Factory
+ * Provides unified interface for text chunking strategies
+ */
+import { DEFAULT_CHUNKING_CONFIG, getChunkingConfig, } from "./ChunkingConfig.js";
+import { chunkWithSentences, estimateTokens } from "./strategies/SentenceChunker.js";
+import { chunkWithSlidingWindow } from "./strategies/SlidingWindowChunker.js";
+/**
+ * Text Chunker - Factory for creating and using chunking strategies
+ */
+export class TextChunker {
+    config;
+    constructor(config) {
+        // Merge with defaults and environment config
+        const envConfig = getChunkingConfig();
+        this.config = {
+            ...DEFAULT_CHUNKING_CONFIG,
+            ...envConfig,
+            ...config,
+        };
+    }
+    /**
+     * Get current configuration
+     */
+    getConfig() {
+        return { ...this.config };
+    }
+    /**
+     * Check if text needs chunking based on estimated token count
+     */
+    needsChunking(text) {
+        if (!this.config.enabled) {
+            return false;
+        }
+        const estimatedTokenCount = estimateTokens(text, this.config);
+        return estimatedTokenCount > this.config.chunkSize;
+    }
+    /**
+     * Estimate token count for text
+     */
+    estimateTokens(text) {
+        return estimateTokens(text, this.config);
+    }
+    /**
+     * Chunk text using configured strategy
+     */
+    chunk(text) {
+        // If chunking disabled, return single chunk
+        if (!this.config.enabled) {
+            return {
+                originalLength: text.length,
+                wasChunked: false,
+                chunks: [
+                    {
+                        content: text,
+                        index: 0,
+                        totalChunks: 1,
+                        startOffset: 0,
+                        endOffset: text.length,
+                        estimatedTokens: estimateTokens(text, this.config),
+                        strategy: this.config.strategy,
+                    },
+                ],
+                strategy: this.config.strategy,
+                estimatedTotalTokens: estimateTokens(text, this.config),
+            };
+        }
+        // Select strategy based on configuration
+        switch (this.config.strategy) {
+            case "sentence":
+                return chunkWithSentences(text, this.config);
+            case "sliding_window":
+                return chunkWithSlidingWindow(text, this.config);
+            case "paragraph":
+                // Fall back to sentence chunking for now
+                // Paragraph chunking would split at \n\n boundaries
+                return chunkWithSentences(text, this.config);
+            default:
+                // Default to sentence chunking
+                return chunkWithSentences(text, this.config);
+        }
+    }
+    /**
+     * Chunk multiple texts in batch
+     */
+    chunkBatch(texts) {
+        return texts.map((text) => this.chunk(text));
+    }
+    /**
+     * Flatten chunks from multiple texts into a single array with source tracking
+     */
+    chunkBatchFlat(texts) {
+        const results = [];
+        for (const { id, content } of texts) {
+            const result = this.chunk(content);
+            for (const chunk of result.chunks) {
+                results.push({
+                    ...chunk,
+                    sourceId: id,
+                });
+            }
+        }
+        return results;
+    }
+}
+/**
+ * Global chunker instance with default config
+ */
+let defaultChunker = null;
+/**
+ * Get or create global chunker instance
+ */
+export function getTextChunker(config) {
+    if (config) {
+        return new TextChunker(config);
+    }
+    if (!defaultChunker) {
+        defaultChunker = new TextChunker();
+    }
+    return defaultChunker;
+}
+/**
+ * Reset global chunker (useful for testing)
+ *
+ * Clears the cached default instance so that the next getTextChunker()
+ * call without a config constructs a new TextChunker, which reads the
+ * environment configuration again.
+ */
+export function resetTextChunker() {
+    defaultChunker = null;
+}
+export { DEFAULT_CHUNKING_CONFIG, getChunkingConfig } from "./ChunkingConfig.js";
+export { estimateTokens } from "./strategies/SentenceChunker.js";
+//# sourceMappingURL=TextChunker.js.map

package/dist/chunking/TextChunker.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"TextChunker.js","sourceRoot":"","sources":["../../src/chunking/TextChunker.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAOH,OAAO,EACL,uBAAuB,EACvB,iBAAiB,GAClB,MAAM,qBAAqB,CAAC;AAC7B,OAAO,EAAE,kBAAkB,EAAE,cAAc,EAAE,MAAM,iCAAiC,CAAC;AACrF,OAAO,EAAE,sBAAsB,EAAE,MAAM,sCAAsC,CAAC;AAS9E;;GAEG;AACH,MAAM,OAAO,WAAW;IACd,MAAM,CAAiB;IAE/B,YAAY,MAAgC;QAC1C,6CAA6C;QAC7C,MAAM,SAAS,GAAG,iBAAiB,EAAE,CAAC;QACtC,IAAI,CAAC,MAAM,GAAG;YACZ,GAAG,uBAAuB;YAC1B,GAAG,SAAS;YACZ,GAAG,MAAM;SACV,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,SAAS;QACP,OAAO,EAAE,GAAG,IAAI,CAAC,MAAM,EAAE,CAAC;IAC5B,CAAC;IAED;;OAEG;IACH,aAAa,CAAC,IAAY;QACxB,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,EAAE,CAAC;YACzB,OAAO,KAAK,CAAC;QACf,CAAC;QAED,MAAM,mBAAmB,GAAG,cAAc,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;QAC9D,OAAO,mBAAmB,GAAG,IAAI,CAAC,MAAM,CAAC,SAAS,CAAC;IACrD,CAAC;IAED;;OAEG;IACH,cAAc,CAAC,IAAY;QACzB,OAAO,cAAc,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;IAC3C,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,IAAY;QAChB,4CAA4C;QAC5C,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,EAAE,CAAC;YACzB,OAAO;gBACL,cAAc,EAAE,IAAI,CAAC,MAAM;gBAC3B,UAAU,EAAE,KAAK;gBACjB,MAAM,EAAE;oBACN;wBACE,OAAO,EAAE,IAAI;wBACb,KAAK,EAAE,CAAC;wBACR,WAAW,EAAE,CAAC;wBACd,WAAW,EAAE,CAAC;wBACd,SAAS,EAAE,IAAI,CAAC,MAAM;wBACtB,eAAe,EAAE,cAAc,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC;wBAClD,QAAQ,EAAE,IAAI,CAAC,MAAM,CAAC,QAAQ;qBAC/B;iBACF;gBACD,QAAQ,EAAE,IAAI,CAAC,MAAM,CAAC,QAAQ;gBAC9B,oBAAoB,EAAE,cAAc,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC;aACxD,CAAC;QACJ,CAAC;QAED,yCAAyC;QACzC,QAAQ,IAAI,CAAC,MAAM,CAAC,QAAQ,EAAE,CAAC;YAC7B,KAAK,UAAU;gBACb,OAAO,kBAAkB,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;YAE/C,KAAK,gBAAgB;gBACnB,OAAO,sBAAsB,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;YAEnD,KAAK,WAAW;gBACd,yCAAyC;gBACzC,oDAAoD;gBACpD,OAAO,kBAAkB,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;YAE/C;gBACE,+BAA+B;gBAC/B,OAAO,kBAAkB,CAAC,IAAI,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;QACjD,CAAC;IACH,CAAC;IAED;;OAEG;IACH,UAAU,CAAC,KAAe;QACxB,OAAO,KAAK,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC;IAC/C,CA
AC;IAED;;OAEG;IACH,cAAc,CACZ,KAAsD;QAEtD,MAAM,OAAO,GAAqD,EAAE,CAAC;QAErE,KAAK,MAAM,EAAE,EAAE,EAAE,OAAO,EAAE,IAAI,KAAK,EAAE,CAAC;YACpC,MAAM,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;YACnC,KAAK,MAAM,KAAK,IAAI,MAAM,CAAC,MAAM,EAAE,CAAC;gBAClC,OAAO,CAAC,IAAI,CAAC;oBACX,GAAG,KAAK;oBACR,QAAQ,EAAE,EAAE;iBACb,CAAC,CAAC;YACL,CAAC;QACH,CAAC;QAED,OAAO,OAAO,CAAC;IACjB,CAAC;CACF;AAED;;GAEG;AACH,IAAI,cAAc,GAAuB,IAAI,CAAC;AAE9C;;GAEG;AACH,MAAM,UAAU,cAAc,CAAC,MAAgC;IAC7D,IAAI,MAAM,EAAE,CAAC;QACX,OAAO,IAAI,WAAW,CAAC,MAAM,CAAC,CAAC;IACjC,CAAC;IAED,IAAI,CAAC,cAAc,EAAE,CAAC;QACpB,cAAc,GAAG,IAAI,WAAW,EAAE,CAAC;IACrC,CAAC;IAED,OAAO,cAAc,CAAC;AACxB,CAAC;AAED;;GAEG;AACH,MAAM,UAAU,gBAAgB;IAC9B,cAAc,GAAG,IAAI,CAAC;AACxB,CAAC;AAID,OAAO,EAAE,uBAAuB,EAAE,iBAAiB,EAAE,MAAM,qBAAqB,CAAC;AACjF,OAAO,EAAE,cAAc,EAAE,MAAM,iCAAiC,CAAC"}

package/dist/chunking/index.d.ts ADDED Viewed

@@ -0,0 +1,9 @@
+/**
+ * Text Chunking Module
+ * Provides text chunking strategies for handling long messages that exceed embedding model limits
+ */
+export { TextChunker, getTextChunker, resetTextChunker, estimateTokens, DEFAULT_CHUNKING_CONFIG, getChunkingConfig, } from "./TextChunker.js";
+export type { ChunkingConfig, ChunkingResult, TextChunk, ChunkingStrategy as ChunkingStrategyType, } from "./ChunkingConfig.js";
+export { chunkWithSentences } from "./strategies/SentenceChunker.js";
+export { chunkWithSlidingWindow } from "./strategies/SlidingWindowChunker.js";
+//# sourceMappingURL=index.d.ts.map

package/dist/chunking/index.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/chunking/index.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,EACL,WAAW,EACX,cAAc,EACd,gBAAgB,EAChB,cAAc,EACd,uBAAuB,EACvB,iBAAiB,GAClB,MAAM,kBAAkB,CAAC;AAE1B,YAAY,EACV,cAAc,EACd,cAAc,EACd,SAAS,EACT,gBAAgB,IAAI,oBAAoB,GACzC,MAAM,qBAAqB,CAAC;AAE7B,OAAO,EAAE,kBAAkB,EAAE,MAAM,iCAAiC,CAAC;AACrE,OAAO,EAAE,sBAAsB,EAAE,MAAM,sCAAsC,CAAC"}

package/dist/chunking/index.js ADDED Viewed

@@ -0,0 +1,8 @@
+/**
+ * Text Chunking Module
+ * Provides text chunking strategies for handling long messages that exceed embedding model limits
+ */
+export { TextChunker, getTextChunker, resetTextChunker, estimateTokens, DEFAULT_CHUNKING_CONFIG, getChunkingConfig, } from "./TextChunker.js";
+export { chunkWithSentences } from "./strategies/SentenceChunker.js";
+export { chunkWithSlidingWindow } from "./strategies/SlidingWindowChunker.js";
+//# sourceMappingURL=index.js.map

package/dist/chunking/index.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"index.js","sourceRoot":"","sources":["../../src/chunking/index.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,EACL,WAAW,EACX,cAAc,EACd,gBAAgB,EAChB,cAAc,EACd,uBAAuB,EACvB,iBAAiB,GAClB,MAAM,kBAAkB,CAAC;AAS1B,OAAO,EAAE,kBAAkB,EAAE,MAAM,iCAAiC,CAAC;AACrE,OAAO,EAAE,sBAAsB,EAAE,MAAM,sCAAsC,CAAC"}

package/dist/chunking/strategies/SentenceChunker.d.ts ADDED Viewed

@@ -0,0 +1,19 @@
+/**
+ * Sentence-Aware Text Chunker
+ * Splits text at sentence boundaries while respecting code blocks and paragraphs
+ */
+import type { ChunkingConfig, ChunkingResult } from "../ChunkingConfig.js";
+/**
+ * Estimate token count using character ratios
+ *
+ * NOTE(review): presumably the ratios are `config.charsPerTokenProse` and
+ * `config.charsPerTokenCode` - confirm against the implementation.
+ */
+declare function estimateTokens(text: string, config: ChunkingConfig): number;
+/**
+ * Detect if text contains code patterns
+ *
+ * NOTE(review): the patterns checked are not visible from this
+ * declaration - see the implementation for the exact heuristics.
+ */
+declare function isCodeLike(text: string): boolean;
+/**
+ * Chunk text using sentence-aware strategy
+ *
+ * TextChunker.chunk() calls this for the "sentence" and "paragraph"
+ * strategies and as the fallback for unrecognized strategy values.
+ */
+export declare function chunkWithSentences(text: string, config: ChunkingConfig): ChunkingResult;
+export { estimateTokens, isCodeLike };
+//# sourceMappingURL=SentenceChunker.d.ts.map

package/dist/chunking/strategies/SentenceChunker.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"SentenceChunker.d.ts","sourceRoot":"","sources":["../../../src/chunking/strategies/SentenceChunker.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EAAE,cAAc,EAAa,cAAc,EAAE,MAAM,sBAAsB,CAAC;AAEtF;;GAEG;AACH,iBAAS,cAAc,CAAC,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,cAAc,GAAG,MAAM,CAWpE;AAED;;GAEG;AACH,iBAAS,UAAU,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAczC;AAuND;;GAEG;AACH,wBAAgB,kBAAkB,CAChC,IAAI,EAAE,MAAM,EACZ,MAAM,EAAE,cAAc,GACrB,cAAc,CAqChB;AAED,OAAO,EAAE,cAAc,EAAE,UAAU,EAAE,CAAC"}