npm - context-compress - Versions diffs - 2026.3.21 → 2026.5.0 - Mend

context-compress 2026.3.21 → 2026.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (115) hide show

package/README.md +258 -44
package/dist/cli/doctor.d.ts.map +1 -1
package/dist/cli/doctor.js +2 -10
package/dist/cli/doctor.js.map +1 -1
package/dist/cli/filter.d.ts +52 -0
package/dist/cli/filter.d.ts.map +1 -0
package/dist/cli/filter.js +200 -0
package/dist/cli/filter.js.map +1 -0
package/dist/cli/index.d.ts +8 -4
package/dist/cli/index.d.ts.map +1 -1
package/dist/cli/index.js +19 -6
package/dist/cli/index.js.map +1 -1
package/dist/cli/lite.d.ts +15 -0
package/dist/cli/lite.d.ts.map +1 -0
package/dist/cli/lite.js +37 -0
package/dist/cli/lite.js.map +1 -0
package/dist/cli/setup.d.ts +23 -1
package/dist/cli/setup.d.ts.map +1 -1
package/dist/cli/setup.js +122 -21
package/dist/cli/setup.js.map +1 -1
package/dist/executor.d.ts +7 -1
package/dist/executor.d.ts.map +1 -1
package/dist/executor.js +51 -4
package/dist/executor.js.map +1 -1
package/dist/filters.d.ts +52 -0
package/dist/filters.d.ts.map +1 -0
package/dist/filters.js +719 -0
package/dist/filters.js.map +1 -0
package/dist/hooks/pretooluse.js +57 -0
package/dist/hooks/pretooluse.js.map +1 -1
package/dist/network.d.ts.map +1 -1
package/dist/network.js +11 -0
package/dist/network.js.map +1 -1
package/dist/server.bundle.mjs +1333 -619
package/dist/server.bundle.mjs.map +4 -4
package/dist/server.d.ts.map +1 -1
package/dist/server.js +44 -610
package/dist/server.js.map +1 -1
package/dist/stats.d.ts +7 -1
package/dist/stats.d.ts.map +1 -1
package/dist/stats.js +65 -0
package/dist/stats.js.map +1 -1
package/dist/store.d.ts +1 -0
package/dist/store.d.ts.map +1 -1
package/dist/store.js +15 -2
package/dist/store.js.map +1 -1
package/dist/tools/batch-execute.d.ts +4 -0
package/dist/tools/batch-execute.d.ts.map +1 -0
package/dist/tools/batch-execute.js +75 -0
package/dist/tools/batch-execute.js.map +1 -0
package/dist/tools/context.d.ts +17 -0
package/dist/tools/context.d.ts.map +1 -0
package/dist/tools/context.js +2 -0
package/dist/tools/context.js.map +1 -0
package/dist/tools/discover.d.ts +4 -0
package/dist/tools/discover.d.ts.map +1 -0
package/dist/tools/discover.js +65 -0
package/dist/tools/discover.js.map +1 -0
package/dist/tools/execute-file.d.ts +4 -0
package/dist/tools/execute-file.d.ts.map +1 -0
package/dist/tools/execute-file.js +66 -0
package/dist/tools/execute-file.js.map +1 -0
package/dist/tools/execute.d.ts +4 -0
package/dist/tools/execute.d.ts.map +1 -0
package/dist/tools/execute.js +54 -0
package/dist/tools/execute.js.map +1 -0
package/dist/tools/fetch-and-index.d.ts +4 -0
package/dist/tools/fetch-and-index.d.ts.map +1 -0
package/dist/tools/fetch-and-index.js +91 -0
package/dist/tools/fetch-and-index.js.map +1 -0
package/dist/tools/index-content.d.ts +4 -0
package/dist/tools/index-content.d.ts.map +1 -0
package/dist/tools/index-content.js +85 -0
package/dist/tools/index-content.js.map +1 -0
package/dist/tools/search.d.ts +4 -0
package/dist/tools/search.d.ts.map +1 -0
package/dist/tools/search.js +57 -0
package/dist/tools/search.js.map +1 -0
package/dist/tools/stats.d.ts +4 -0
package/dist/tools/stats.d.ts.map +1 -0
package/dist/tools/stats.js +10 -0
package/dist/tools/stats.js.map +1 -0
package/dist/types.d.ts +11 -0
package/dist/types.d.ts.map +1 -1
package/dist/util/auto-mode.d.ts +40 -0
package/dist/util/auto-mode.d.ts.map +1 -0
package/dist/util/auto-mode.js +181 -0
package/dist/util/auto-mode.js.map +1 -0
package/dist/util/fetch-code.d.ts +10 -0
package/dist/util/fetch-code.d.ts.map +1 -0
package/dist/util/fetch-code.js +87 -0
package/dist/util/fetch-code.js.map +1 -0
package/dist/util/intent-filter.d.ts +17 -0
package/dist/util/intent-filter.d.ts.map +1 -0
package/dist/util/intent-filter.js +28 -0
package/dist/util/intent-filter.js.map +1 -0
package/dist/util/label.d.ts +4 -0
package/dist/util/label.d.ts.map +1 -0
package/dist/util/label.js +14 -0
package/dist/util/label.js.map +1 -0
package/dist/util/path.d.ts +8 -0
package/dist/util/path.d.ts.map +1 -0
package/dist/util/path.js +21 -0
package/dist/util/path.js.map +1 -0
package/dist/util/stream-compress.d.ts +36 -0
package/dist/util/stream-compress.d.ts.map +1 -0
package/dist/util/stream-compress.js +104 -0
package/dist/util/stream-compress.js.map +1 -0
package/dist/util/version.d.ts +2 -0
package/dist/util/version.d.ts.map +1 -0
package/dist/util/version.js +15 -0
package/dist/util/version.js.map +1 -0
package/docs/token-reduction-report.md +164 -88
package/hooks/pretooluse.mjs +38 -0
package/package.json +5 -4

package/docs/token-reduction-report.md CHANGED Viewed

@@ -6,6 +6,8 @@
 > provides a detailed before/after comparison for 12 common operations,
 > and addresses the natural question: "doesn't less tokens mean losing context?"
+**Version**: 2026.5.0 | **Last updated**: 2026-05-10
 ---
 ## Table of Contents
@@ -17,6 +19,7 @@
 - [Context Window Impact](#context-window-impact)
 - [Cost Impact](#cost-impact)
 - [Deep Dive: How Playwright Snapshot Goes from 56KB to 299B](#deep-dive-how-playwright-snapshot-goes-from-56kb-to-299b)
+- [Security and Reliability](#security-and-reliability)
 - [FAQ: Doesn't Less Tokens Mean Losing Context?](#faq-doesnt-less-tokens-mean-losing-context)
 ---
@@ -26,28 +29,48 @@
 Every byte of tool output that enters Claude Code's context window **consumes tokens permanently**. In a typical coding session:
 ```
-Read a bundled file          →  776KB  →  194,076 tokens
-Playwright browser snapshot  →   56KB  →   14,000 tokens
-npm test (42 tests)          →    4KB  →      935 tokens
-git diff (3 commits)         →    8KB  →    2,000 tokens
+Read a bundled file          →  776KB  →  155K-259K tokens
+Playwright browser snapshot  →   56KB  →   11K-19K tokens
+npm test (42 tests)          →    4KB  →     748-1,246 tokens
+git diff (3 commits)         →    8KB  →   1,600-2,667 tokens
                                          ─────────────────
-                                Total:    211,011 tokens
-                                         ← already exceeds 200K window
+                                Total:    169K-282K tokens
+                                         ← can overflow 200K window
 ```
-With just 4 operations, you've **overflowed the entire context window**. Earlier conversation messages get compressed or lost. The agent forgets what you asked. Quality degrades.
+> **Token estimation**: 1 token ≈ 3-5 bytes depending on content. We use a range (bytes/5 to bytes/3) because Anthropic does not publish a local tokenizer for Claude 3+ models.
+With just 4 operations, you risk **overflowing the entire context window**. Earlier conversation messages get compressed or lost. The agent forgets what you asked. Quality degrades.
 The worst part: **99% of that tool output is noise** — import statements, boilerplate, minified code, irrelevant test output. The agent doesn't benefit from seeing it. It just crowds out the conversation.
 ---
-## The Solution: 3-Layer Architecture
+## The Solution: 4-Layer Architecture
 context-compress doesn't delete data — it **defers** it. All data is preserved and searchable. Only the relevant parts enter context.
+### Layer 0: Command-Specific Output Filters (v2026.3.22)
+Before generic compression, output passes through command-aware filters that strip noise specific to each tool:
+| Command | What's Stripped | Typical Savings |
+|:--|:--|:--|
+| `git push/pull/fetch/clone` | Remote progress lines, object counting, delta resolution | 40-60% |
+| `git status` | Hint lines (`use "git add"...`), blank lines | 20-30% |
+| `npm/yarn/pnpm install` | Deprecation warnings, funding prompts, tree-drawing chars | 30-50% |
+| `npm test / jest / vitest / pytest` | Passing test details, keeps only failures + summary | 70-95% |
+| `cargo build / make / gradle` | Download progress, "Compiling X/Y", lock waits | 50-70% |
+| `docker build` | Layer hash lines (` ---> abc123`), build context transfer | 30-50% |
+| `ls -R / find / tree` | Directory grouping for large listings (50+ files) | 60-80% |
+Additionally, all output passes through:
+- **ANSI stripping**: Terminal escape codes (colors, cursor movement) are always removed — pure noise for LLMs
+- **Progress line removal**: Spinner characters, percentage bars, download/ETA lines are filtered
 ### Layer 1: Sandbox Execution
-The agent writes code to process data. Only `console.log()` output enters context.
+The agent writes code to process data. Only `console.log()` output enters context. 11 languages supported: JavaScript, TypeScript, Python, Shell, Ruby, Go, Rust, PHP, Perl, R, Elixir.
 ```
 execute_file("server.bundle.mjs", code: `
@@ -61,9 +84,11 @@ Context:       420 bytes (the extracted schema)
 The agent isn't blindly losing context — it's **choosing** what matters via code.
+**Safeguards**: Code input limited to 1MB. Subprocess timeout (default 30s). Output hard cap (100MB). Process group kill on timeout. Concurrent executions limited to 8 globally.
 ### Layer 2: FTS5 Knowledge Base
-Full data is stored in a searchable SQLite FTS5 database with BM25 ranking, Porter stemming, and fuzzy matching. The agent can query it at any time.
+Full data is stored in a searchable SQLite FTS5 database with BM25 ranking, Porter stemming, trigram matching, and Levenshtein fuzzy correction (with early-exit optimization).
 ```
 index(path: "snapshot.md")          → 56KB stored, 42 chunks created
@@ -74,6 +99,8 @@ search("order table row headers")   → 180B match returned
 Data is **not lost**. It's **indexed and searchable on demand**.
+**Persistence option**: Set `persistDb: true` in config to survive MCP server restarts.
 ### Layer 3: Intent-Based Auto-Filter
 When the agent provides an `intent` parameter, large outputs are automatically filtered:
@@ -93,116 +120,130 @@ Small outputs are **never compressed**. Large outputs are filtered by what was a
 The following comparison uses realistic output sizes measured from the context-compress project itself.
-> **Token calculation**: 1 token ≈ 4 bytes (English text average)
+> **Token calculation**: 1 token ≈ 3-5 bytes. The "Tokens" column shows the midpoint estimate (bytes/4). See [Cost Impact](#cost-impact) for range-based calculations.
 ### 1. Read large source file (server.ts ~21KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 21,000 | 5,250 | `Read` tool → full file dumped into context |
-| **After** | 350 | 88 | `execute_file` → agent prints only what it needs |
-| **Saved** | | **5,162** | **98.3% reduction** |
+| **Before** | 21,000 | ~5,250 | `Read` tool → full file dumped into context |
+| **After** | 350 | ~88 | `execute_file` → agent prints only what it needs |
+| **Saved** | | **~5,162** | **98.3% reduction** |
 ### 2. Read bundled file (server.bundle.mjs ~776KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 776,304 | 194,076 | `Read` tool → full file in context (truncated at 2000 lines) |
-| **After** | 420 | 105 | `execute_file` → extract specific function/pattern |
-| **Saved** | | **193,971** | **99.9% reduction** |
+| **Before** | 776,304 | ~194,076 | `Read` tool → full file in context (truncated at 2000 lines) |
+| **After** | 420 | ~105 | `execute_file` → extract specific function/pattern |
+| **Saved** | | **~193,971** | **99.9% reduction** |
 ### 3. npm test output (42 tests, ~3.7KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 3,739 | 935 | `Bash` → full stdout in context |
-| **After** | 180 | 45 | `execute` with `intent: "failing tests"` → summary only |
-| **Saved** | | **890** | **95.2% reduction** |
+| **Before** | 3,739 | ~935 | `Bash` → full stdout in context |
+| **After** | 180 | ~45 | `execute` with `intent: "failing tests"` → summary only |
+| **Saved** | | **~890** | **95.2% reduction** |
 ### 4. git log (full history, ~5KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 5,000 | 1,250 | `Bash git log` → all commits in context |
-| **After** | 250 | 63 | `execute` + `search` for specific commits |
-| **Saved** | | **1,187** | **95.0% reduction** |
+| **Before** | 5,000 | ~1,250 | `Bash git log` → all commits in context |
+| **After** | 250 | ~63 | `execute` + `search` for specific commits |
+| **Saved** | | **~1,187** | **95.0% reduction** |
 ### 5. git diff (3 commits, ~8KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 8,000 | 2,000 | `Bash git diff` → full patch in context |
-| **After** | 400 | 100 | `execute` + `search` for changed functions |
-| **Saved** | | **1,900** | **95.0% reduction** |
+| **Before** | 8,000 | ~2,000 | `Bash git diff` → full patch in context |
+| **After** | 400 | ~100 | `execute` + `search` for changed functions |
+| **Saved** | | **~1,900** | **95.0% reduction** |
 ### 6. grep across codebase (~1.4KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 1,442 | 361 | `Grep` → all matching lines in context |
-| **After** | 1,442 | 361 | Same — small output passes through as-is |
+| **Before** | 1,442 | ~361 | `Grep` → all matching lines in context |
+| **After** | 1,442 | ~361 | Same — small output passes through as-is |
 | **Saved** | | **0** | **0% — no overhead for small outputs** |
 ### 7. Playwright browser_snapshot (~56KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 56,000 | 14,000 | `browser_snapshot` → full accessibility tree in context |
-| **After** | 299 | 75 | save → `index` → `search` for specific elements |
-| **Saved** | | **13,925** | **99.5% reduction** |
+| **Before** | 56,000 | ~14,000 | `browser_snapshot` → full accessibility tree in context |
+| **After** | 299 | ~75 | save → `index` → `search` for specific elements |
+| **Saved** | | **~13,925** | **99.5% reduction** |
 ### 8. curl API response (JSON ~12KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 12,000 | 3,000 | `Bash curl` → full JSON response in context |
-| **After** | 350 | 88 | `execute` → extract specific fields with code |
-| **Saved** | | **2,912** | **97.1% reduction** |
+| **Before** | 12,000 | ~3,000 | `Bash curl` → full JSON response in context |
+| **After** | 350 | ~88 | `execute` → extract specific fields with code |
+| **Saved** | | **~2,912** | **97.1% reduction** |
 ### 9. fetch_and_index (web docs ~45KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 45,000 | 11,250 | `WebFetch` → full page markdown in context |
-| **After** | 3,000 | 750 | `fetch_and_index` → 3KB preview + rest searchable |
-| **Saved** | | **10,500** | **93.3% reduction** |
+| **Before** | 45,000 | ~11,250 | `WebFetch` → full page markdown in context |
+| **After** | 3,000 | ~750 | `fetch_and_index` → 3KB preview + rest searchable |
+| **Saved** | | **~10,500** | **93.3% reduction** |
+**Security**: SSRF protection with DNS rebinding prevention, IP pinning, redirect blocking, and 10MB response size limit. Prompt injection detection on fetched content.
 ### 10. batch_execute (5 commands, ~25KB total)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 25,000 | 6,250 | 5x `Bash` → all output in context |
-| **After** | 1,500 | 375 | `batch_execute` + search across all in 1 call |
-| **Saved** | | **5,875** | **94.0% reduction** |
+| **Before** | 25,000 | ~6,250 | 5x `Bash` → all output in context |
+| **After** | 1,500 | ~375 | `batch_execute` + search across all in 1 call |
+| **Saved** | | **~5,875** | **94.0% reduction** |
+**Performance**: Commands run with bounded concurrency (max 4 parallel). Global execution limit of 8 prevents resource exhaustion.
 ### 11. Read CSV/JSON data file (~100KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 100,000 | 25,000 | `Read` → file contents in context |
-| **After** | 500 | 125 | `execute_file` → extract/aggregate specific data |
-| **Saved** | | **24,875** | **99.5% reduction** |
+| **Before** | 100,000 | ~25,000 | `Read` → file contents in context |
+| **After** | 500 | ~125 | `execute_file` → extract/aggregate specific data |
+| **Saved** | | **~24,875** | **99.5% reduction** |
 ### 12. npm install log (~15KB)
-| | Bytes | Tokens | Method |
+| | Bytes | Tokens (est.) | Method |
+|:--|--:|--:|:--|
+| **Before** | 15,000 | ~3,750 | `Bash npm install` → full install log in context |
+| **After** | 200 | ~50 | `execute` with `intent: "errors"` → only issues shown |
+| **Saved** | | **~3,700** | **98.7% reduction** |
+### 13. npm test with ANSI + verbose output (~8KB, v2026.3.22)
+| | Bytes | Tokens (est.) | Method |
 |:--|--:|--:|:--|
-| **Before** | 15,000 | 3,750 | `Bash npm install` → full install log in context |
-| **After** | 200 | 50 | `execute` with `intent: "errors"` → only issues shown |
-| **Saved** | | **3,700** | **98.7% reduction** |
+| **Before** | 8,000 | ~2,000 | `Bash npm test` → full ANSI-colored verbose output in context |
+| **After** | 350 | ~88 | Command filter strips ANSI + passing tests → only failures + summary |
+| **Saved** | | **~1,912** | **95.6% reduction** |
+**Pipeline**: ANSI stripping → command filter (test runner detection) → progress line removal → deduplication → smart truncation. All 5 stages are applied automatically.
 ---
 ## Session Totals
-Combining all 12 operations from a single coding session:
+Combining all 13 operations from a single coding session:
 ```
-BEFORE:  1,043 KB  →  267,121 tokens consumed
-AFTER:       9 KB  →    2,223 tokens consumed
+BEFORE:  1,051 KB  →  ~263K tokens consumed (bytes/4 midpoint)
+AFTER:       9 KB  →    ~2.3K tokens consumed
                        ────────────────────────
-SAVED:   1,035 KB  →  264,898 tokens
-REDUCTION:                99.2%
+SAVED:   1,042 KB  →  ~260K tokens
+REDUCTION:                99.1%
 ```
 ---
@@ -216,42 +257,43 @@ Claude Code uses a 200K token context window.
 │                   200,000 token context window               │
 │                                                              │
 │  WITHOUT context-compress:                                   │
-│  ████████████████████████████████████████████████████ 133.6% │
-│  ← 12 operations OVERFLOW the window. Conversation lost.     │
+│  ████████████████████████████████████████████████████ ~132%  │
+│  ← 13 operations OVERFLOW the window. Conversation lost.     │
 │                                                              │
 │  WITH context-compress:                                      │
-│  █ 1.1%                                                      │
-│  ← 12 operations use 1.1%. 98.9% free for conversation.     │
+│  █ ~1.2%                                                     │
+│  ← 13 operations use ~1.2%. ~98.8% free for conversation.   │
 └─────────────────────────────────────────────────────────────┘
 ```
 | Metric | Before | After |
 |:--|--:|--:|
-| Tokens consumed | 267,121 | 2,223 |
-| % of context window | 133.6% | 1.1% |
-| Operations before compaction | ~9 | **~1,100** |
-| Conversation longevity | Short | **~121x longer** |
+| Tokens consumed (est.) | ~263,000 | ~2,300 |
+| % of context window | ~132% | ~1.2% |
+| Operations before compaction | ~9 | **~1,080** |
+| Conversation longevity | Short | **~117x longer** |
 ---
 ## Cost Impact
-Input token pricing (per session, 12 operations):
+Input token pricing (per session, 13 operations). Using midpoint estimate (bytes/4):
 | Model | Before | After | Saved per Session |
 |:--|--:|--:|--:|
-| Sonnet 4 ($3/MTok) | $0.80 | $0.007 | **$0.79** |
-| Opus 4 ($15/MTok) | $4.01 | $0.033 | **$3.97** |
+| Haiku 4.5 ($0.80/MTok) | $0.21 | $0.002 | **$0.21** |
+| Sonnet 4.6 ($3/MTok) | $0.78 | $0.007 | **$0.78** |
+| Opus 4.6 ($15/MTok) | $3.92 | $0.033 | **$3.89** |
-### Extrapolated Savings
+### Extrapolated Monthly Savings
-| Usage | Sonnet Monthly | Opus Monthly |
-|:--|--:|--:|
-| 5 sessions/day | $118.50 | $592.50 |
-| 10 sessions/day | $237.00 | **$1,185.00** |
-| 20 sessions/day | $474.00 | **$2,370.00** |
+| Usage | Haiku | Sonnet | Opus |
+|:--|--:|--:|--:|
+| 5 sessions/day | $31.05 | $116.44 | **$582.19** |
+| 10 sessions/day | $62.10 | $232.88 | **$1,164.38** |
+| 20 sessions/day | $124.20 | $465.75 | **$2,328.75** |
-> Note: These are input token savings only. Actual savings vary based on session complexity. Output tokens are unaffected.
+> Note: These are input token savings only. Actual savings vary based on session complexity. Output tokens are unaffected. Token estimates use the bytes/4 midpoint; actual counts may vary by 20-30%.
 ---
@@ -317,7 +359,7 @@ The `browser_snapshot()` tool returns a full accessibility tree:
   ... (thousands more lines for a real application)
 ```
-**All 56,000 bytes (14,000 tokens) dumped into context. Gone.**
+**All 56,000 bytes (~14,000 tokens) dumped into context. Gone.**
 The agent probably only needed the login form. But it paid for the entire page.
@@ -363,6 +405,37 @@ The other 55,701 bytes are still in FTS5 — fully searchable. Need the order ta
 ---
+## Security and Reliability
+context-compress v2026.5.0 includes comprehensive security and reliability features:
+### Security
+| Feature | Description |
+|:--|:--|
+| Environment isolation | Opt-in credential passthrough (`passthroughEnvVars` defaults to empty) |
+| SSRF protection | 4-layer defense: hostname validation, DNS rebinding prevention, IP pinning, redirect blocking |
+| Input limits | Code: 1MB max. Fetch response: 10MB max. Index content: 50MB max |
+| Concurrency control | Global limit of 8 concurrent executions. batch_execute: max 4 parallel |
+| Prompt injection detection | Regex-based advisory warnings on fetched content (7 patterns) |
+| Path traversal protection | `realpathSync` with symlink resolution + project boundary enforcement |
+| Process isolation | Timeout, output caps (100MB), process group kill, safe environment |
+### Reliability
+| Feature | Description |
+|:--|:--|
+| Graceful shutdown | Active subprocess tracking, SIGTERM/SIGINT cleanup, uncaughtException handling |
+| DB resilience | In-memory fallback on disk-full. WAL mode for crash recovery. Stale DB cleanup |
+| Output processing | ANSI stripping, progress line removal, command-specific filters, line deduplication, error grouping, smart 60/40 head/tail truncation |
+| Cumulative stats | Cross-session token savings persisted to `stats.json` when `persistDb` is enabled |
+| Search fallback | 3-layer: Porter stemming → trigram (lazy) → Levenshtein fuzzy correction |
+| Configuration | ENV > file > defaults with Zod validation and sanity clamping |
+For the full security model, see [SECURITY.md](../SECURITY.md).
+---
 ## FAQ: Doesn't Less Tokens Mean Losing Context?
 **This is the right question to ask.** If we're feeding the agent fewer tokens, doesn't it see less?
@@ -374,7 +447,7 @@ The other 55,701 bytes are still in FTS5 — fully searchable. Need the order ta
 ```
 WITHOUT context-compress (passive exposure):
 ┌──────────────────────────────────────────────────────┐
-│ 194,076 tokens loaded into context                   │
+│ ~194,000 tokens loaded into context                  │
 │                                                      │
 │  99% = imports, boilerplate, minified code,          │
 │        source maps, irrelevant functions...          │
@@ -390,7 +463,7 @@ WITHOUT context-compress (passive exposure):
 WITH context-compress (active retrieval):
 ┌──────────────────────────────────────────────────────┐
-│ 105 tokens loaded into context                       │
+│ ~105 tokens loaded into context                      │
 │                                                      │
 │  100% = exactly the function you care about          │
 │                                                      │
@@ -443,11 +516,13 @@ context-compress trades **passive exposure to noise** for **active retrieval of
 | Tool | Mechanism | Best For |
 |:--|:--|:--|
-| `execute` | Runs code in sandbox. Only `console.log` enters context | CLI commands, API calls, test runners |
+| `execute` | Runs code in sandbox (11 languages). Only `console.log` enters context | CLI commands, API calls, test runners |
 | `execute_file` | Reads file into sandbox. Only printed summary enters context | Large source files, CSVs, logs, data files |
 | `index` + `search` | FTS5 stores all data. BM25 returns only matching chunks | Documentation, snapshots, large datasets |
 | `fetch_and_index` | HTML → markdown → FTS5. Returns 3KB preview + searchable index | Web pages, API docs, reference material |
-| `batch_execute` | Runs N commands, indexes all output, searches across all in 1 call | Multi-step workflows, exploration |
+| `batch_execute` | Runs N commands (max 4 parallel), indexes all output, searches across all in 1 call | Multi-step workflows, exploration |
+| `discover` | Shows knowledge base inventory and optimization suggestions | Understanding available indexed data |
+| `stats` | Real-time session statistics with token range estimates and cost | Monitoring compression effectiveness |
 The core principle:
@@ -455,5 +530,6 @@ The core principle:
 ---
-*Generated from real benchmarks on the context-compress v1.0.0 codebase.*
-*Token calculation: 1 token ≈ 4 bytes (English text average).*
+*Generated from real benchmarks on the context-compress v2026.5.0 codebase.*
+*Token estimates use bytes/4 midpoint. Actual token counts may vary by 20-30% depending on content type.*
+*See SECURITY.md for the full trust model and security architecture.*

package/hooks/pretooluse.mjs CHANGED Viewed

@@ -6,6 +6,36 @@ var blockCurl = process.env.CONTEXT_COMPRESS_BLOCK_CURL !== "0";
 var blockWebFetch = process.env.CONTEXT_COMPRESS_BLOCK_WEBFETCH !== "0";
 var nudgeOnRead = process.env.CONTEXT_COMPRESS_NUDGE_READ !== "0";
 var nudgeOnGrep = process.env.CONTEXT_COMPRESS_NUDGE_GREP !== "0";
+var filterBash = process.env.CONTEXT_COMPRESS_FILTER_BASH === "1";
+var ccBin = process.env.CONTEXT_COMPRESS_BIN ?? "context-compress";
+var ccMode = process.env.CONTEXT_COMPRESS_MODE;
+var WRAP_TARGETS = [
+  /^git\s+(status|log|diff|show|blame|branch|stash\s+list|grep|ls-files)/,
+  /^(npm|yarn|pnpm|bun)\s+(install|i|add|test|run\s|update|outdated|audit|list|ls|view|info)/,
+  /^cargo\s+(build|test|check|run|clippy|tree|search|metadata)/,
+  /^(pytest|jest|mocha|vitest|tap|bats)\b/,
+  /^(find|grep|rg|fd|ag|ripgrep)\b/,
+  /^ls\s+(-R|-la|-al)/,
+  /^docker\s+(build|ps|logs|images|inspect|stats)/,
+  /^kubectl\s+(get|describe|logs|top|api-resources)/,
+  /^terraform\s+(plan|show|state\s+list|state\s+show|validate)/,
+  /^helm\s+(list|status|history|get)/,
+  /^(make|gradle|bazel|nx|turbo)\b/,
+  /^ps\s+(aux|-ef)/,
+  /^(top|htop)\b/,
+  /^(df|du)\b/,
+  /^(go|rustc)\s+(test|build|vet|run)/
+];
+function shouldWrap(cmd) {
+  const trimmed = cmd.trim();
+  if (/(?:^|\s)(?:>|>>|\d?>&)\s*\S/.test(trimmed)) return false;
+  if (/\|/.test(trimmed)) return false;
+  if (/&&|\|\||;/.test(trimmed)) return false;
+  return WRAP_TARGETS.some((re) => re.test(trimmed));
+}
+function shellQuote(s) {
+  return `'${s.replace(/'/g, "'\\''")}'`;
+}
 var raw = "";
 process.stdin.setEncoding("utf-8");
 for await (const chunk of process.stdin) raw += chunk;
@@ -37,6 +67,14 @@ if (tool === "Bash") {
       }
     });
   }
+  if (filterBash && shouldWrap(command)) {
+    const modeFlag = ccMode ? ` --mode ${ccMode}` : "";
+    respond({
+      updatedInput: {
+        command: `${ccBin} wrap${modeFlag} ${shellQuote(command)}`
+      }
+    });
+  }
   process.exit(0);
 }
 if (tool === "Read" && nudgeOnRead) {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "context-compress",
-  "version": "2026.3.21",
+  "version": "2026.5.0",
   "description": "Context-aware MCP server that compresses tool output for Claude Code",
   "type": "module",
   "main": "dist/server.js",
@@ -12,12 +12,13 @@
     "build:hooks": "esbuild src/hooks/pretooluse.ts --bundle --platform=node --format=esm --outfile=hooks/pretooluse.mjs --target=node18 && node -e \"const{createHash}=require('crypto'),{readFileSync,writeFileSync}=require('fs');const h=createHash('sha256').update(readFileSync('hooks/pretooluse.mjs')).digest('hex');writeFileSync('hooks/pretooluse.sha256',h+'\\n')\"",
     "dev": "tsx src/index.ts",
     "typecheck": "tsc --noEmit",
-    "lint": "biome check src/",
-    "lint:fix": "biome check --write src/",
+    "lint": "biome check --max-diagnostics=200 src/",
+    "lint:fix": "biome check --write --max-diagnostics=200 src/",
     "test": "node --import tsx --test tests/**/*.test.ts",
     "test:unit": "node --import tsx --test tests/unit/*.test.ts",
     "test:integration": "node --import tsx --test tests/integration/*.test.ts",
-    "clean": "rm -rf dist",
+    "clean": "rm -rf dist dist-bin",
+    "build:bin": "bun build --compile --target=bun-darwin-arm64 ./src/cli/lite.ts --outfile=./dist-bin/cc-lite-darwin-arm64 && bun build --compile --target=bun-darwin-x64 ./src/cli/lite.ts --outfile=./dist-bin/cc-lite-darwin-x64 && bun build --compile --target=bun-linux-x64 ./src/cli/lite.ts --outfile=./dist-bin/cc-lite-linux-x64 && bun build --compile --target=bun-linux-arm64 ./src/cli/lite.ts --outfile=./dist-bin/cc-lite-linux-arm64",
     "prepublishOnly": "npm run lint && npm run test && npm run build"
   },
   "engines": {