npm - @martian-engineering/lossless-claw - Versions diffs - 0.6.2 → 0.7.0 - Mend

@martian-engineering/lossless-claw 0.6.2 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31)

package/README.md +16 -4
package/docs/agent-tools.md +7 -1
package/docs/configuration.md +200 -200
package/openclaw.plugin.json +123 -0
package/package.json +1 -1
package/skills/lossless-claw/references/config.md +135 -3
package/src/assembler.ts +5 -1
package/src/compaction.ts +149 -38
package/src/db/config.ts +102 -4
package/src/db/connection.ts +20 -2
package/src/db/migration.ts +57 -0
package/src/engine.ts +980 -122
package/src/lcm-log.ts +37 -0
package/src/plugin/index.ts +407 -74
package/src/plugin/lcm-command.ts +10 -4
package/src/plugin/shared-init.ts +59 -0
package/src/prune.ts +391 -0
package/src/retrieval.ts +7 -5
package/src/startup-banner-log.ts +1 -0
package/src/store/compaction-telemetry-store.ts +156 -0
package/src/store/conversation-store.ts +6 -1
package/src/store/fts5-sanitize.ts +25 -4
package/src/store/full-text-sort.ts +21 -0
package/src/store/index.ts +8 -0
package/src/store/summary-store.ts +21 -14
package/src/summarize.ts +54 -30
package/src/tools/lcm-describe-tool.ts +9 -4
package/src/tools/lcm-expand-query-tool.ts +11 -6
package/src/tools/lcm-expand-tool.ts +9 -4
package/src/tools/lcm-grep-tool.ts +22 -8
package/src/types.ts +1 -0

package/openclaw.plugin.json CHANGED Viewed

@@ -4,6 +4,10 @@
     "skills/lossless-claw"
   ],
   "uiHints": {
+    "enabled": {
+      "label": "Enabled",
+      "help": "Enable or disable lossless-claw without uninstalling it"
+    },
     "contextThreshold": {
       "label": "Context Threshold",
       "help": "Fraction of context window that triggers compaction (0.0–1.0)"
@@ -40,10 +44,26 @@
       "label": "Max Expand Tokens",
       "help": "Token cap for lcm_expand_query expansion calls"
     },
+    "leafMinFanout": {
+      "label": "Leaf Min Fanout",
+      "help": "Minimum number of raw messages required before a leaf compaction pass runs"
+    },
+    "condensedMinFanout": {
+      "label": "Condensed Min Fanout",
+      "help": "Number of same-depth summaries required before condensation is attempted"
+    },
+    "condensedMinFanoutHard": {
+      "label": "Condensed Min Fanout Hard",
+      "help": "Hard floor for condensation grouping during maintenance and repair flows"
+    },
     "dbPath": {
       "label": "Database Path",
       "help": "Path to LCM SQLite database (default: ~/.openclaw/lcm.db)"
     },
+    "databasePath": {
+      "label": "Database Path",
+      "help": "Path to LCM SQLite database (preferred key; alias of dbPath)"
+    },
     "ignoreSessionPatterns": {
       "label": "Ignored Sessions",
       "help": "Glob patterns for session keys to exclude from LCM storage"
@@ -56,6 +76,14 @@
       "label": "Skip Stateless Sessions",
       "help": "When enabled, matching stateless session keys skip LCM persistence and grant writes"
     },
+    "largeFileThresholdTokens": {
+      "label": "Large File Threshold Tokens",
+      "help": "Token threshold that routes text attachments into large-file summarization"
+    },
+    "largeFileTokenThreshold": {
+      "label": "Large File Threshold Tokens",
+      "help": "Legacy alias of largeFileThresholdTokens"
+    },
     "summaryModel": {
       "label": "Summary Model",
       "help": "Model override for LCM summarization (e.g., 'gpt-5.4' to reuse the session provider, or 'openai-resp/gpt-5.4' for a full cross-provider ref)"
@@ -100,6 +128,38 @@
       "label": "Custom Instructions",
       "help": "Natural language instructions injected into all summarization prompts (e.g., formatting rules, tone control)"
     },
+    "circuitBreakerThreshold": {
+      "label": "Circuit Breaker Threshold",
+      "help": "Consecutive auth failures before the summarization circuit breaker trips"
+    },
+    "circuitBreakerCooldownMs": {
+      "label": "Circuit Breaker Cooldown (ms)",
+      "help": "Cooldown before the summarization circuit breaker auto-resets"
+    },
+    "cacheAwareCompaction.enabled": {
+      "label": "Cache-Aware Compaction",
+      "help": "When enabled, hot prompt cache defers incremental compaction while cold cache allows bounded catch-up passes"
+    },
+    "cacheAwareCompaction.maxColdCacheCatchupPasses": {
+      "label": "Cold Cache Catch-Up Passes",
+      "help": "Maximum incremental leaf passes allowed in one maintenance cycle when prompt cache is cold"
+    },
+    "cacheAwareCompaction.hotCachePressureFactor": {
+      "label": "Hot Cache Pressure Factor",
+      "help": "Multiplier applied to the hot-cache leaf trigger before raw-history pressure overrides cache preservation"
+    },
+    "cacheAwareCompaction.hotCacheBudgetHeadroomRatio": {
+      "label": "Hot Cache Budget Headroom",
+      "help": "Fraction of the real token budget that must remain free before hot-cache incremental compaction is skipped entirely"
+    },
+    "dynamicLeafChunkTokens.enabled": {
+      "label": "Dynamic Leaf Chunk Tokens",
+      "help": "When enabled, incremental compaction uses a larger working leaf chunk in busy sessions and keeps the static floor in quieter sessions"
+    },
+    "dynamicLeafChunkTokens.max": {
+      "label": "Dynamic Leaf Chunk Max",
+      "help": "Maximum working leaf chunk target for dynamic incremental compaction. The static leafChunkTokens value remains the floor."
+    },
     "timezone": {
       "label": "Timezone",
       "help": "IANA timezone used for summary timestamps"
@@ -107,6 +167,10 @@
     "pruneHeartbeatOk": {
       "label": "Prune HEARTBEAT_OK",
       "help": "Retroactively delete HEARTBEAT_OK turn cycles from LCM storage"
+    },
+    "fallbackProviders": {
+      "label": "Fallback Providers",
+      "help": "Explicit fallback provider/model pairs for compaction summarization (e.g., [{\"provider\": \"anthropic\", \"model\": \"claude-haiku-4-5\"}])"
     }
   },
   "configSchema": {
@@ -187,6 +251,10 @@
         "type": "integer",
         "minimum": 1000
       },
+      "largeFileTokenThreshold": {
+        "type": "integer",
+        "minimum": 1000
+      },
       "summaryModel": {
         "type": "string"
       },
@@ -224,6 +292,49 @@
       "customInstructions": {
         "type": "string"
       },
+      "circuitBreakerThreshold": {
+        "type": "integer",
+        "minimum": 1
+      },
+      "circuitBreakerCooldownMs": {
+        "type": "integer",
+        "minimum": 1
+      },
+      "cacheAwareCompaction": {
+        "type": "object",
+        "additionalProperties": false,
+        "properties": {
+          "enabled": {
+            "type": "boolean"
+          },
+          "maxColdCacheCatchupPasses": {
+            "type": "integer",
+            "minimum": 1
+          },
+          "hotCachePressureFactor": {
+            "type": "number",
+            "minimum": 1
+          },
+          "hotCacheBudgetHeadroomRatio": {
+            "type": "number",
+            "minimum": 0,
+            "maximum": 0.95
+          }
+        }
+      },
+      "dynamicLeafChunkTokens": {
+        "type": "object",
+        "additionalProperties": false,
+        "properties": {
+          "enabled": {
+            "type": "boolean"
+          },
+          "max": {
+            "type": "integer",
+            "minimum": 1
+          }
+        }
+      },
       "timezone": {
         "type": "string"
       },
@@ -233,6 +344,18 @@
       "databasePath": {
         "description": "Path to LCM SQLite database (alias for dbPath)",
         "type": "string"
+      },
+      "fallbackProviders": {
+        "type": "array",
+        "items": {
+          "type": "object",
+          "properties": {
+            "provider": { "type": "string" },
+            "model": { "type": "string" }
+          },
+          "required": ["provider", "model"],
+          "additionalProperties": false
+        }
       }
     }
   }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@martian-engineering/lossless-claw",
-  "version": "0.6.2",
+  "version": "0.7.0",
   "description": "Lossless Context Management plugin for OpenClaw — DAG-based conversation summarization with incremental compaction",
   "type": "module",
   "main": "index.ts",

package/skills/lossless-claw/references/config.md CHANGED Viewed

@@ -1,6 +1,6 @@
 # Configuration
-This reference covers the current `lossless-claw` config surface on `main`, based on `openclaw.plugin.json`.
+This reference covers the current `lossless-claw` config surface on `main`, based on `openclaw.plugin.json`, [`docs/configuration.md`](../../../docs/configuration.md), and the runtime defaults in [`src/db/config.ts`](../../../src/db/config.ts).
 `lossless-claw` is most effective when the operator understands which settings change compaction behavior and why.
@@ -57,6 +57,49 @@ Use this when:
 - Your summarizer is rate-limited or expensive.
 - You want fewer but broader leaf summaries.
+### `cacheAwareCompaction`
+Controls how strongly lossless-claw preserves a healthy prompt cache during incremental maintenance.
+Why it matters:
+- Hot cache now prefers to keep the cache intact instead of eagerly compacting old raw history.
+- Cold cache still allows bounded catch-up passes so stale sessions can converge.
+- The new defaults are intentionally more aggressive about preserving cache than earlier builds.
+Good defaults:
+- `enabled: true`
+- `maxColdCacheCatchupPasses: 2`
+- `hotCachePressureFactor: 4`
+- `hotCacheBudgetHeadroomRatio: 0.2`
+Operationally:
+- hot cache stretches the incremental leaf trigger to `dynamicLeafChunkTokens.max`
+- hot cache skips incremental maintenance entirely when the assembled context is comfortably below the real token budget
+- hot cache gets a short hysteresis window so a recent cache hit stays "hot" briefly unless telemetry shows a break
+- if hot-cache maintenance still runs, it stays leaf-only and suppresses follow-on condensed passes
+### `dynamicLeafChunkTokens`
+Controls the working leaf-trigger size used by incremental compaction.
+Why it matters:
+- dynamic sizing is now enabled by default
+- busier sessions can use a larger working chunk without changing the static floor
+- hot cache uses the dynamic max as the working leaf trigger
+Good defaults:
+- `enabled: true`
+- `max: 2 * leafChunkTokens`
+With the default `leafChunkTokens=20000`, that means:
+- `dynamicLeafChunkTokens.max = 40000`
 ### `incrementalMaxDepth`
 Controls how far automatic condensation cascades after leaf compaction.
@@ -112,6 +155,15 @@ Why it matters:
 - useful for custom deployments, testing, or isolating environments
 - wrong path selection is a common reason operators think LCM is empty or not growing
+### `databasePath`
+Preferred alias of `dbPath`.
+Why it matters:
+- this is the documented key new config should use
+- `dbPath` is still accepted for compatibility
 ### `largeFileThresholdTokens`
 Threshold for externalizing oversized tool/file payloads out of the main transcript into large-file storage.
@@ -166,6 +218,16 @@ Why it matters:
 See high-impact settings above.
+### `bootstrapMaxTokens`
+Maximum raw parent-history tokens imported when a brand-new LCM conversation bootstraps.
+Why it matters:
+- keeps first-time bootstrap from flooding the conversation with too much old transcript material
+- defaults to `max(6000, floor(leafChunkTokens * 0.3))`
+- only affects the first import path, not ordinary steady-state turns
 ## Session-selection controls
 ### `ignoreSessionPatterns`
@@ -223,6 +285,62 @@ Why it matters:
 - useful when the runtime model window is smaller than the surrounding system assumes
 - can prevent oversized assembly on smaller-context models
+## Nested objects
+### `cacheAwareCompaction`
+#### `cacheAwareCompaction.enabled`
+Defers incremental leaf compaction more aggressively when prompt-cache telemetry indicates a hot cache.
+#### `cacheAwareCompaction.maxColdCacheCatchupPasses`
+Maximum bounded catch-up passes allowed in one maintenance cycle when cache telemetry is cold.
+#### `cacheAwareCompaction.hotCachePressureFactor`
+Multiplier applied to the hot-cache leaf trigger before raw-history pressure overrides cache preservation.
+Why it matters:
+- higher values preserve hot cache longer
+- lower values revert toward more eager incremental compaction
+Default:
+- `4`
+#### `cacheAwareCompaction.hotCacheBudgetHeadroomRatio`
+Minimum fraction of the real token budget that must remain free before hot-cache incremental compaction is skipped entirely.
+Why it matters:
+- higher values make hot-cache skip behavior stricter
+- lower values allow more hot-cache maintenance before real budget pressure exists
+Default:
+- `0.2`
+### `dynamicLeafChunkTokens`
+#### `dynamicLeafChunkTokens.enabled`
+Enables dynamic working leaf chunk sizes for busier sessions.
+Default:
+- `true`
+#### `dynamicLeafChunkTokens.max`
+Upper bound for the dynamic working chunk size. The static `leafChunkTokens` value remains the floor.
+Default:
+- `max(leafChunkTokens, floor(leafChunkTokens * 2))`
 ## Summary quality and prompt controls
 ### `summaryMaxOverageFactor`
@@ -249,8 +367,12 @@ Why it matters:
 2. Set the context-engine slot to `lossless-claw`.
 3. Start with conservative defaults.
 4. Run `/lossless` after startup to confirm path, size, and summary health.
-5. If recall feels weak, revisit `freshTailCount`, `leafChunkTokens`, and summarizer model quality before changing anything else.
-6. Touch advanced knobs like fanout, large-file thresholds, custom instructions, and assembly caps only after a concrete symptom appears.
+5. If hot-cache turns still compact too often, inspect the decision logs before changing anything else:
+   - `reason=hot-cache-budget-headroom` means the new skip path is working.
+   - `reason=hot-cache-defer` means raw-history pressure is below the configured hot-cache factor.
+   - `allowCondensedPasses=false` on hot-cache turns is expected.
+6. If recall feels weak, revisit `freshTailCount`, `leafChunkTokens`, and summarizer model quality before changing anything else.
+7. Touch advanced knobs like fanout, large-file thresholds, custom instructions, and assembly caps only after a concrete symptom appears.
 ## Reading the status output
@@ -261,3 +383,13 @@ Useful interpretation notes:
 - `tokens in context` is the current LCM frontier token count in the live LCM state.
 - `compression ratio` is shown as a rounded `1:N`, which is easier to read than a tiny percentage for heavily compacted conversations.
 - `/status` may still show a different context number because it reflects the runtime prompt that was actually assembled and sent on the last turn.
+## Keep this reference aligned
+This file should stay consistent with:
+- [`docs/configuration.md`](../../../docs/configuration.md)
+- [`openclaw.plugin.json`](../../../openclaw.plugin.json)
+- [`src/db/config.ts`](../../../src/db/config.ts)
+When config keys, aliases, defaults, or precedence rules change, update all of them together.

package/src/assembler.ts CHANGED Viewed

@@ -93,7 +93,11 @@ function buildSystemPromptAddition(summarySignals: SummaryPromptSignal[]): strin
       "Default recall flow for precision work:",
       "1) `lcm_grep` to locate relevant summary/message IDs",
       "2) `lcm_expand_query` with a focused prompt",
-      "3) Answer with citations to summary IDs used",
+      "3) Answer directly from the retrieved evidence",
+      "",
+      "Keep raw summary IDs in tool context for follow-up; do not include them in the user-facing answer unless the user asks for sources or IDs.",
+      "",
+      "`lcm_grep` tips: prefer `mode: \"full_text\"` for keyword/topic lookup, quote exact multi-word phrases, use `sort: \"relevance\"` for older-topic retrieval, and use `sort: \"hybrid\"` when recency should still influence ranking.",
       "",
       "**Uncertainty checklist (run before answering):**",
       "- Am I making an exact factual claim from a compressed or condensed summary?",