@joshuaswarren/openclaw-engram 9.0.52 → 9.0.53
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +7 -0
- package/dist/index.js +7 -0
- package/dist/index.js.map +1 -1
- package/package.json +1 -1
package/README.md
CHANGED
|
@@ -33,6 +33,7 @@ AI agents forget everything between conversations. Engram fixes that.
|
|
|
33
33
|
- **Benchmark-first roadmap** — Engram now has an evaluation harness with live shadow recall recording and a CI benchmark delta gate, so memory improvements can be measured and regression-checked instead of argued from anecdotes.
|
|
34
34
|
- **Baseline snapshot discipline** — When `benchmarkBaselineSnapshotsEnabled` is enabled, Engram can now capture typed baseline snapshots of the latest completed benchmark runs so later PR delta reporting can compare candidates against a stable stored reference instead of an ad hoc branch state.
|
|
35
35
|
- **Named baseline delta reporting** — When `benchmarkDeltaReporterEnabled` is enabled, Engram can now compare the current eval store against a stored baseline snapshot, emit a machine-readable delta report plus a markdown summary, and fail fast when a candidate regresses a benchmark that previously passed.
|
|
36
|
+
- **Required CI baseline gate** — Engram's `eval-benchmark-gate` workflow now reads a named stored baseline snapshot from the base branch fixture store and blocks merges when the candidate branch regresses relative to that required baseline.
|
|
36
37
|
- **Objective-state recall** — Engram can now store normalized file, process, and tool outcomes and, when `objectiveStateRecallEnabled` is enabled, inject the most relevant objective-state snapshots back into recall context as a separate `Objective State` section.
|
|
37
38
|
- **Causal trajectory graph foundation** — Engram can now persist typed `goal -> action -> observation -> outcome -> follow-up` chains when `causalTrajectoryMemoryEnabled` is enabled and, with `actionGraphRecallEnabled`, emit deterministic action-conditioned edges into the causal graph for later trajectory-aware retrieval.
|
|
38
39
|
- **Causal trajectory recall** — When `causalTrajectoryRecallEnabled` is enabled, Engram can now inject prompt-relevant causal chains back into recall context as a separate `Causal Trajectories` section with lightweight match explainability.
|
|
@@ -215,6 +216,12 @@ Key settings:
|
|
|
215
216
|
| `evalShadowModeEnabled` | `false` | Record live recall decisions to the eval store without changing injected output |
|
|
216
217
|
| `benchmarkBaselineSnapshotsEnabled` | `false` | Enable versioned baseline snapshot artifacts for the latest completed benchmark runs |
|
|
217
218
|
| `benchmarkDeltaReporterEnabled` | `false` | Enable named-baseline delta reports against the current eval store |
|
|
219
|
+
|
|
220
|
+
The repo's required benchmark check uses the committed fixture snapshot at
|
|
221
|
+
`tests/fixtures/eval-ci/store/baselines/required-main.json` as the stable
|
|
222
|
+
release baseline for PR gating. During the rollout PR that first introduces
|
|
223
|
+
that file, the gate bootstraps from the candidate branch snapshot once; after
|
|
224
|
+
that, PRs resolve the required baseline from the base branch checkout.
|
|
218
225
|
| `evalStoreDir` | `{memoryDir}/state/evals` | Root directory for benchmark packs, run summaries, and shadow recall records |
|
|
219
226
|
| `objectiveStateMemoryEnabled` | `false` | Enable the objective-state memory foundation for normalized world/tool state snapshots |
|
|
220
227
|
| `objectiveStateSnapshotWritesEnabled` | `false` | Permit objective-state snapshot writers to persist typed state records |
|
package/dist/index.js
CHANGED
|
@@ -12239,6 +12239,13 @@ async function runEvalBaselineDeltaReport(options) {
|
|
|
12239
12239
|
if (!baselineSnapshot) {
|
|
12240
12240
|
throw new Error(`benchmark baseline snapshot not found: ${snapshotId}`);
|
|
12241
12241
|
}
|
|
12242
|
+
return buildEvalBaselineDeltaReport({
|
|
12243
|
+
baselineSnapshot,
|
|
12244
|
+
candidateSnapshot
|
|
12245
|
+
});
|
|
12246
|
+
}
|
|
12247
|
+
function buildEvalBaselineDeltaReport(options) {
|
|
12248
|
+
const { baselineSnapshot, candidateSnapshot } = options;
|
|
12242
12249
|
const regressions = [];
|
|
12243
12250
|
const improvements = [];
|
|
12244
12251
|
if (candidateSnapshot.status.invalidBenchmarks.length > 0) {
|