@simbimbo/memory-ocmemog 0.1.4 → 0.1.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +27 -0
- package/README.md +9 -7
- package/brain/runtime/inference.py +31 -1
- package/brain/runtime/memory/api.py +824 -5
- package/brain/runtime/memory/context_builder.py +101 -76
- package/brain/runtime/memory/distill.py +156 -13
- package/brain/runtime/memory/freshness.py +24 -1
- package/brain/runtime/memory/integrity.py +22 -6
- package/brain/runtime/memory/pondering_engine.py +87 -8
- package/brain/runtime/memory/promote.py +6 -0
- package/brain/runtime/memory/provenance.py +52 -0
- package/brain/runtime/memory/retrieval.py +116 -50
- package/brain/runtime/memory/vector_index.py +67 -5
- package/docs/notes/2026-03-18-memory-repair-and-backfill.md +70 -0
- package/docs/notes/local-model-role-matrix-2026-03-18.md +50 -0
- package/docs/usage.md +16 -14
- package/index.ts +1 -1
- package/ocmemog/sidecar/app.py +381 -9
- package/ocmemog/sidecar/compat.py +7 -1
- package/ocmemog/sidecar/transcript_watcher.py +2 -2
- package/package.json +1 -1
- package/scripts/install-ocmemog.sh +2 -2
- package/scripts/ocmemog-backfill-vectors.py +33 -0
- package/scripts/ocmemog-context.sh +1 -1
- package/scripts/ocmemog-demo.py +1 -1
- package/scripts/ocmemog-load-test.py +1 -1
- package/scripts/ocmemog-ponder.sh +2 -2
- package/scripts/ocmemog-recall-test.py +1 -1
- package/scripts/ocmemog-reindex-vectors.py +8 -0
- package/scripts/ocmemog-reliability-soak.py +1 -1
- package/scripts/ocmemog-sidecar.sh +33 -7
- package/scripts/ocmemog-test-rig.py +1 -1
package/CHANGELOG.md
CHANGED
|
@@ -1,5 +1,32 @@
|
|
|
1
1
|
# Changelog
|
|
2
2
|
|
|
3
|
+
## 0.1.6 — 2026-03-19
|
|
4
|
+
|
|
5
|
+
Port-separation and publish-solid follow-up.
|
|
6
|
+
|
|
7
|
+
### Highlights
|
|
8
|
+
- Split ocmemog sidecar onto dedicated loopback port `17891` to avoid collision with the OpenClaw gateway/dashboard on `17890`
|
|
9
|
+
- Restored the plain realtime dashboard on `/dashboard` and fixed the `local_html` template crash
|
|
10
|
+
- Updated plugin/runtime defaults, scripts, and documentation to use the dedicated sidecar endpoint on `17891`
|
|
11
|
+
- Added governance retrieval/governance-policy hardening plus expanded regression coverage for duplicate, contradiction, supersession, queue, audit, rollback, and auto-resolve flows
|
|
12
|
+
- Aligned package/version metadata across npm, Python, and FastAPI surfaces
|
|
13
|
+
|
|
14
|
+
## 0.1.5 — 2026-03-18
|
|
15
|
+
|
|
16
|
+
Repair and hardening follow-up after the 0.1.4 publish.
|
|
17
|
+
|
|
18
|
+
### Highlights
|
|
19
|
+
- Fixed vector reindex defaults so repair scripts use provider-backed Ollama embeddings instead of silently rebuilding weak local/hash vectors
|
|
20
|
+
- Added battery-aware sidecar defaults for macOS laptops (`OCMEMOG_LAPTOP_MODE=auto|ac|battery`)
|
|
21
|
+
- Fixed `record_reinforcement()` so new experiences preserve `memory_reference`, and added integrity repair to backfill legacy missing references
|
|
22
|
+
- Added incremental vector backfill tooling (`scripts/ocmemog-backfill-vectors.py`) for non-destructive backlog repair
|
|
23
|
+
- Cleaned freshness summaries so junk placeholders (`promoted`, `summary`, `No local memory summary available`) do not pollute advisories
|
|
24
|
+
- Improved integrity reporting to count duplicate promotion groups accurately
|
|
25
|
+
|
|
26
|
+
### Notes
|
|
27
|
+
- Historical vector backlog still exists and should be burned down in staged backfills, especially for `knowledge`
|
|
28
|
+
- Detailed repair notes: `docs/notes/2026-03-18-memory-repair-and-backfill.md`
|
|
29
|
+
|
|
3
30
|
## 0.1.4 — 2026-03-18
|
|
4
31
|
|
|
5
32
|
Package ownership + runtime safety release.
|
package/README.md
CHANGED
|
@@ -32,7 +32,7 @@ pip install -r requirements.txt
|
|
|
32
32
|
./scripts/ocmemog-sidecar.sh
|
|
33
33
|
|
|
34
34
|
# then open
|
|
35
|
-
# http://127.0.0.1:17890/dashboard
|
|
35
|
+
# http://127.0.0.1:17891/dashboard
|
|
36
36
|
```
|
|
37
37
|
|
|
38
38
|
## Optional: transcript watcher (auto-ingest)
|
|
@@ -45,8 +45,8 @@ export OCMEMOG_TRANSCRIPT_DIR="$HOME/.openclaw/workspace/memory/transcripts"
|
|
|
45
45
|
|
|
46
46
|
Default bind:
|
|
47
47
|
|
|
48
|
-
- endpoint: `http://127.0.0.1:
|
|
49
|
-
- health: `http://127.0.0.1:17890/healthz`
|
|
48
|
+
- endpoint: `http://127.0.0.1:17891`
|
|
49
|
+
- health: `http://127.0.0.1:17891/healthz`
|
|
50
50
|
|
|
51
51
|
## Continuity proof / benchmark harness
|
|
52
52
|
|
|
@@ -83,14 +83,15 @@ Optional environment variables:
|
|
|
83
83
|
- `OCMEMOG_TRANSCRIPT_ROOTS` (comma-separated allowed roots for transcript context retrieval; default: `~/.openclaw/workspace/memory`)
|
|
84
84
|
- `OCMEMOG_API_TOKEN` (optional; if set, requests must include `x-ocmemog-token` or `Authorization: Bearer ...`)
|
|
85
85
|
- `OCMEMOG_AUTO_HYDRATION` (`true` to re-enable prompt-time continuity prepending; defaults to `false` as a safety guard until the host runtime is verified not to persist prepended context into session history)
|
|
86
|
+
- `OCMEMOG_LAPTOP_MODE` (`auto` by default; on macOS battery power this slows watcher polling, reduces ingest batch size, and disables sentiment reinforcement unless explicitly overridden)
|
|
86
87
|
- `OCMEMOG_USE_OLLAMA` (`true` to use Ollama for distill/inference)
|
|
87
88
|
- `OCMEMOG_OLLAMA_HOST` (default: `http://127.0.0.1:11434`)
|
|
88
|
-
- `OCMEMOG_OLLAMA_MODEL` (default: `phi3:latest`)
|
|
89
|
+
- `OCMEMOG_OLLAMA_MODEL` (default: `phi3:latest`; lightweight local fallback / cheap cognition)
|
|
89
90
|
- `OCMEMOG_OLLAMA_EMBED_MODEL` (default: `nomic-embed-text:latest`)
|
|
90
91
|
- `OCMEMOG_PROMOTION_THRESHOLD` (default: `0.5`)
|
|
91
92
|
- `OCMEMOG_DEMOTION_THRESHOLD` (default: `0.2`)
|
|
92
93
|
- `OCMEMOG_PONDER_ENABLED` (default: `true`)
|
|
93
|
-
- `OCMEMOG_PONDER_MODEL` (default: `
|
|
94
|
+
- `OCMEMOG_PONDER_MODEL` (default via launcher: `qwen2.5:7b`; recommended for structured local memory refinement)
|
|
94
95
|
- `OCMEMOG_LESSON_MINING_ENABLED` (default: `true`)
|
|
95
96
|
|
|
96
97
|
## Security
|
|
@@ -153,7 +154,7 @@ launchctl bootstrap gui/$UID scripts/launchagents/com.openclaw.ocmemog.guard.pli
|
|
|
153
154
|
|
|
154
155
|
## Recent changes
|
|
155
156
|
|
|
156
|
-
### 0.1.4
|
|
157
|
+
### 0.1.5 (current main)
|
|
157
158
|
|
|
158
159
|
Package ownership + runtime safety release:
|
|
159
160
|
- Publish package under `@simbimbo/memory-ocmemog` instead of the unauthorized `@openclaw` scope
|
|
@@ -192,7 +193,7 @@ plugins:
|
|
|
192
193
|
memory-ocmemog:
|
|
193
194
|
enabled: true
|
|
194
195
|
config:
|
|
195
|
-
endpoint: http://127.0.0.1:17890
|
|
196
|
+
endpoint: http://127.0.0.1:17891
|
|
196
197
|
timeoutMs: 30000
|
|
197
198
|
```
|
|
198
199
|
|
|
@@ -221,3 +222,4 @@ Current limitations before broader public rollout:
|
|
|
221
222
|
- Public release/distribution metadata is still being tightened up
|
|
222
223
|
|
|
223
224
|
When a richer path is unavailable, the sidecar is designed to fail soft with explicit warnings rather than crash.
|
|
225
|
+
soft with explicit warnings rather than crash.
|
|
@@ -33,13 +33,43 @@ def _infer_ollama(prompt: str, model: str | None = None) -> dict[str, str]:
|
|
|
33
33
|
return {"status": "ok", "output": str(output).strip()}
|
|
34
34
|
|
|
35
35
|
|
|
36
|
+
def _looks_like_ollama_model(name: str) -> bool:
|
|
37
|
+
if not name:
|
|
38
|
+
return False
|
|
39
|
+
lowered = name.strip().lower()
|
|
40
|
+
if lowered.startswith("ollama:"):
|
|
41
|
+
return True
|
|
42
|
+
if "/" in lowered:
|
|
43
|
+
return False
|
|
44
|
+
return ":" in lowered
|
|
45
|
+
|
|
46
|
+
|
|
47
|
+
def stats() -> dict[str, object]:
|
|
48
|
+
materialized_local = int(_LOCAL_INFER_STATS.get("local_success", 0)) + int(_LOCAL_INFER_STATS.get("cache_hits", 0))
|
|
49
|
+
est_prompt_tokens_saved = materialized_local * _AVG_PROMPT_TOKENS_SAVED
|
|
50
|
+
est_completion_tokens_saved = materialized_local * _AVG_COMPLETION_TOKENS_SAVED
|
|
51
|
+
est_cost_saved = (
|
|
52
|
+
(est_prompt_tokens_saved / 1000.0) * _EST_FRONTIER_INPUT_COST_PER_1K
|
|
53
|
+
+ (est_completion_tokens_saved / 1000.0) * _EST_FRONTIER_OUTPUT_COST_PER_1K
|
|
54
|
+
)
|
|
55
|
+
return {
|
|
56
|
+
"cache_entries": len(_LOCAL_INFER_CACHE),
|
|
57
|
+
"warm_models": sorted(_MODEL_WARM_STATE.keys()),
|
|
58
|
+
"frontier_calls_avoided_est": materialized_local,
|
|
59
|
+
"prompt_tokens_saved_est": est_prompt_tokens_saved,
|
|
60
|
+
"completion_tokens_saved_est": est_completion_tokens_saved,
|
|
61
|
+
"cost_saved_usd_est": round(est_cost_saved, 4),
|
|
62
|
+
**{k: int(v) for k, v in _LOCAL_INFER_STATS.items()},
|
|
63
|
+
}
|
|
64
|
+
|
|
65
|
+
|
|
36
66
|
def infer(prompt: str, provider_name: str | None = None) -> dict[str, str]:
|
|
37
67
|
if not isinstance(prompt, str) or not prompt.strip():
|
|
38
68
|
return {"status": "error", "error": "empty_prompt"}
|
|
39
69
|
|
|
40
70
|
use_ollama = os.environ.get("OCMEMOG_USE_OLLAMA", "").lower() in {"1", "true", "yes"}
|
|
41
71
|
model_override = provider_name or config.OCMEMOG_MEMORY_MODEL
|
|
42
|
-
if use_ollama or model_override.startswith("ollama:"):
|
|
72
|
+
if use_ollama or _looks_like_ollama_model(model_override):
|
|
43
73
|
model = model_override.split(":", 1)[-1] if model_override.startswith("ollama:") else model_override
|
|
44
74
|
return _infer_ollama(prompt, model)
|
|
45
75
|
|