npm - @simbimbo/memory-ocmemog - Versions diffs - 0.1.10 → 0.1.12 - Mend

@simbimbo/memory-ocmemog 0.1.10 → 0.1.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (102) hide show

package/CHANGELOG.md +30 -0
package/README.md +85 -18
package/brain/runtime/__init__.py +2 -12
package/brain/runtime/config.py +1 -24
package/brain/runtime/inference.py +1 -151
package/brain/runtime/instrumentation.py +1 -15
package/brain/runtime/memory/__init__.py +3 -13
package/brain/runtime/memory/api.py +1 -1219
package/brain/runtime/memory/candidate.py +1 -185
package/brain/runtime/memory/conversation_state.py +1 -1823
package/brain/runtime/memory/distill.py +1 -344
package/brain/runtime/memory/embedding_engine.py +1 -92
package/brain/runtime/memory/freshness.py +1 -112
package/brain/runtime/memory/health.py +1 -40
package/brain/runtime/memory/integrity.py +1 -186
package/brain/runtime/memory/memory_consolidation.py +1 -58
package/brain/runtime/memory/memory_links.py +1 -107
package/brain/runtime/memory/memory_salience.py +1 -233
package/brain/runtime/memory/memory_synthesis.py +1 -31
package/brain/runtime/memory/memory_taxonomy.py +1 -33
package/brain/runtime/memory/pondering_engine.py +1 -654
package/brain/runtime/memory/promote.py +1 -277
package/brain/runtime/memory/provenance.py +1 -406
package/brain/runtime/memory/reinforcement.py +1 -71
package/brain/runtime/memory/retrieval.py +1 -210
package/brain/runtime/memory/semantic_search.py +1 -64
package/brain/runtime/memory/store.py +1 -429
package/brain/runtime/memory/unresolved_state.py +1 -91
package/brain/runtime/memory/vector_index.py +1 -323
package/brain/runtime/model_roles.py +1 -9
package/brain/runtime/model_router.py +1 -22
package/brain/runtime/providers.py +1 -66
package/brain/runtime/security/redaction.py +1 -12
package/brain/runtime/state_store.py +1 -23
package/brain/runtime/storage_paths.py +1 -39
package/docs/architecture/memory.md +20 -24
package/docs/release-checklist.md +19 -6
package/docs/usage.md +33 -17
package/index.ts +8 -1
package/ocmemog/__init__.py +11 -0
package/ocmemog/doctor.py +1255 -0
package/ocmemog/runtime/__init__.py +18 -0
package/ocmemog/runtime/_compat_bridge.py +28 -0
package/ocmemog/runtime/config.py +35 -0
package/ocmemog/runtime/identity.py +115 -0
package/ocmemog/runtime/inference.py +164 -0
package/ocmemog/runtime/instrumentation.py +20 -0
package/ocmemog/runtime/memory/__init__.py +91 -0
package/ocmemog/runtime/memory/api.py +1431 -0
package/ocmemog/runtime/memory/candidate.py +192 -0
package/ocmemog/runtime/memory/conversation_state.py +1831 -0
package/ocmemog/runtime/memory/distill.py +282 -0
package/ocmemog/runtime/memory/embedding_engine.py +151 -0
package/ocmemog/runtime/memory/freshness.py +114 -0
package/ocmemog/runtime/memory/health.py +57 -0
package/ocmemog/runtime/memory/integrity.py +208 -0
package/ocmemog/runtime/memory/memory_consolidation.py +60 -0
package/ocmemog/runtime/memory/memory_links.py +109 -0
package/ocmemog/runtime/memory/memory_salience.py +235 -0
package/ocmemog/runtime/memory/memory_synthesis.py +33 -0
package/ocmemog/runtime/memory/memory_taxonomy.py +35 -0
package/ocmemog/runtime/memory/pondering_engine.py +681 -0
package/ocmemog/runtime/memory/promote.py +279 -0
package/ocmemog/runtime/memory/provenance.py +408 -0
package/ocmemog/runtime/memory/reinforcement.py +73 -0
package/ocmemog/runtime/memory/retrieval.py +224 -0
package/ocmemog/runtime/memory/semantic_search.py +66 -0
package/ocmemog/runtime/memory/store.py +433 -0
package/ocmemog/runtime/memory/unresolved_state.py +93 -0
package/ocmemog/runtime/memory/vector_index.py +411 -0
package/ocmemog/runtime/model_roles.py +16 -0
package/ocmemog/runtime/model_router.py +29 -0
package/ocmemog/runtime/providers.py +79 -0
package/ocmemog/runtime/roles.py +92 -0
package/ocmemog/runtime/security/__init__.py +8 -0
package/ocmemog/runtime/security/redaction.py +17 -0
package/ocmemog/runtime/state_store.py +34 -0
package/ocmemog/runtime/storage_paths.py +70 -0
package/ocmemog/sidecar/app.py +311 -23
package/ocmemog/sidecar/compat.py +50 -13
package/ocmemog/sidecar/transcript_watcher.py +391 -190
package/openclaw.plugin.json +4 -0
package/package.json +1 -1
package/scripts/ocmemog-backfill-vectors.py +5 -3
package/scripts/ocmemog-continuity-benchmark.py +1 -1
package/scripts/ocmemog-demo.py +1 -1
package/scripts/ocmemog-doctor.py +15 -0
package/scripts/ocmemog-install.sh +29 -7
package/scripts/ocmemog-integrated-proof.py +373 -0
package/scripts/ocmemog-reindex-vectors.py +5 -3
package/scripts/ocmemog-release-check.sh +330 -0
package/scripts/ocmemog-sidecar.sh +4 -2
package/scripts/ocmemog-test-rig.py +5 -3
package/brain/runtime/memory/artifacts.py +0 -33
package/brain/runtime/memory/context_builder.py +0 -112
package/brain/runtime/memory/interaction_memory.py +0 -57
package/brain/runtime/memory/memory_gate.py +0 -38
package/brain/runtime/memory/memory_graph.py +0 -54
package/brain/runtime/memory/person_identity.py +0 -83
package/brain/runtime/memory/person_memory.py +0 -138
package/brain/runtime/memory/sentiment_memory.py +0 -67
package/brain/runtime/memory/tool_catalog.py +0 -68

package/ocmemog/runtime/memory/candidate.py ADDED Viewed

@@ -0,0 +1,192 @@
+from __future__ import annotations
+import json
+import re
+import uuid
+from difflib import SequenceMatcher
+from typing import Any, Dict
+from ocmemog.runtime.security import redaction
+from ocmemog.runtime.memory import provenance, store
+from ocmemog.runtime.instrumentation import emit_event
+from ocmemog.runtime import state_store
+# Log destination handed to emit_event() by this module; resolved once at import time.
+LOGFILE = state_store.report_log_path()
+# Minimum summary similarity (0.0-1.0) an existing candidate must reach before it is
+# even considered a near duplicate; a shared provenance anchor is required as well.
+_NEAR_DUPLICATE_SIMILARITY = 0.85
+def _normalize_summary(text: str) -> str:
+    """Return *text* stripped, lower-cased, and with whitespace runs collapsed.
+
+    Falsy input (for example ``None`` or ``""``) yields the empty string.
+    """
+    stripped = str(text or "").strip()
+    lowered = stripped.lower()
+    return re.sub(r"\s+", " ", lowered)
+def _tokenize(text: str) -> set[str]:
+    """Return the distinct ``[a-z0-9]+`` tokens found in the normalized form of *text*."""
+    normalized = _normalize_summary(text)
+    return set(re.findall(r"[a-z0-9]+", normalized))
+def _summary_similarity(left: str, right: str) -> float:
+    """Score how alike two summaries are, from 0.0 to 1.0.
+
+    The score is the larger of two measures taken on the normalized texts: the
+    token-set overlap (intersection size over union size) and the
+    ``SequenceMatcher`` character ratio. The token measure counts as 0.0 when
+    either side has no tokens.
+    """
+    tokens_a = _tokenize(left)
+    tokens_b = _tokenize(right)
+    char_ratio = SequenceMatcher(None, _normalize_summary(left), _normalize_summary(right)).ratio()
+    if not tokens_a or not tokens_b:
+        # No token evidence on one side: only the character ratio can contribute.
+        return max(0.0, char_ratio)
+    shared = tokens_a & tokens_b
+    combined = tokens_a | tokens_b
+    token_ratio = len(shared) / max(1, len(combined))
+    return max(token_ratio, char_ratio)
+def _ranges_overlap(left: Dict[str, Any], right: Dict[str, Any]) -> bool:
+    """Report whether two anchors on the same path cover intersecting line ranges.
+
+    Anchors whose ``path`` values differ never overlap. A missing, unparseable,
+    or zero ``end_line`` falls back to that anchor's ``start_line``. When neither
+    anchor has a usable ``start_line`` they are treated as overlapping; when only
+    one has it, they are not.
+    """
+    def _coerce(raw: Any) -> int | None:
+        # Best-effort integer conversion; anything unconvertible counts as absent.
+        if raw is None:
+            return None
+        try:
+            return int(raw)
+        except Exception:
+            return None
+    path_a = str(left.get("path") or "")
+    path_b = str(right.get("path") or "")
+    if path_a != path_b:
+        return False
+    start_a = _coerce(left.get("start_line"))
+    end_a = _coerce(left.get("end_line")) or start_a
+    start_b = _coerce(right.get("start_line"))
+    end_b = _coerce(right.get("end_line")) or start_b
+    if start_a is None or start_b is None:
+        # Both unknown -> same path is enough; exactly one unknown -> no overlap.
+        return start_a is None and start_b is None
+    latest_start = max(start_a, start_b)
+    earliest_end = min(end_a or start_a, end_b or start_b)
+    return latest_start <= earliest_end
+def _shares_provenance_anchor(left: Dict[str, Any], right: Dict[str, Any]) -> bool:
+    """Return True when two metadata payloads point at the same source material.
+
+    After ``provenance.normalize_metadata`` is applied to both sides, they share
+    an anchor if any of these hold: the same non-empty conversation
+    ``message_id``; transcript anchors with paths set whose ranges overlap; or
+    at least one common non-blank entry in ``source_references``.
+    """
+    def _dict_or_empty(value: Any) -> Dict[str, Any]:
+        # Anything that is not a dict is treated as "no data".
+        return value if isinstance(value, dict) else {}
+    meta_a = provenance.normalize_metadata(left)
+    meta_b = provenance.normalize_metadata(right)
+    prov_a = _dict_or_empty(meta_a.get("provenance"))
+    prov_b = _dict_or_empty(meta_b.get("provenance"))
+    conv_a = _dict_or_empty(prov_a.get("conversation"))
+    conv_b = _dict_or_empty(prov_b.get("conversation"))
+    message_id = conv_a.get("message_id")
+    if message_id and message_id == conv_b.get("message_id"):
+        return True
+    anchor_a = _dict_or_empty(prov_a.get("transcript_anchor"))
+    anchor_b = _dict_or_empty(prov_b.get("transcript_anchor"))
+    both_have_paths = bool(anchor_a.get("path")) and bool(anchor_b.get("path"))
+    if both_have_paths and _ranges_overlap(anchor_a, anchor_b):
+        return True
+    refs_a = {str(ref) for ref in prov_a.get("source_references") or [] if str(ref).strip()}
+    refs_b = {str(ref) for ref in prov_b.get("source_references") or [] if str(ref).strip()}
+    return not refs_a.isdisjoint(refs_b)
+def _find_near_duplicate_candidate(conn, source_event_id: int, summary: str, metadata: Dict[str, Any]) -> str | None:
+    """Return the id of a recent candidate that near-duplicates *summary*, if any.
+
+    Scans up to the 250 most recently created candidates that belong to a
+    different source event. A row matches when its summary similarity is at
+    least ``_NEAR_DUPLICATE_SIMILARITY`` and it shares a provenance anchor with
+    *metadata*.
+
+    Args:
+        conn: Open database connection exposing ``execute(...).fetchall()``.
+        source_event_id: Event id of the new candidate; rows from it are skipped.
+        summary: Summary text of the new candidate.
+        metadata: Metadata of the new candidate.
+
+    Returns:
+        The matching ``candidate_id`` as a string, or ``None`` when nothing matches.
+    """
+    def _column(row: Any, key: str, index: int) -> Any:
+        # Rows are read by key when they are dicts and by position otherwise.
+        return row[key] if isinstance(row, dict) else row[index]
+    rows = conn.execute(
+        """
+        SELECT candidate_id, distilled_summary, metadata_json
+        FROM candidates
+        WHERE source_event_id != ?
+        ORDER BY created_at DESC, candidate_id DESC
+        LIMIT 250
+        """,
+        (source_event_id,),
+    ).fetchall()
+    normalized_summary = _normalize_summary(summary)
+    for row in rows:
+        # Apply the empty fallback to both row shapes; previously a dict row with
+        # a NULL summary was turned into the literal string "None".
+        existing_summary = str(_column(row, "distilled_summary", 1) or "")
+        similarity = _summary_similarity(normalized_summary, existing_summary)
+        if similarity < _NEAR_DUPLICATE_SIMILARITY:
+            continue
+        try:
+            existing_metadata = json.loads(_column(row, "metadata_json", 2) or "{}")
+        except (TypeError, ValueError, RecursionError):
+            # Unreadable stored metadata is treated as "no provenance" (best effort).
+            existing_metadata = {}
+        if not isinstance(existing_metadata, dict):
+            # Valid JSON that is not an object carries no usable provenance either.
+            existing_metadata = {}
+        if _shares_provenance_anchor(metadata, existing_metadata):
+            return str(_column(row, "candidate_id", 0))
+    return None
+def create_candidate(
+    source_event_id: int,
+    distilled_summary: str,
+    verification_points: list[str],
+    confidence_score: float,
+    metadata: Dict[str, Any] | None = None,
+) -> Dict[str, Any]:
+    """Store a redacted memory candidate unless an equivalent one already exists.
+
+    The summary and every verification point are passed through
+    ``redaction.redact_text`` before anything is compared or written. An exact
+    duplicate (same source event and redacted summary) or a near duplicate (see
+    ``_find_near_duplicate_candidate``) short-circuits the insert.
+
+    Args:
+        source_event_id: Id of the event the candidate was distilled from.
+        distilled_summary: Candidate summary text (redacted before storage).
+        verification_points: Supporting points; ``None`` is treated as empty.
+        confidence_score: Score stored with the candidate as given.
+        metadata: Optional metadata, normalized with ``source="candidate"``.
+
+    Returns:
+        ``{"candidate_id": <id>, "duplicate": <bool>}``; for duplicates the id is
+        that of the existing candidate.
+    """
+    summary, redacted = redaction.redact_text(distilled_summary)
+    verification_lines = []
+    # Tolerate ``None`` so callers without verification evidence do not crash.
+    for point in verification_points or []:
+        clean, _ = redaction.redact_text(str(point))
+        verification_lines.append(clean)
+    normalized_metadata = provenance.normalize_metadata(metadata, source="candidate")
+    duplicate_id = None
+    duplicate_kind = None
+    candidate_id = None
+    conn = store.connect()
+    # try/finally guarantees the connection is released even when a query raises.
+    try:
+        exact_row = conn.execute(
+            "SELECT candidate_id FROM candidates WHERE source_event_id=? AND distilled_summary=?",
+            (source_event_id, summary),
+        ).fetchone()
+        if exact_row:
+            duplicate_id, duplicate_kind = exact_row[0], "exact"
+        else:
+            near_duplicate_id = _find_near_duplicate_candidate(conn, source_event_id, summary, normalized_metadata)
+            if near_duplicate_id:
+                duplicate_id, duplicate_kind = near_duplicate_id, "near"
+        if duplicate_kind is None:
+            candidate_id = str(uuid.uuid4())
+            # Presence of any verification point is what marks the row "verified";
+            # the points themselves are not checked here.
+            verification_status = "verified" if verification_lines else "unverified"
+            conn.execute(
+                """
+                INSERT INTO candidates (
+                    candidate_id, source_event_id, distilled_summary, verification_points,
+                    confidence_score, status, verification_status, metadata_json, schema_version
+                ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)
+                """,
+                (
+                    candidate_id,
+                    source_event_id,
+                    summary,
+                    "\n".join(verification_lines),
+                    confidence_score,
+                    "pending",
+                    verification_status,
+                    json.dumps(normalized_metadata, ensure_ascii=False),
+                    store.SCHEMA_VERSION,
+                ),
+            )
+            conn.execute(
+                "INSERT INTO memory_events (event_type, source, details_json, schema_version) VALUES (?, ?, ?, ?)",
+                (
+                    "candidate_created",
+                    str(source_event_id),
+                    json.dumps({"candidate_id": candidate_id, "redacted": redacted, "verification_status": verification_status}),
+                    store.SCHEMA_VERSION,
+                ),
+            )
+            # Both inserts are committed together.
+            conn.commit()
+    finally:
+        conn.close()
+    # Events are emitted only after the connection has been closed, as before.
+    if duplicate_kind == "exact":
+        emit_event(LOGFILE, "brain_memory_candidate_duplicate", status="ok", source_event_id=source_event_id)
+        return {"candidate_id": duplicate_id, "duplicate": True}
+    if duplicate_kind == "near":
+        emit_event(
+            LOGFILE,
+            "brain_memory_candidate_duplicate",
+            status="ok",
+            source_event_id=source_event_id,
+            duplicate_kind="near",
+        )
+        return {"candidate_id": duplicate_id, "duplicate": True}
+    emit_event(LOGFILE, "brain_memory_candidate_created", status="ok", source_event_id=source_event_id, redacted=redacted)
+    return {"candidate_id": candidate_id, "duplicate": False}
+def get_candidate(candidate_id: str) -> Dict[str, Any] | None:
+    """Fetch one candidate row by id.
+
+    Args:
+        candidate_id: Identifier of the candidate to look up.
+
+    Returns:
+        The row converted with ``dict(row)``, or ``None`` when no candidate has
+        that id. NOTE(review): ``dict(row)`` presumes ``store.connect()`` yields
+        mapping-style rows (e.g. ``sqlite3.Row``) - confirm against ``store``.
+    """
+    conn = store.connect()
+    # try/finally guarantees the connection is released even when the query raises.
+    try:
+        row = conn.execute(
+            """
+            SELECT candidate_id, source_event_id, distilled_summary, verification_points,
+                   confidence_score, status, verification_status, metadata_json
+            FROM candidates
+            WHERE candidate_id=?
+            """,
+            (candidate_id,),
+        ).fetchone()
+    finally:
+        conn.close()
+    return dict(row) if row else None