npm - @simbimbo/memory-ocmemog - Versions diffs - 0.1.11 → 0.1.12 - Mend

@simbimbo/memory-ocmemog 0.1.11 → 0.1.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (102) hide show

package/CHANGELOG.md +16 -0
package/README.md +83 -18
package/brain/runtime/__init__.py +2 -12
package/brain/runtime/config.py +1 -24
package/brain/runtime/inference.py +1 -151
package/brain/runtime/instrumentation.py +1 -15
package/brain/runtime/memory/__init__.py +3 -13
package/brain/runtime/memory/api.py +1 -1219
package/brain/runtime/memory/candidate.py +1 -185
package/brain/runtime/memory/conversation_state.py +1 -1823
package/brain/runtime/memory/distill.py +1 -344
package/brain/runtime/memory/embedding_engine.py +1 -92
package/brain/runtime/memory/freshness.py +1 -112
package/brain/runtime/memory/health.py +1 -40
package/brain/runtime/memory/integrity.py +1 -186
package/brain/runtime/memory/memory_consolidation.py +1 -58
package/brain/runtime/memory/memory_links.py +1 -107
package/brain/runtime/memory/memory_salience.py +1 -233
package/brain/runtime/memory/memory_synthesis.py +1 -31
package/brain/runtime/memory/memory_taxonomy.py +1 -33
package/brain/runtime/memory/pondering_engine.py +1 -654
package/brain/runtime/memory/promote.py +1 -277
package/brain/runtime/memory/provenance.py +1 -406
package/brain/runtime/memory/reinforcement.py +1 -71
package/brain/runtime/memory/retrieval.py +1 -210
package/brain/runtime/memory/semantic_search.py +1 -64
package/brain/runtime/memory/store.py +1 -429
package/brain/runtime/memory/unresolved_state.py +1 -91
package/brain/runtime/memory/vector_index.py +1 -323
package/brain/runtime/model_roles.py +1 -9
package/brain/runtime/model_router.py +1 -22
package/brain/runtime/providers.py +1 -66
package/brain/runtime/security/redaction.py +1 -12
package/brain/runtime/state_store.py +1 -23
package/brain/runtime/storage_paths.py +1 -39
package/docs/architecture/memory.md +20 -24
package/docs/release-checklist.md +19 -6
package/docs/usage.md +33 -17
package/index.ts +8 -1
package/ocmemog/__init__.py +11 -0
package/ocmemog/doctor.py +1255 -0
package/ocmemog/runtime/__init__.py +18 -0
package/ocmemog/runtime/_compat_bridge.py +28 -0
package/ocmemog/runtime/config.py +35 -0
package/ocmemog/runtime/identity.py +115 -0
package/ocmemog/runtime/inference.py +164 -0
package/ocmemog/runtime/instrumentation.py +20 -0
package/ocmemog/runtime/memory/__init__.py +91 -0
package/ocmemog/runtime/memory/api.py +1431 -0
package/ocmemog/runtime/memory/candidate.py +192 -0
package/ocmemog/runtime/memory/conversation_state.py +1831 -0
package/ocmemog/runtime/memory/distill.py +282 -0
package/ocmemog/runtime/memory/embedding_engine.py +151 -0
package/ocmemog/runtime/memory/freshness.py +114 -0
package/ocmemog/runtime/memory/health.py +57 -0
package/ocmemog/runtime/memory/integrity.py +208 -0
package/ocmemog/runtime/memory/memory_consolidation.py +60 -0
package/ocmemog/runtime/memory/memory_links.py +109 -0
package/ocmemog/runtime/memory/memory_salience.py +235 -0
package/ocmemog/runtime/memory/memory_synthesis.py +33 -0
package/ocmemog/runtime/memory/memory_taxonomy.py +35 -0
package/ocmemog/runtime/memory/pondering_engine.py +681 -0
package/ocmemog/runtime/memory/promote.py +279 -0
package/ocmemog/runtime/memory/provenance.py +408 -0
package/ocmemog/runtime/memory/reinforcement.py +73 -0
package/ocmemog/runtime/memory/retrieval.py +224 -0
package/ocmemog/runtime/memory/semantic_search.py +66 -0
package/ocmemog/runtime/memory/store.py +433 -0
package/ocmemog/runtime/memory/unresolved_state.py +93 -0
package/ocmemog/runtime/memory/vector_index.py +411 -0
package/ocmemog/runtime/model_roles.py +16 -0
package/ocmemog/runtime/model_router.py +29 -0
package/ocmemog/runtime/providers.py +79 -0
package/ocmemog/runtime/roles.py +92 -0
package/ocmemog/runtime/security/__init__.py +8 -0
package/ocmemog/runtime/security/redaction.py +17 -0
package/ocmemog/runtime/state_store.py +34 -0
package/ocmemog/runtime/storage_paths.py +70 -0
package/ocmemog/sidecar/app.py +310 -23
package/ocmemog/sidecar/compat.py +50 -13
package/ocmemog/sidecar/transcript_watcher.py +318 -240
package/openclaw.plugin.json +4 -0
package/package.json +1 -1
package/scripts/ocmemog-backfill-vectors.py +5 -3
package/scripts/ocmemog-continuity-benchmark.py +1 -1
package/scripts/ocmemog-demo.py +1 -1
package/scripts/ocmemog-doctor.py +15 -0
package/scripts/ocmemog-install.sh +29 -7
package/scripts/ocmemog-integrated-proof.py +373 -0
package/scripts/ocmemog-reindex-vectors.py +5 -3
package/scripts/ocmemog-release-check.sh +330 -0
package/scripts/ocmemog-sidecar.sh +4 -2
package/scripts/ocmemog-test-rig.py +5 -3
package/brain/runtime/memory/artifacts.py +0 -33
package/brain/runtime/memory/context_builder.py +0 -112
package/brain/runtime/memory/interaction_memory.py +0 -57
package/brain/runtime/memory/memory_gate.py +0 -38
package/brain/runtime/memory/memory_graph.py +0 -54
package/brain/runtime/memory/person_identity.py +0 -83
package/brain/runtime/memory/person_memory.py +0 -138
package/brain/runtime/memory/sentiment_memory.py +0 -67
package/brain/runtime/memory/tool_catalog.py +0 -68

package/ocmemog/sidecar/transcript_watcher.py CHANGED Viewed

@@ -1,14 +1,16 @@
 from __future__ import annotations
 import json
+import sys
 import os
 import time
 from collections import deque
+import threading
 from pathlib import Path
 from typing import Optional
 from urllib import request as urlrequest
-from brain.runtime import state_store
+from ocmemog.runtime import state_store
 DEFAULT_ENDPOINT = "http://127.0.0.1:17891/memory/ingest_async"
 DEFAULT_GLOB = "*.log"
@@ -34,6 +36,65 @@ DEFAULT_REINFORCE_NEGATIVE = [
     "frustrated",
 ]
 WATCHER_ERROR_LOG = state_store.reports_dir() / "ocmemog_transcript_watcher_errors.jsonl"
+_SHUTDOWN_TRACE = os.environ.get("OCMEMOG_SHUTDOWN_TIMING", "true").lower() in {"1", "true", "yes", "on"}
+_WATCHER_REQUEST_TIMEOUT_SECONDS = 10.0
+_WATCHER_SHUTDOWN_REQUEST_TIMEOUT_SECONDS = 1.0
+_WATCHER_STOP_EVENT: threading.Event | None = None
+try:
+    _WATCHER_REQUEST_TIMEOUT_SECONDS = float(os.environ.get("OCMEMOG_INGEST_REQUEST_TIMEOUT_SECONDS", "10"))
+except Exception:
+    pass
+try:
+    _WATCHER_SHUTDOWN_REQUEST_TIMEOUT_SECONDS = float(
+        os.environ.get("OCMEMOG_SHUTDOWN_INGEST_REQUEST_TIMEOUT_SECONDS", "1")
+    )
+except Exception:
+    pass
+def _watcher_timeout(stop_event: threading.Event | None) -> float:
+    timeout = _WATCHER_REQUEST_TIMEOUT_SECONDS
+    if stop_event is not None and stop_event.is_set():
+        timeout = min(timeout, _WATCHER_SHUTDOWN_REQUEST_TIMEOUT_SECONDS)
+    return max(0.05, timeout)
+def _post_json_payload(endpoint: str, payload: dict, *, stop_event: threading.Event | None, kind: str) -> bool:
+    data = json.dumps(payload).encode("utf-8")
+    req = urlrequest.Request(endpoint, data=data, method="POST")
+    req.add_header("Content-Type", "application/json")
+    _apply_auth_headers(req)
+    timeout = _watcher_timeout(stop_event)
+    start = time.perf_counter()
+    status = "ok"
+    try:
+        with urlrequest.urlopen(req, timeout=timeout) as resp:
+            resp.read()
+        return True
+    except Exception as exc:
+        status = f"error={type(exc).__name__}"
+        _log_watcher_error(kind, endpoint, payload, exc)
+        if _SHUTDOWN_TRACE:
+            print(
+                f"[ocmemog][watcher-request] {kind} failed timeout={timeout:.3f}s elapsed={time.perf_counter()-start:.3f}s",
+                file=sys.stderr,
+            )
+        return False
+    finally:
+        if _SHUTDOWN_TRACE:
+            elapsed = time.perf_counter() - start
+            if stop_event is None or not stop_event.is_set():
+                if elapsed >= timeout * 0.95:
+                    print(
+                        f"[ocmemog][watcher-request] {kind} timeout={timeout:.3f}s elapsed={elapsed:.3f}s status={status}",
+                        file=sys.stderr,
+                    )
+            else:
+                print(
+                    f"[ocmemog][watcher-request] {kind} timeout={timeout:.3f}s elapsed={elapsed:.3f}s status={status}",
+                    file=sys.stderr,
+                )
 def _log_watcher_error(kind: str, endpoint: str, payload: dict, exc: Exception) -> None:
@@ -67,36 +128,16 @@ def _apply_auth_headers(req: urlrequest.Request) -> None:
         req.add_header("x-ocmemog-token", token)
-def _post_ingest(endpoint: str, payload: dict) -> bool:
-    data = json.dumps(payload).encode("utf-8")
-    req = urlrequest.Request(endpoint, data=data, method="POST")
-    req.add_header("Content-Type", "application/json")
-    _apply_auth_headers(req)
-    try:
-        with urlrequest.urlopen(req, timeout=10) as resp:
-            resp.read()
-        return True
-    except Exception as exc:
-        _log_watcher_error("ingest", endpoint, payload, exc)
-        return False
+def _post_ingest(endpoint: str, payload: dict, *, stop_event: threading.Event | None = None) -> bool:
+    return _post_json_payload(endpoint, payload, stop_event=stop_event, kind="ingest")
-def _post_json(endpoint: str, payload: dict) -> bool:
-    data = json.dumps(payload).encode("utf-8")
-    req = urlrequest.Request(endpoint, data=data, method="POST")
-    req.add_header("Content-Type", "application/json")
-    _apply_auth_headers(req)
-    try:
-        with urlrequest.urlopen(req, timeout=10) as resp:
-            resp.read()
-        return True
-    except Exception as exc:
-        _log_watcher_error("json", endpoint, payload, exc)
-        return False
+def _post_json(endpoint: str, payload: dict, *, stop_event: threading.Event | None = None) -> bool:
+    return _post_json_payload(endpoint, payload, stop_event=stop_event, kind="json")
-def _post_turn(endpoint: str, payload: dict) -> bool:
-    return _post_json(endpoint, payload)
+def _post_turn(endpoint: str, payload: dict, *, stop_event: threading.Event | None = None) -> bool:
+    return _post_json(endpoint, payload, stop_event=stop_event)
 def _extract_user_text(text: str) -> str:
@@ -183,7 +224,8 @@ def _append_transcript(transcript_target: Path, timestamp: str, role: str, text:
     return path, line_no
-def watch_forever() -> None:
+def watch_forever(stop_event: Optional[threading.Event] = None) -> None:
+    global _WATCHER_STOP_EVENT
     transcript_path = os.environ.get("OCMEMOG_TRANSCRIPT_PATH", "").strip()
     transcript_dir = os.environ.get("OCMEMOG_TRANSCRIPT_DIR", "").strip()
     glob_pattern = os.environ.get("OCMEMOG_TRANSCRIPT_GLOB", DEFAULT_GLOB)
@@ -240,6 +282,13 @@ def watch_forever() -> None:
     pending_session_turns: dict[tuple[str, int], dict[str, object]] = {}
     last_transcript_flush = time.time()
     last_session_flush = time.time()
+    stopper: threading.Event
+    if isinstance(stop_event, threading.Event):
+        stopper = stop_event
+    else:
+        stopper = threading.Event()
+        stopper.clear()
+    _WATCHER_STOP_EVENT = stopper
     def _flush_buffer(
         buffer: list[str],
@@ -249,9 +298,12 @@ def watch_forever() -> None:
         timestamp: Optional[str],
         start_line: Optional[int],
         end_line: Optional[int],
+        stop_event: threading.Event,
     ) -> bool:
         if not buffer:
             return True
+        if stop_event.is_set():
+            return False
         payload = {
             "content": "\n".join(buffer),
             "kind": kind,
@@ -266,7 +318,7 @@ def watch_forever() -> None:
             payload["transcript_end_offset"] = end_line
         if timestamp:
             payload["timestamp"] = timestamp.replace("T", " ")[:19]
-        ok = _post_ingest(endpoint, payload)
+        ok = _post_ingest(endpoint, payload, stop_event=stop_event)
         if ok:
             buffer.clear()
         return ok
@@ -286,7 +338,7 @@ def watch_forever() -> None:
                 "source_module": "sentiment",
                 "note": text,
             }
-            _post_json(reinforce_endpoint, payload)
+            _post_json(reinforce_endpoint, payload, stop_event=stopper)
         elif any(term in lowered for term in negative_terms):
             payload = {
                 "task_id": f"feedback:{timestamp}",
@@ -298,224 +350,236 @@ def watch_forever() -> None:
                 "source_module": "sentiment",
                 "note": text,
             }
-            _post_json(reinforce_endpoint, payload)
-    while True:
-        # 1) Watch transcript logs (if any)
-        latest = _pick_latest(transcript_target, glob_pattern)
-        if latest is not None:
-            if current_file is None or latest != current_file:
-                current_file = latest
-                position = 0
-                current_line_number = 0
-                if start_at_end:
-                    try:
-                        position = current_file.stat().st_size
-                    except Exception:
-                        position = 0
-                    try:
-                        current_line_number = _count_lines(current_file)
-                    except Exception:
-                        current_line_number = 0
-            try:
-                with current_file.open("r", encoding="utf-8", errors="ignore") as handle:
-                    handle.seek(position)
-                    committed_position = position
-                    committed_line_number = current_line_number
-                    while True:
-                        line_start = handle.tell()
-                        line = handle.readline()
-                        if not line:
-                            position = committed_position
-                            current_line_number = committed_line_number
-                            break
-                        text = line.rstrip("\n")
-                        next_line_number = committed_line_number + 1
-                        if not text.strip():
-                            committed_position = handle.tell()
-                            committed_line_number = next_line_number
-                            position = committed_position
-                            current_line_number = committed_line_number
-                            continue
-                        current_marker = (str(current_file), next_line_number)
-                        if current_marker in recent_session_transcript_lines:
+            _post_json(reinforce_endpoint, payload, stop_event=stopper)
+    try:
+        while not stopper.is_set():
+            # 1) Watch transcript logs (if any)
+            latest = _pick_latest(transcript_target, glob_pattern)
+            if latest is not None:
+                if current_file is None or latest != current_file:
+                    current_file = latest
+                    position = 0
+                    current_line_number = 0
+                    if start_at_end:
+                        try:
+                            position = current_file.stat().st_size
+                        except Exception:
+                            position = 0
+                        try:
+                            current_line_number = _count_lines(current_file)
+                        except Exception:
+                            current_line_number = 0
+                try:
+                    with current_file.open("r", encoding="utf-8", errors="ignore") as handle:
+                        handle.seek(position)
+                        committed_position = position
+                        committed_line_number = current_line_number
+                        while True:
+                            if stopper.is_set():
+                                break
+                            line_start = handle.tell()
+                            line = handle.readline()
+                            if not line:
+                                position = committed_position
+                                current_line_number = committed_line_number
+                                break
+                            text = line.rstrip("\n")
+                            next_line_number = committed_line_number + 1
+                            if not text.strip():
+                                committed_position = handle.tell()
+                                committed_line_number = next_line_number
+                                position = committed_position
+                                current_line_number = committed_line_number
+                                continue
+                            current_marker = (str(current_file), next_line_number)
+                            if current_marker in recent_session_transcript_lines:
+                                committed_position = handle.tell()
+                                committed_line_number = next_line_number
+                                position = committed_position
+                                current_line_number = committed_line_number
+                                continue
+                            transcript_buffer.append(text)
+                            transcript_last_path = current_file
+                            if transcript_start_line is None:
+                                transcript_start_line = next_line_number
+                            transcript_end_line = next_line_number
+                            timestamp_value = None
+                            if text and " " in text:
+                                timestamp_value = text.split(" ", 1)[0]
+                                transcript_last_timestamp = timestamp_value
+                            role, turn_text = _parse_transcript_line(text)
+                            if role and turn_text:
+                                if stopper.is_set():
+                                    break
+                                ok = _post_turn(
+                                    turn_endpoint,
+                                    {
+                                        "role": role,
+                                        "content": turn_text,
+                                        "source": source,
+                                        "transcript_path": str(current_file),
+                                        "transcript_offset": next_line_number,
+                                        "transcript_end_offset": next_line_number,
+                                        "timestamp": timestamp_value.replace("T", " ")[:19] if timestamp_value else None,
+                                    },
+                                    stop_event=stopper,
+                                )
+                                if not ok:
+                                    if transcript_buffer:
+                                        transcript_buffer.pop()
+                                    if transcript_start_line == next_line_number:
+                                        transcript_start_line = None
+                                    transcript_end_line = committed_line_number if transcript_start_line is not None else None
+                                    position = line_start
+                                    current_line_number = committed_line_number
+                                    break
+                            if len(transcript_buffer) >= batch_max:
+                                ok = _flush_buffer(
+                                    transcript_buffer,
+                                    source_label=source,
+                                    transcript_path=transcript_last_path,
+                                    timestamp=transcript_last_timestamp,
+                                    start_line=transcript_start_line,
+                                    end_line=transcript_end_line,
+                                    stop_event=stopper,
+                                )
+                                if not ok:
+                                    position = line_start
+                                    current_line_number = committed_line_number
+                                    break
+                                transcript_start_line = None
+                                transcript_end_line = None
+                                last_transcript_flush = time.time()
                             committed_position = handle.tell()
                             committed_line_number = next_line_number
                             position = committed_position
                             current_line_number = committed_line_number
-                            continue
-                        transcript_buffer.append(text)
-                        transcript_last_path = current_file
-                        if transcript_start_line is None:
-                            transcript_start_line = next_line_number
-                        transcript_end_line = next_line_number
-                        timestamp_value = None
-                        if text and " " in text:
-                            timestamp_value = text.split(" ", 1)[0]
-                            transcript_last_timestamp = timestamp_value
-                        role, turn_text = _parse_transcript_line(text)
-                        if role and turn_text:
-                            ok = _post_turn(
-                                turn_endpoint,
-                                {
+                except Exception:
+                    pass
+            # 2) Watch OpenClaw session jsonl (verbatim capture)
+            session_latest = _pick_latest(session_target, session_glob)
+            if session_latest is not None:
+                if session_file is None or session_latest != session_file:
+                    session_file = session_latest
+                    session_pos = 0
+                    if start_at_end:
+                        try:
+                            session_pos = session_file.stat().st_size
+                        except Exception:
+                            session_pos = 0
+                try:
+                    with session_file.open("r", encoding="utf-8", errors="ignore") as handle:
+                        handle.seek(session_pos)
+                        committed_session_pos = session_pos
+                        while True:
+                            if stopper.is_set():
+                                break
+                            line_start = handle.tell()
+                            line = handle.readline()
+                            if not line:
+                                session_pos = committed_session_pos
+                                break
+                            try:
+                                entry = json.loads(line)
+                            except Exception:
+                                committed_session_pos = handle.tell()
+                                session_pos = committed_session_pos
+                                continue
+                            if entry.get("type") != "message":
+                                committed_session_pos = handle.tell()
+                                session_pos = committed_session_pos
+                                continue
+                            msg = entry.get("message") or {}
+                            role = msg.get("role")
+                            if role not in {"user", "assistant"}:
+                                committed_session_pos = handle.tell()
+                                session_pos = committed_session_pos
+                                continue
+                            content = msg.get("content")
+                            text = _extract_message_text(content).strip()
+                            conversation_info = _extract_conversation_info(text)
+                            if role == "user":
+                                text = _extract_user_text(text)
+                            text = text.replace("\n", " ").strip()
+                            if not text:
+                                committed_session_pos = handle.tell()
+                                session_pos = committed_session_pos
+                                continue
+                            timestamp = entry.get("timestamp") or time.strftime("%Y-%m-%dT%H:%M:%S")
+                            if role == "user":
+                                _maybe_reinforce(text, timestamp)
+                            session_id = session_file.stem if session_file is not None else None
+                            message_id = entry.get("id") or conversation_info.get("message_id")
+                            conversation_id = conversation_info.get("conversation_id") or session_id
+                            thread_id = conversation_info.get("thread_id") or session_id
+                            transcript_line = f"{timestamp} [{role}] {text}"
+                            retry_key = (str(session_file), line_start)
+                            pending = pending_session_turns.get(retry_key)
+                            if pending is None:
+                                transcript_path, transcript_line_no = _append_transcript(transcript_target, timestamp, role, text)
+                                turn_payload = {
                                     "role": role,
-                                    "content": turn_text,
-                                    "source": source,
-                                    "transcript_path": str(current_file),
-                                    "transcript_offset": next_line_number,
-                                    "transcript_end_offset": next_line_number,
-                                    "timestamp": timestamp_value.replace("T", " ")[:19] if timestamp_value else None,
-                                },
-                            )
-                            if not ok:
-                                if transcript_buffer:
-                                    transcript_buffer.pop()
-                                if transcript_start_line == next_line_number:
-                                    transcript_start_line = None
-                                transcript_end_line = committed_line_number if transcript_start_line is not None else None
-                                position = line_start
-                                current_line_number = committed_line_number
+                                    "content": text,
+                                    "conversation_id": conversation_id,
+                                    "session_id": session_id,
+                                    "thread_id": thread_id,
+                                    "message_id": message_id,
+                                    "source": "session",
+                                    "timestamp": timestamp.replace("T", " ")[:19],
+                                    "transcript_path": str(transcript_path),
+                                    "transcript_offset": transcript_line_no,
+                                    "transcript_end_offset": transcript_line_no,
+                                    "metadata": {
+                                        "parent_message_id": entry.get("parentId"),
+                                    },
+                                }
+                                pending_session_turns[retry_key] = {
+                                    "payload": dict(turn_payload),
+                                    "transcript_line": transcript_line,
+                                    "transcript_path": transcript_path,
+                                    "transcript_line_no": transcript_line_no,
+                                }
+                            else:
+                                turn_payload = dict(pending["payload"])
+                                transcript_line = str(pending["transcript_line"])
+                                transcript_path = Path(str(pending["transcript_path"]))
+                                transcript_line_no = int(pending["transcript_line_no"])
+                            if stopper.is_set():
                                 break
-                        if len(transcript_buffer) >= batch_max:
-                            ok = _flush_buffer(
-                                transcript_buffer,
-                                source_label=source,
-                                transcript_path=transcript_last_path,
-                                timestamp=transcript_last_timestamp,
-                                start_line=transcript_start_line,
-                                end_line=transcript_end_line,
-                            )
-                            if not ok:
-                                position = line_start
-                                current_line_number = committed_line_number
+                            if not _post_turn(turn_endpoint, turn_payload, stop_event=stopper):
+                                session_pos = line_start
                                 break
-                            transcript_start_line = None
-                            transcript_end_line = None
-                            last_transcript_flush = time.time()
-                        committed_position = handle.tell()
-                        committed_line_number = next_line_number
-                        position = committed_position
-                        current_line_number = committed_line_number
-            except Exception:
-                pass
-        # 2) Watch OpenClaw session jsonl (verbatim capture)
-        session_latest = _pick_latest(session_target, session_glob)
-        if session_latest is not None:
-            if session_file is None or session_latest != session_file:
-                session_file = session_latest
-                session_pos = 0
-                if start_at_end:
-                    try:
-                        session_pos = session_file.stat().st_size
-                    except Exception:
-                        session_pos = 0
-            try:
-                with session_file.open("r", encoding="utf-8", errors="ignore") as handle:
-                    handle.seek(session_pos)
-                    committed_session_pos = session_pos
-                    while True:
-                        line_start = handle.tell()
-                        line = handle.readline()
-                        if not line:
-                            session_pos = committed_session_pos
-                            break
-                        try:
-                            entry = json.loads(line)
-                        except Exception:
-                            committed_session_pos = handle.tell()
-                            session_pos = committed_session_pos
-                            continue
-                        if entry.get("type") != "message":
-                            committed_session_pos = handle.tell()
-                            session_pos = committed_session_pos
-                            continue
-                        msg = entry.get("message") or {}
-                        role = msg.get("role")
-                        if role not in {"user", "assistant"}:
-                            committed_session_pos = handle.tell()
-                            session_pos = committed_session_pos
-                            continue
-                        content = msg.get("content")
-                        text = _extract_message_text(content).strip()
-                        conversation_info = _extract_conversation_info(text)
-                        if role == "user":
-                            text = _extract_user_text(text)
-                        text = text.replace("\n", " ").strip()
-                        if not text:
+                            pending_session_turns.pop(retry_key, None)
+                            recent_session_transcript_lines.append((str(transcript_path), transcript_line_no))
+                            session_buffer.append(transcript_line)
+                            session_last_path = transcript_path
+                            session_last_timestamp = timestamp
+                            if session_start_line is None:
+                                session_start_line = transcript_line_no
+                            session_end_line = transcript_line_no
+                            if len(session_buffer) >= batch_max:
+                                ok = _flush_buffer(
+                                    session_buffer,
+                                    source_label="session",
+                                    transcript_path=session_last_path,
+                                    timestamp=session_last_timestamp,
+                                    start_line=session_start_line,
+                                    end_line=session_end_line,
+                                    stop_event=stopper,
+                                )
+                                if not ok:
+                                    session_pos = line_start
+                                    break
+                                session_start_line = None
+                                session_end_line = None
+                                last_session_flush = time.time()
                             committed_session_pos = handle.tell()
                             session_pos = committed_session_pos
-                            continue
-                        timestamp = entry.get("timestamp") or time.strftime("%Y-%m-%dT%H:%M:%S")
-                        if role == "user":
-                            _maybe_reinforce(text, timestamp)
-                        session_id = session_file.stem if session_file is not None else None
-                        message_id = entry.get("id") or conversation_info.get("message_id")
-                        conversation_id = conversation_info.get("conversation_id") or session_id
-                        thread_id = conversation_info.get("thread_id") or session_id
-                        transcript_line = f"{timestamp} [{role}] {text}"
-                        retry_key = (str(session_file), line_start)
-                        pending = pending_session_turns.get(retry_key)
-                        if pending is None:
-                            transcript_path, transcript_line_no = _append_transcript(transcript_target, timestamp, role, text)
-                            turn_payload = {
-                                "role": role,
-                                "content": text,
-                                "conversation_id": conversation_id,
-                                "session_id": session_id,
-                                "thread_id": thread_id,
-                                "message_id": message_id,
-                                "source": "session",
-                                "timestamp": timestamp.replace("T", " ")[:19],
-                                "transcript_path": str(transcript_path),
-                                "transcript_offset": transcript_line_no,
-                                "transcript_end_offset": transcript_line_no,
-                                "metadata": {
-                                    "parent_message_id": entry.get("parentId"),
-                                },
-                            }
-                            pending_session_turns[retry_key] = {
-                                "payload": dict(turn_payload),
-                                "transcript_line": transcript_line,
-                                "transcript_path": transcript_path,
-                                "transcript_line_no": transcript_line_no,
-                            }
-                        else:
-                            turn_payload = dict(pending["payload"])
-                            transcript_line = str(pending["transcript_line"])
-                            transcript_path = Path(str(pending["transcript_path"]))
-                            transcript_line_no = int(pending["transcript_line_no"])
-                        if not _post_turn(turn_endpoint, turn_payload):
-                            session_pos = line_start
-                            break
-                        pending_session_turns.pop(retry_key, None)
-                        recent_session_transcript_lines.append((str(transcript_path), transcript_line_no))
-                        session_buffer.append(transcript_line)
-                        session_last_path = transcript_path
-                        session_last_timestamp = timestamp
-                        if session_start_line is None:
-                            session_start_line = transcript_line_no
-                        session_end_line = transcript_line_no
-                        if len(session_buffer) >= batch_max:
-                            ok = _flush_buffer(
-                                session_buffer,
-                                source_label="session",
-                                transcript_path=session_last_path,
-                                timestamp=session_last_timestamp,
-                                start_line=session_start_line,
-                                end_line=session_end_line,
-                            )
-                            if not ok:
-                                session_pos = line_start
-                                break
-                            session_start_line = None
-                            session_end_line = None
-                            last_session_flush = time.time()
-                        committed_session_pos = handle.tell()
-                        session_pos = committed_session_pos
-            except Exception:
-                pass
+                except Exception:
+                    pass
         now = time.time()
         if transcript_buffer and (now - last_transcript_flush) >= batch_seconds:
@@ -526,6 +590,7 @@ def watch_forever() -> None:
                 timestamp=transcript_last_timestamp,
                 start_line=transcript_start_line,
                 end_line=transcript_end_line,
+                stop_event=stopper,
             )
             if ok:
                 transcript_start_line = None
@@ -539,10 +604,23 @@ def watch_forever() -> None:
                 timestamp=session_last_timestamp,
                 start_line=session_start_line,
                 end_line=session_end_line,
+                stop_event=stopper,
             )
             if ok:
                 session_start_line = None
                 session_end_line = None
                 last_session_flush = now
-        time.sleep(poll_seconds)
+        poll_started = time.perf_counter()
+        if stopper.wait(poll_seconds):
+            if _SHUTDOWN_TRACE:
+                print(
+                    f"[ocmemog][watcher-poll] stop_wait timeout={poll_seconds:.3f}s elapsed={time.perf_counter()-poll_started:.3f}s",
+                    file=sys.stderr,
+                )
+            return
+    finally:
+        _WATCHER_STOP_EVENT = None
+        if _SHUTDOWN_TRACE:
+            print("[ocmemog][watcher] shutdown loop exiting", file=sys.stderr)
+        # no return value