npm - claude-memory-agent - Versions diffs - 2.1.0 → 2.2.0 - Mend

claude-memory-agent 2.1.0 → 2.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (91) hide show

package/bin/cli.js +11 -1
package/bin/lib/banner.js +39 -0
package/bin/lib/environment.js +166 -0
package/bin/lib/installer.js +291 -0
package/bin/lib/models.js +95 -0
package/bin/lib/steps/advanced.js +101 -0
package/bin/lib/steps/confirm.js +87 -0
package/bin/lib/steps/model.js +57 -0
package/bin/lib/steps/provider.js +65 -0
package/bin/lib/steps/scope.js +59 -0
package/bin/lib/steps/server.js +74 -0
package/bin/lib/ui.js +75 -0
package/bin/onboarding.js +164 -0
package/bin/postinstall.js +22 -257
package/config.py +103 -4
package/dashboard.html +697 -27
package/hooks/extract_memories.py +439 -0
package/hooks/pre_compact_hook.py +76 -0
package/hooks/session_end_hook.py +149 -0
package/hooks/stop_hook.py +372 -0
package/install.py +85 -32
package/main.py +1636 -892
package/mcp_server.py +451 -0
package/package.json +14 -3
package/requirements.txt +12 -8
package/services/adaptive_ranker.py +272 -0
package/services/agent_catalog.json +153 -0
package/services/agent_registry.py +245 -730
package/services/claude_md_sync.py +320 -4
package/services/consolidation.py +417 -0
package/services/database.py +586 -105
package/services/embedding_pipeline.py +262 -0
package/services/embeddings.py +493 -85
package/services/memory_decay.py +408 -0
package/services/native_memory_paths.py +86 -0
package/services/native_memory_sync.py +496 -0
package/services/response_manager.py +183 -0
package/services/terminal_ui.py +199 -0
package/services/tier_manager.py +235 -0
package/services/websocket.py +26 -6
package/skills/search.py +136 -61
package/skills/session_review.py +210 -23
package/skills/store.py +125 -18
package/terminal_dashboard.py +474 -0
package/hooks/__pycache__/auto-detect-response.cpython-312.pyc +0 -0
package/hooks/__pycache__/auto_capture.cpython-312.pyc +0 -0
package/hooks/__pycache__/grounding-hook.cpython-312.pyc +0 -0
package/hooks/__pycache__/session_end.cpython-312.pyc +0 -0
package/hooks/__pycache__/session_start.cpython-312.pyc +0 -0
package/services/__pycache__/__init__.cpython-312.pyc +0 -0
package/services/__pycache__/agent_registry.cpython-312.pyc +0 -0
package/services/__pycache__/auth.cpython-312.pyc +0 -0
package/services/__pycache__/auto_inject.cpython-312.pyc +0 -0
package/services/__pycache__/claude_md_sync.cpython-312.pyc +0 -0
package/services/__pycache__/cleanup.cpython-312.pyc +0 -0
package/services/__pycache__/compaction_flush.cpython-312.pyc +0 -0
package/services/__pycache__/confidence.cpython-312.pyc +0 -0
package/services/__pycache__/curator.cpython-312.pyc +0 -0
package/services/__pycache__/daily_log.cpython-312.pyc +0 -0
package/services/__pycache__/database.cpython-312.pyc +0 -0
package/services/__pycache__/embeddings.cpython-312.pyc +0 -0
package/services/__pycache__/insights.cpython-312.pyc +0 -0
package/services/__pycache__/llm_analyzer.cpython-312.pyc +0 -0
package/services/__pycache__/memory_md_sync.cpython-312.pyc +0 -0
package/services/__pycache__/retry_queue.cpython-312.pyc +0 -0
package/services/__pycache__/timeline.cpython-312.pyc +0 -0
package/services/__pycache__/vector_index.cpython-312.pyc +0 -0
package/services/__pycache__/websocket.cpython-312.pyc +0 -0
package/skills/__pycache__/__init__.cpython-312.pyc +0 -0
package/skills/__pycache__/admin.cpython-312.pyc +0 -0
package/skills/__pycache__/checkpoint.cpython-312.pyc +0 -0
package/skills/__pycache__/claude_md.cpython-312.pyc +0 -0
package/skills/__pycache__/cleanup.cpython-312.pyc +0 -0
package/skills/__pycache__/confidence_tracker.cpython-312.pyc +0 -0
package/skills/__pycache__/context.cpython-312.pyc +0 -0
package/skills/__pycache__/curator.cpython-312.pyc +0 -0
package/skills/__pycache__/grounding.cpython-312.pyc +0 -0
package/skills/__pycache__/insights.cpython-312.pyc +0 -0
package/skills/__pycache__/natural_language.cpython-312.pyc +0 -0
package/skills/__pycache__/retrieve.cpython-312.pyc +0 -0
package/skills/__pycache__/search.cpython-312.pyc +0 -0
package/skills/__pycache__/session_review.cpython-312.pyc +0 -0
package/skills/__pycache__/state.cpython-312.pyc +0 -0
package/skills/__pycache__/store.cpython-312.pyc +0 -0
package/skills/__pycache__/summarize.cpython-312.pyc +0 -0
package/skills/__pycache__/timeline.cpython-312.pyc +0 -0
package/skills/__pycache__/verification.cpython-312.pyc +0 -0
package/test_automation.py +0 -221
package/test_complete.py +0 -338
package/test_full.py +0 -322
package/verify_db.py +0 -134

package/hooks/extract_memories.py ADDED Viewed

@@ -0,0 +1,439 @@
+#!/usr/bin/env python3
+"""
+Extract memories from conversation transcripts.
+This script reads a Claude Code conversation transcript, extracts key
+decisions, errors, patterns, and facts using keyword/pattern matching,
+and stores them via the memory agent's HTTP API.
+It tracks what has already been extracted using a cursor file so that
+repeated calls (e.g., multiple PreCompact events) do not duplicate
+extracted memories.
+Design constraints:
+  - Must complete in under 5 seconds
+  - Uses simple keyword matching, NOT an LLM call
+  - Fails silently (exit 0) to never block compaction or session end
+  - Idempotent: cursor tracking prevents duplicate extraction
+"""
+import os
+import sys
+import json
+import re
+import time
+import hashlib
+from datetime import datetime
+from pathlib import Path
+from typing import Dict, Any, List, Optional, Tuple
+# ---------------------------------------------------------------------------
+# Configuration
+# ---------------------------------------------------------------------------
+# Base URL of the memory agent HTTP API; overridable via MEMORY_AGENT_URL.
+MEMORY_AGENT_URL = os.getenv("MEMORY_AGENT_URL", "http://localhost:8102")
+# Optional API key (MEMORY_API_KEY); sent as the X-Memory-Key header when non-empty.
+API_KEY = os.getenv("MEMORY_API_KEY", "")
+# Cursor state for all sessions lives in one JSON file under ~/.claude,
+# keyed by session id.
+CURSOR_DIR = Path.home() / ".claude"
+CURSOR_FILE = CURSOR_DIR / "memory-agent-cursor.json"
+MAX_EXTRACTION_TIME_SECONDS = 4.0  # Leave 1s headroom under the 5s budget
+MAX_MEMORIES_PER_RUN = 10  # Cap to stay fast
+MAX_CONTENT_LENGTH = 500  # Truncate long content for storage
+# ---------------------------------------------------------------------------
+# Extraction patterns
+# ---------------------------------------------------------------------------
+# Each list holds pre-compiled regexes that extract_from_text() runs over the
+# whole transcript chunk with finditer(). Only the span of a match is used (to
+# pull the surrounding lines as context); the capture group itself is not read.
+DECISION_PATTERNS = [
+    # Explicit decision language
+    re.compile(r"(?:^|\n)\s*(?:I |We |Let's |Going to )?(?:decided|decide) (?:to |that )(.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+    re.compile(r"(?:^|\n)\s*(?:Let's use|Going with|Chose|Choosing|Will use|Using|Went with) (.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+    re.compile(r"(?:^|\n)\s*(?:The approach|The plan|The strategy|The solution) (?:is|will be) (.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+    re.compile(r"(?:^|\n)\s*(?:I'll implement|We'll implement|Implementing) (.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+]
+ERROR_PATTERNS = [
+    # Error/bug language
+    re.compile(r"(?:^|\n)\s*(?:Error|ERROR|Bug|BUG|ISSUE|Issue|PROBLEM|Problem|CRITICAL|FATAL)[:\s]+(.*?)(?:\n|$)", re.IGNORECASE | re.MULTILINE),
+    re.compile(r"(?:^|\n)\s*(?:Fixed|Fixing|Fix for|Resolved|Resolution)[:\s]+(.*?)(?:\n|$)", re.IGNORECASE | re.MULTILINE),
+    # Unlike its siblings this one is compiled with DOTALL only: it is
+    # case-sensitive and its body may span lines up to the next blank line
+    # or the end of the text.
+    re.compile(r"(?:Traceback|Exception|raise \w+Error)(.*?)(?:\n\n|\Z)", re.DOTALL),
+    re.compile(r"(?:^|\n)\s*(?:Root cause|The bug was|The issue was|The problem was)[:\s]+(.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+]
+PATTERN_PATTERNS = [
+    # Architecture/pattern language
+    re.compile(r"(?:^|\n)\s*(?:The pattern|A pattern|Pattern)[:\s]+(.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+    re.compile(r"(?:^|\n)\s*(?:The approach|Best practice|Convention|Architecture)[:\s]+(.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+    re.compile(r"(?:^|\n)\s*(?:Always|Never|Should always|Should never|Must always|Must never) (.*?)(?:\.|$)", re.IGNORECASE | re.MULTILINE),
+]
+# Broader keyword triggers (used for line-level scanning)
+# These are tested as plain substrings of the lower-cased, stripped line, so a
+# short keyword such as "fix" also fires on words that merely contain it
+# (e.g. "prefix"). The sets are checked in the order decision, error, pattern
+# and the first set that matches decides the memory type for that line.
+DECISION_KEYWORDS = {"decided", "let's use", "going with", "chose", "choosing", "will use", "the plan is", "approach is", "strategy is", "i'll implement", "we'll implement"}
+ERROR_KEYWORDS = {"error", "bug", "fix", "issue", "traceback", "exception", "failed", "failure", "broken", "crash", "root cause"}
+PATTERN_KEYWORDS = {"pattern", "approach", "architecture", "convention", "best practice", "always", "never", "rule"}
+# ---------------------------------------------------------------------------
+# Cursor management - tracks what we already extracted
+# ---------------------------------------------------------------------------
+def load_cursor(session_id: str) -> Dict[str, Any]:
+    """Load the extraction cursor for a session.
+    Args:
+        session_id: Key of the session inside the cursor file.
+    Returns:
+        The cursor dict stored for ``session_id``. A fresh cursor
+        (``byte_offset`` 0, no hashes) is returned when the file is missing,
+        unreadable, not valid UTF-8/JSON, or does not hold a dict for this
+        session. This function never raises for a bad cursor file.
+    """
+    fresh: Dict[str, Any] = {"byte_offset": 0, "extracted_hashes": []}
+    try:
+        # ValueError covers both json.JSONDecodeError and UnicodeDecodeError;
+        # a missing file surfaces as FileNotFoundError (an OSError).
+        data = json.loads(CURSOR_FILE.read_text(encoding="utf-8"))
+    except (ValueError, OSError):
+        return fresh
+    # The file may hold valid JSON of the wrong shape (e.g. ``null`` or a list
+    # after a manual edit); treat that like a missing cursor instead of
+    # letting an AttributeError abort the whole hook.
+    if not isinstance(data, dict):
+        return fresh
+    entry = data.get(session_id)
+    return entry if isinstance(entry, dict) else fresh
+def save_cursor(session_id: str, cursor: Dict[str, Any]):
+    """Save the extraction cursor for a session.
+    The cursor file keeps at most 20 sessions. When it grows beyond that, the
+    entries with the oldest ``last_run`` timestamp are dropped; the session
+    being saved is never pruned. All failures are swallowed so that a broken
+    cursor file can never block the calling hook.
+    Args:
+        session_id: Key under which the cursor is stored.
+        cursor: JSON-serialisable cursor state for that session.
+    """
+    try:
+        CURSOR_DIR.mkdir(parents=True, exist_ok=True)
+        try:
+            data = json.loads(CURSOR_FILE.read_text(encoding="utf-8"))
+        except (ValueError, OSError):
+            data = {}
+        # Valid JSON of the wrong shape is discarded rather than crashing on
+        # item assignment below.
+        if not isinstance(data, dict):
+            data = {}
+        data[session_id] = cursor
+        # Prune old sessions (keep last 20)
+        if len(data) > 20:
+            def recency(key: str) -> str:
+                # ISO-8601 timestamps sort chronologically as strings;
+                # entries without one are treated as the oldest.
+                entry = data[key]
+                stamp = entry.get("last_run", "") if isinstance(entry, dict) else ""
+                return stamp if isinstance(stamp, str) else ""
+            # Sorting by session id (an arbitrary string) could evict the
+            # cursor that was just written, so rank the *other* sessions by
+            # recency and drop only the surplus.
+            others = sorted((k for k in data if k != session_id), key=recency)
+            for stale_key in others[:len(data) - 20]:
+                del data[stale_key]
+        # Write to a sibling temp file and rename it over the target so a
+        # concurrent reader never sees a half-written JSON document.
+        tmp_file = CURSOR_FILE.with_name(CURSOR_FILE.name + ".tmp")
+        tmp_file.write_text(json.dumps(data, indent=2), encoding="utf-8")
+        tmp_file.replace(CURSOR_FILE)
+    except (OSError, TypeError, ValueError):
+        pass  # Fail silently
+def cleanup_cursor(session_id: str):
+    """Remove cursor data for a completed session.
+    Does nothing when the cursor file is missing, unreadable, not a JSON
+    object, or has no entry for ``session_id``. Never raises for a bad file.
+    Args:
+        session_id: Key of the session whose cursor should be dropped.
+    """
+    try:
+        data = json.loads(CURSOR_FILE.read_text(encoding="utf-8"))
+        # ``session_id in data`` would raise TypeError for a ``null`` file,
+        # so check the shape before touching it.
+        if isinstance(data, dict) and session_id in data:
+            del data[session_id]
+            CURSOR_FILE.write_text(json.dumps(data, indent=2), encoding="utf-8")
+    except (ValueError, OSError):
+        pass
+def content_hash(text: str) -> str:
+    """Return a 12-hex-character fingerprint used to deduplicate extractions.
+    The text is stripped and lower-cased before hashing, so inputs that differ
+    only in case or surrounding whitespace share a fingerprint.
+    """
+    normalized = text.strip().lower()
+    digest = hashlib.md5(normalized.encode("utf-8")).hexdigest()
+    return digest[:12]
+# ---------------------------------------------------------------------------
+# Transcript reading
+# ---------------------------------------------------------------------------
+def read_transcript(transcript_path: str, byte_offset: int = 0) -> Tuple[str, int]:
+    """
+    Read the transcript file from the given byte offset.
+    The file is read in binary mode so the offset is a true byte position
+    that can be stored, compared with the file size and passed back in on
+    the next call. (In text mode ``tell()`` returns an opaque cookie, not a
+    byte count.) Bytes are decoded as UTF-8 with undecodable sequences
+    replaced, and line endings are normalised to ``\\n`` as text mode did.
+    Args:
+        transcript_path: Path to the transcript file.
+        byte_offset: Position to start reading from; negative values are
+            treated as 0.
+    Returns:
+        (new_text, new_byte_offset). When the file is missing, unreadable or
+        has nothing past the offset, returns ("", byte_offset) unchanged.
+    """
+    start = max(byte_offset, 0)
+    try:
+        with open(Path(transcript_path), "rb") as f:
+            f.seek(start)
+            raw = f.read()
+    except OSError:
+        return "", byte_offset
+    if not raw:
+        # Offset is at or beyond the end of the file: nothing new to read.
+        return "", byte_offset
+    text = raw.decode("utf-8", errors="replace")
+    text = text.replace("\r\n", "\n").replace("\r", "\n")
+    return text, start + len(raw)
+# ---------------------------------------------------------------------------
+# Extraction logic
+# ---------------------------------------------------------------------------
+def extract_context_around(text: str, match_start: int, match_end: int, context_chars: int = 200) -> str:
+    """Get surrounding context for a match to make the extraction more useful.
+    The window is the match widened by ``context_chars`` on each side and then
+    extended outwards to the nearest line boundaries.
+    Args:
+        text: Full text the match was found in.
+        match_start: Start index of the match in ``text``.
+        match_end: End index (exclusive) of the match in ``text``.
+        context_chars: Characters of context to include on each side before
+            aligning to line boundaries.
+    Returns:
+        The whitespace-stripped slice of ``text`` covering the window.
+    """
+    start = max(0, match_start - context_chars)
+    end = min(len(text), match_end + context_chars)
+    # Try to align to line boundaries. rfind/find give the same result as
+    # walking character by character, but do not index past the end of the
+    # text when the window starts exactly at len(text).
+    line_start = text.rfind('\n', 0, start + 1)
+    start = line_start if line_start != -1 else 0
+    line_end = text.find('\n', end)
+    end = line_end if line_end != -1 else len(text)
+    return text[start:end].strip()
+def extract_from_text(text: str, existing_hashes: set) -> List[Dict[str, Any]]:
+    """
+    Extract memories from transcript text using keyword/pattern matching.
+    Two passes run in order until MAX_MEMORIES_PER_RUN extractions exist:
+      1. Regex pass: decision, error, then pattern regexes over the whole
+         text; each match is expanded to its surrounding lines.
+      2. Keyword pass: every line of at least 20 characters is checked for
+         decision, error, then pattern keywords (first category wins); the
+         line plus the next two form the extraction.
+    Candidates of 30 characters or fewer are ignored, as are candidates
+    whose content hash is in ``existing_hashes`` or was already produced in
+    this call.
+    Args:
+        text: Transcript text to scan.
+        existing_hashes: Content hashes that were extracted earlier.
+    Returns:
+        A list of dicts with keys ``content``, ``type``, ``importance``,
+        ``tags`` and ``hash``.
+    """
+    extractions: List[Dict[str, Any]] = []
+    seen_hashes = set(existing_hashes)
+    # (patterns, memory type, importance, tag) in scan order.
+    regex_passes = (
+        (DECISION_PATTERNS, "decision", 6, "decision"),
+        (ERROR_PATTERNS, "error", 7, "error"),
+        (PATTERN_PATTERNS, "code", 6, "pattern"),
+    )
+    # (keywords, memory type, importance, tag) in priority order.
+    keyword_passes = (
+        (DECISION_KEYWORDS, "decision", 5, "decision"),
+        (ERROR_KEYWORDS, "error", 6, "error"),
+        (PATTERN_KEYWORDS, "code", 5, "pattern"),
+    )
+    def candidates():
+        """Lazily yield (content, memory_type, importance, tags) candidates."""
+        # --- Regex-based extraction ---
+        for patterns, memory_type, importance, tag in regex_passes:
+            for pattern in patterns:
+                for match in pattern.finditer(text):
+                    context = extract_context_around(text, match.start(), match.end())
+                    if len(context) > 30:  # Skip very short matches
+                        yield context, memory_type, importance, [tag]
+        # --- Line-level keyword scanning (fallback for cases regex misses) ---
+        lines = text.split('\n')
+        for index, line in enumerate(lines):
+            line_lower = line.lower().strip()
+            # Skip very short or empty lines
+            if len(line_lower) < 20:
+                continue
+            for keywords, memory_type, importance, tag in keyword_passes:
+                if any(kw in line_lower for kw in keywords):
+                    # Grab this line plus next 2 for context
+                    block = '\n'.join(lines[index:index + 3]).strip()
+                    if len(block) > 30:
+                        yield block, memory_type, importance, [tag, "keyword-match"]
+                    # First matching category wins, even if the block was
+                    # too short to keep.
+                    break
+    for content, memory_type, importance, tags in candidates():
+        if len(extractions) >= MAX_MEMORIES_PER_RUN:
+            break
+        # Hash the full content so truncation never affects deduplication.
+        h = content_hash(content)
+        if h in seen_hashes:
+            continue
+        seen_hashes.add(h)
+        # Truncate content
+        if len(content) > MAX_CONTENT_LENGTH:
+            content = content[:MAX_CONTENT_LENGTH] + "..."
+        extractions.append({
+            "content": content,
+            "type": memory_type,
+            "importance": importance,
+            "tags": tags + ["auto-extracted", "hook"],
+            "hash": h,
+        })
+        # The generator is lazy, so stopping here also stops any further
+        # regex or line scanning once the cap is reached.
+        if len(extractions) >= MAX_MEMORIES_PER_RUN:
+            break
+    return extractions
+# ---------------------------------------------------------------------------
+# API calls to memory agent
+# ---------------------------------------------------------------------------
+def store_memory_sync(extraction: Dict[str, Any], project_path: Optional[str] = None, timeout: float = 2.0) -> bool:
+    """
+    Store a single extracted memory via the memory agent API.
+    Uses urllib to avoid requiring httpx/requests for the hook scripts.
+    Args:
+        extraction: Dict with ``content``, ``type``, ``importance``, ``tags``
+            and ``hash`` keys, as produced by extract_from_text().
+        project_path: Optional project path sent along with the memory.
+        timeout: Socket timeout in seconds for the HTTP request.
+    Returns:
+        True when the agent answered with HTTP 200, False on any network,
+        protocol or URL error. Never raises for a failed request.
+    """
+    import http.client
+    import urllib.request
+    payload = {
+        "jsonrpc": "2.0",
+        "method": "tasks/send",
+        "params": {
+            "message": {"parts": [{"type": "text", "text": ""}]},
+            "metadata": {
+                "skill_id": "store_memory",
+                "params": {
+                    "content": extraction["content"],
+                    "type": extraction["type"],
+                    "importance": extraction["importance"],
+                    "tags": extraction["tags"],
+                    "project_path": project_path,
+                    "agent_type": "hook-extractor",
+                    "outcome_status": "pending",
+                    "confidence": 0.4,  # Lower confidence for auto-extracted
+                }
+            }
+        },
+        "id": f"extract-{extraction['hash']}-{int(time.time())}"
+    }
+    headers = {"Content-Type": "application/json"}
+    if API_KEY:
+        headers["X-Memory-Key"] = API_KEY
+    try:
+        data = json.dumps(payload).encode("utf-8")
+        req = urllib.request.Request(
+            f"{MEMORY_AGENT_URL}/a2a",
+            data=data,
+            headers=headers,
+            method="POST"
+        )
+        with urllib.request.urlopen(req, timeout=timeout) as resp:
+            return resp.status == 200
+    except (OSError, http.client.HTTPException, ValueError):
+        # OSError already covers URLError, HTTPError and TimeoutError.
+        # HTTPException (e.g. a malformed status line) and ValueError (e.g. a
+        # MEMORY_AGENT_URL without a scheme) are not OSErrors and would
+        # otherwise escape this best-effort call.
+        return False
+# ---------------------------------------------------------------------------
+# Main entry point
+# ---------------------------------------------------------------------------
+def run_extraction(session_id: str, transcript_path: str, project_path: Optional[str] = None, is_session_end: bool = False) -> Dict[str, Any]:
+    """
+    Extract memories from the unread part of a transcript and store them.
+    Reads the transcript from the byte offset recorded in the session's
+    cursor, extracts candidate memories, sends them to the memory agent one
+    by one while the time budget lasts, then records the new offset and the
+    hashes of the stored memories.
+    Args:
+        session_id: The session identifier
+        transcript_path: Path to the conversation transcript file
+        project_path: Optional project path for memory context
+        is_session_end: If True, remove the session's cursor instead of
+            saving it
+    Returns:
+        Summary dict with keys ``extracted``, ``stored``,
+        ``skipped_duplicate`` (reported but never incremented here),
+        ``errors`` and ``elapsed_seconds`` (rounded to 2 decimals).
+    """
+    start_time = time.time()
+    results = {
+        "extracted": 0,
+        "stored": 0,
+        "skipped_duplicate": 0,
+        "errors": 0,
+        "elapsed_seconds": 0,
+    }
+    # Load cursor state. The hash list is kept in insertion order so that
+    # trimming it below really drops the oldest entries.
+    cursor = load_cursor(session_id)
+    byte_offset = cursor.get("byte_offset", 0)
+    known_hashes = list(cursor.get("extracted_hashes") or [])
+    existing_hashes = set(known_hashes)
+    # Read new transcript content
+    new_text, new_offset = read_transcript(transcript_path, byte_offset)
+    if not new_text:
+        results["elapsed_seconds"] = round(time.time() - start_time, 2)
+        if is_session_end:
+            cleanup_cursor(session_id)
+        return results
+    # Extract memories from text
+    extractions = extract_from_text(new_text, existing_hashes)
+    results["extracted"] = len(extractions)
+    # Store each extraction via API (with time budget).
+    # NOTE: the budget is only checked before each call; a call started just
+    # under the limit can still run for the length of its own timeout.
+    stored_hashes = []
+    for extraction in extractions:
+        if time.time() - start_time >= MAX_EXTRACTION_TIME_SECONDS:
+            break
+        if store_memory_sync(extraction, project_path):
+            results["stored"] += 1
+            stored_hashes.append(extraction["hash"])
+        else:
+            results["errors"] += 1
+    if is_session_end:
+        # The cursor is discarded at session end, so writing the updated
+        # state first would only be undone by the cleanup.
+        cleanup_cursor(session_id)
+    else:
+        # Keep only the last 200 hashes to prevent unbounded growth.
+        # dict.fromkeys de-duplicates while preserving order; slicing a set
+        # would drop arbitrary hashes instead of the oldest ones.
+        all_hashes = list(dict.fromkeys(known_hashes + stored_hashes))[-200:]
+        save_cursor(session_id, {
+            "byte_offset": new_offset,
+            "extracted_hashes": all_hashes,
+            "last_run": datetime.now().isoformat(),
+        })
+    results["elapsed_seconds"] = round(time.time() - start_time, 2)
+    return results
+def main():
+    """Entry point: parse the hook JSON on stdin and run one extraction pass.
+    Always exits with status 0; failures are only reported on stderr.
+    """
+    try:
+        raw = "" if sys.stdin.isatty() else sys.stdin.read()
+        hook_data = json.loads(raw) if raw.strip() else {}
+        session_id = hook_data.get("session_id", f"unknown-{int(time.time())}")
+        transcript_path = hook_data.get("transcript_path", "")
+        project_path = hook_data.get("cwd") or hook_data.get("project_path", "")
+        hook_event = hook_data.get("hook_event_name", "")
+        # Without a transcript path there is nothing to extract; fall through
+        # to the final exit.
+        if transcript_path:
+            results = run_extraction(
+                session_id=session_id,
+                transcript_path=transcript_path,
+                project_path=project_path,
+                is_session_end=(hook_event == "SessionEnd"),
+            )
+            # Output summary to stderr (stdout is reserved for hook output)
+            summary = (
+                f"[MemoryExtractor] session={session_id} event={hook_event} "
+                f"extracted={results['extracted']} stored={results['stored']} "
+                f"errors={results['errors']} elapsed={results['elapsed_seconds']}s"
+            )
+            print(summary, file=sys.stderr)
+    except Exception as e:
+        # Fail silently - never block the user's workflow
+        print(f"[MemoryExtractor] Error: {e}", file=sys.stderr)
+    sys.exit(0)
+if __name__ == "__main__":
+    main()

package/hooks/pre_compact_hook.py ADDED Viewed

@@ -0,0 +1,76 @@
+#!/usr/bin/env python3
+"""
+PreCompact hook for Claude Code.
+Called before context compaction. Extracts memories from the conversation
+transcript so important information is preserved even if compaction
+discards conversation turns.
+This script:
+  1. Reads hook JSON from stdin (session_id, transcript_path, etc.)
+  2. Delegates to extract_memories.py for the actual extraction
+  3. Exits 0 on success OR failure (never blocks compaction)
+Timing budget: < 5 seconds total.
+"""
+import sys
+import json
+import os
+import time
+# Ensure the hooks directory is on the path
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+def main():
+    """Run memory extraction before context compaction.
+    Reads the hook JSON from stdin, delegates to
+    extract_memories.run_extraction() and reports the outcome on stderr.
+    Always exits with status 0 so compaction is never blocked.
+    """
+    start = time.time()
+    try:
+        # Read hook data from stdin
+        hook_data = {}
+        if not sys.stdin.isatty():
+            raw = sys.stdin.read()
+            if raw.strip():
+                hook_data = json.loads(raw)
+        # Ensure hook_event_name is set
+        hook_data.setdefault("hook_event_name", "PreCompact")
+        # A missing session id must not become "": every such run would then
+        # share one cursor entry and inherit another transcript's byte
+        # offset. Use the same fallback as extract_memories.main().
+        session_id = hook_data.get("session_id") or f"unknown-{int(time.time())}"
+        transcript_path = hook_data.get("transcript_path", "")
+        if not transcript_path:
+            # No transcript available, nothing to extract
+            print("[PreCompact] No transcript_path provided, skipping extraction.", file=sys.stderr)
+            sys.exit(0)
+        # Import and run extraction
+        from extract_memories import run_extraction
+        results = run_extraction(
+            session_id=session_id,
+            transcript_path=transcript_path,
+            project_path=hook_data.get("cwd") or hook_data.get("project_path", ""),
+            is_session_end=False,
+        )
+        elapsed = round(time.time() - start, 2)
+        print(
+            f"[PreCompact] Extraction complete: "
+            f"extracted={results['extracted']} stored={results['stored']} "
+            f"errors={results['errors']} total_time={elapsed}s",
+            file=sys.stderr,
+        )
+    except Exception as e:
+        elapsed = round(time.time() - start, 2)
+        print(f"[PreCompact] Error (non-fatal): {e} [{elapsed}s]", file=sys.stderr)
+    # Always exit 0 - never block compaction
+    sys.exit(0)
+if __name__ == "__main__":
+    main()

package/hooks/session_end_hook.py ADDED Viewed

@@ -0,0 +1,149 @@
+#!/usr/bin/env python3
+"""
+SessionEnd hook for Claude Code.
+Called when a Claude Code session ends. Performs final memory extraction
+from the conversation transcript and cleans up the cursor file for
+this session.
+This script:
+  1. Reads hook JSON from stdin (session_id, transcript_path, etc.)
+  2. Runs final extraction via extract_memories.py (with is_session_end=True)
+  3. Optionally invokes the existing session_end.py for full session wrapup
+  4. Cleans up cursor state for this session
+  5. Exits 0 on success OR failure (never blocks session teardown)
+Timing budget: < 5 seconds total.
+"""
+import sys
+import json
+import os
+import time
+# Ensure the hooks directory is on the path
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+def main():
+    """Run the final memory extraction and session wrapup at session end.
+    Reads the hook JSON from stdin, runs extraction with
+    ``is_session_end=True`` when a transcript path is present (otherwise only
+    drops the session's cursor), then triggers the flush call if a session id
+    is known and more than one second of the 5 second budget remains.
+    Always exits with status 0 so session teardown is never blocked.
+    """
+    start = time.time()
+    try:
+        # Read hook data from stdin
+        hook_data = {}
+        if not sys.stdin.isatty():
+            raw = sys.stdin.read()
+            if raw.strip():
+                hook_data = json.loads(raw)
+        # Ensure hook_event_name is set
+        hook_data.setdefault("hook_event_name", "SessionEnd")
+        session_id = hook_data.get("session_id", "")
+        transcript_path = hook_data.get("transcript_path", "")
+        project_path = hook_data.get("cwd") or hook_data.get("project_path", "")
+        # ---------------------------------------------------------------
+        # Step 1: Extract memories from transcript (final pass)
+        # ---------------------------------------------------------------
+        if transcript_path:
+            from extract_memories import run_extraction
+            # Never key the cursor on "": runs without a session id would
+            # share one entry and inherit another transcript's byte offset.
+            # Same fallback as extract_memories.main().
+            extraction_session_id = session_id or f"unknown-{int(time.time())}"
+            results = run_extraction(
+                session_id=extraction_session_id,
+                transcript_path=transcript_path,
+                project_path=project_path,
+                is_session_end=True,  # This will clean up the cursor after extraction
+            )
+            elapsed_extract = round(time.time() - start, 2)
+            print(
+                f"[SessionEnd] Extraction complete: "
+                f"extracted={results['extracted']} stored={results['stored']} "
+                f"errors={results['errors']} time={elapsed_extract}s",
+                file=sys.stderr,
+            )
+        else:
+            print("[SessionEnd] No transcript_path provided, skipping extraction.", file=sys.stderr)
+            # Still clean up cursor if session_id is present
+            if session_id:
+                try:
+                    from extract_memories import cleanup_cursor
+                    cleanup_cursor(session_id)
+                except ImportError:
+                    pass
+        # ---------------------------------------------------------------
+        # Step 2: Trigger the session wrapup flush via the memory agent API
+        # Only if we have time left in our budget
+        # ---------------------------------------------------------------
+        remaining = 5.0 - (time.time() - start)
+        if remaining > 1.0 and session_id:
+            try:
+                _trigger_session_wrapup(session_id, project_path, timeout=remaining - 0.5)
+            except Exception as e:
+                print(f"[SessionEnd] Session wrapup failed (non-fatal): {e}", file=sys.stderr)
+        elapsed_total = round(time.time() - start, 2)
+        print(f"[SessionEnd] Complete. Total time: {elapsed_total}s", file=sys.stderr)
+    except Exception as e:
+        elapsed = round(time.time() - start, 2)
+        print(f"[SessionEnd] Error (non-fatal): {e} [{elapsed}s]", file=sys.stderr)
+    # Always exit 0 - never block session end
+    sys.exit(0)
+def _trigger_session_wrapup(session_id: str, project_path: str, timeout: float = 3.0):
+    """
+    Ask the memory agent to run its ``pre_compaction_flush`` skill.
+    Sends one JSON-RPC ``tasks/send`` request to ``<MEMORY_AGENT_URL>/a2a``
+    carrying the session id and project path. The request timeout is capped
+    at 3 seconds. Network errors are reported on stderr, not raised.
+    Args:
+        session_id: Session the flush is requested for.
+        project_path: Project path forwarded to the skill.
+        timeout: Upper bound in seconds for the HTTP call.
+    """
+    import urllib.request
+    import urllib.error
+    base_url = os.getenv("MEMORY_AGENT_URL", "http://localhost:8102")
+    key = os.getenv("MEMORY_API_KEY", "")
+    skill_request = {
+        "skill_id": "pre_compaction_flush",
+        "params": {
+            "project_path": project_path,
+            "session_id": session_id,
+        }
+    }
+    payload = {
+        "jsonrpc": "2.0",
+        "method": "tasks/send",
+        "params": {
+            "message": {"parts": [{"type": "text", "text": ""}]},
+            "metadata": skill_request,
+        },
+        "id": f"session-end-flush-{session_id}"
+    }
+    headers = {"Content-Type": "application/json"}
+    if key:
+        headers["X-Memory-Key"] = key
+    try:
+        body = json.dumps(payload).encode("utf-8")
+        request = urllib.request.Request(
+            f"{base_url}/a2a",
+            data=body,
+            headers=headers,
+            method="POST"
+        )
+        capped_timeout = min(timeout, 3.0)
+        with urllib.request.urlopen(request, timeout=capped_timeout) as resp:
+            if resp.status == 200:
+                print("[SessionEnd] Flush triggered successfully.", file=sys.stderr)
+    except OSError as e:
+        # URLError, HTTPError and TimeoutError are all OSError subclasses.
+        print(f"[SessionEnd] Flush API call failed: {e}", file=sys.stderr)
+if __name__ == "__main__":
+    main()