claude-memory-agent 2.1.0 → 2.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/cli.js +11 -1
- package/bin/lib/banner.js +39 -0
- package/bin/lib/environment.js +166 -0
- package/bin/lib/installer.js +291 -0
- package/bin/lib/models.js +95 -0
- package/bin/lib/steps/advanced.js +101 -0
- package/bin/lib/steps/confirm.js +87 -0
- package/bin/lib/steps/model.js +57 -0
- package/bin/lib/steps/provider.js +65 -0
- package/bin/lib/steps/scope.js +59 -0
- package/bin/lib/steps/server.js +74 -0
- package/bin/lib/ui.js +75 -0
- package/bin/onboarding.js +164 -0
- package/bin/postinstall.js +22 -257
- package/config.py +103 -4
- package/dashboard.html +697 -27
- package/hooks/extract_memories.py +439 -0
- package/hooks/pre_compact_hook.py +76 -0
- package/hooks/session_end_hook.py +149 -0
- package/hooks/stop_hook.py +372 -0
- package/install.py +91 -37
- package/main.py +1636 -892
- package/mcp_server.py +451 -0
- package/package.json +14 -3
- package/requirements.txt +12 -8
- package/services/adaptive_ranker.py +272 -0
- package/services/agent_catalog.json +153 -0
- package/services/agent_registry.py +245 -730
- package/services/claude_md_sync.py +320 -4
- package/services/consolidation.py +417 -0
- package/services/database.py +586 -105
- package/services/embedding_pipeline.py +262 -0
- package/services/embeddings.py +493 -85
- package/services/memory_decay.py +408 -0
- package/services/native_memory_paths.py +86 -0
- package/services/native_memory_sync.py +496 -0
- package/services/response_manager.py +183 -0
- package/services/terminal_ui.py +199 -0
- package/services/tier_manager.py +235 -0
- package/services/websocket.py +26 -6
- package/skills/search.py +136 -61
- package/skills/session_review.py +210 -23
- package/skills/store.py +125 -18
- package/terminal_dashboard.py +474 -0
- package/hooks/__pycache__/auto-detect-response.cpython-312.pyc +0 -0
- package/hooks/__pycache__/auto_capture.cpython-312.pyc +0 -0
- package/hooks/__pycache__/grounding-hook.cpython-312.pyc +0 -0
- package/hooks/__pycache__/session_end.cpython-312.pyc +0 -0
- package/hooks/__pycache__/session_start.cpython-312.pyc +0 -0
- package/services/__pycache__/__init__.cpython-312.pyc +0 -0
- package/services/__pycache__/agent_registry.cpython-312.pyc +0 -0
- package/services/__pycache__/auth.cpython-312.pyc +0 -0
- package/services/__pycache__/auto_inject.cpython-312.pyc +0 -0
- package/services/__pycache__/claude_md_sync.cpython-312.pyc +0 -0
- package/services/__pycache__/cleanup.cpython-312.pyc +0 -0
- package/services/__pycache__/compaction_flush.cpython-312.pyc +0 -0
- package/services/__pycache__/confidence.cpython-312.pyc +0 -0
- package/services/__pycache__/curator.cpython-312.pyc +0 -0
- package/services/__pycache__/daily_log.cpython-312.pyc +0 -0
- package/services/__pycache__/database.cpython-312.pyc +0 -0
- package/services/__pycache__/embeddings.cpython-312.pyc +0 -0
- package/services/__pycache__/insights.cpython-312.pyc +0 -0
- package/services/__pycache__/llm_analyzer.cpython-312.pyc +0 -0
- package/services/__pycache__/memory_md_sync.cpython-312.pyc +0 -0
- package/services/__pycache__/retry_queue.cpython-312.pyc +0 -0
- package/services/__pycache__/timeline.cpython-312.pyc +0 -0
- package/services/__pycache__/vector_index.cpython-312.pyc +0 -0
- package/services/__pycache__/websocket.cpython-312.pyc +0 -0
- package/skills/__pycache__/__init__.cpython-312.pyc +0 -0
- package/skills/__pycache__/admin.cpython-312.pyc +0 -0
- package/skills/__pycache__/checkpoint.cpython-312.pyc +0 -0
- package/skills/__pycache__/claude_md.cpython-312.pyc +0 -0
- package/skills/__pycache__/cleanup.cpython-312.pyc +0 -0
- package/skills/__pycache__/confidence_tracker.cpython-312.pyc +0 -0
- package/skills/__pycache__/context.cpython-312.pyc +0 -0
- package/skills/__pycache__/curator.cpython-312.pyc +0 -0
- package/skills/__pycache__/grounding.cpython-312.pyc +0 -0
- package/skills/__pycache__/insights.cpython-312.pyc +0 -0
- package/skills/__pycache__/natural_language.cpython-312.pyc +0 -0
- package/skills/__pycache__/retrieve.cpython-312.pyc +0 -0
- package/skills/__pycache__/search.cpython-312.pyc +0 -0
- package/skills/__pycache__/session_review.cpython-312.pyc +0 -0
- package/skills/__pycache__/state.cpython-312.pyc +0 -0
- package/skills/__pycache__/store.cpython-312.pyc +0 -0
- package/skills/__pycache__/summarize.cpython-312.pyc +0 -0
- package/skills/__pycache__/timeline.cpython-312.pyc +0 -0
- package/skills/__pycache__/verification.cpython-312.pyc +0 -0
- package/test_automation.py +0 -221
- package/test_complete.py +0 -338
- package/test_full.py +0 -322
- package/verify_db.py +0 -134
|
@@ -0,0 +1,496 @@
|
|
|
1
|
+
"""Bidirectional sync between MCP vector DB and Claude Code's native auto memory.
|
|
2
|
+
|
|
3
|
+
Direction A (MCP -> Native): Fast, no embeddings needed.
|
|
4
|
+
High-importance MCP memories -> fenced section in native MEMORY.md
|
|
5
|
+
|
|
6
|
+
Direction B (Native -> MCP): Needs embeddings, runs at session end.
|
|
7
|
+
Native MEMORY.md sections -> MCP DB as type='chunk', tagged source=native_memory_md
|
|
8
|
+
|
|
9
|
+
Dedup: markdown_syncs.content_hash prevents duplicates in both directions.
|
|
10
|
+
"""
|
|
11
|
+
import hashlib
|
|
12
|
+
import logging
|
|
13
|
+
import re
|
|
14
|
+
from datetime import datetime
|
|
15
|
+
from pathlib import Path
|
|
16
|
+
from typing import Dict, Any, List, Optional
|
|
17
|
+
|
|
18
|
+
from services.native_memory_paths import get_native_memory_md, list_native_memory_files
|
|
19
|
+
|
|
20
|
+
logger = logging.getLogger(__name__)
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
def _ensure_markdown_syncs_table(conn):
|
|
24
|
+
"""Create the markdown_syncs table if it doesn't exist yet.
|
|
25
|
+
|
|
26
|
+
Lightweight safeguard: the full initialize_schema() may fail on older DBs
|
|
27
|
+
due to unrelated column mismatches, so we create just the table we need.
|
|
28
|
+
"""
|
|
29
|
+
conn.execute("""
|
|
30
|
+
CREATE TABLE IF NOT EXISTS markdown_syncs (
|
|
31
|
+
id INTEGER PRIMARY KEY AUTOINCREMENT,
|
|
32
|
+
file_type TEXT NOT NULL,
|
|
33
|
+
file_path TEXT NOT NULL,
|
|
34
|
+
memory_id INTEGER,
|
|
35
|
+
project_path TEXT,
|
|
36
|
+
synced_at TEXT DEFAULT (datetime('now')),
|
|
37
|
+
content_hash TEXT,
|
|
38
|
+
FOREIGN KEY (memory_id) REFERENCES memories(id)
|
|
39
|
+
)
|
|
40
|
+
""")
|
|
41
|
+
conn.execute("CREATE INDEX IF NOT EXISTS idx_markdown_syncs_type ON markdown_syncs(file_type)")
|
|
42
|
+
conn.execute("CREATE INDEX IF NOT EXISTS idx_markdown_syncs_project ON markdown_syncs(project_path)")
|
|
43
|
+
conn.execute("CREATE INDEX IF NOT EXISTS idx_markdown_syncs_memory ON markdown_syncs(memory_id)")
|
|
44
|
+
conn.commit()
|
|
45
|
+
|
|
46
|
+
|
|
47
|
+
# Markers fencing the auto-managed section in native MEMORY.md. Everything
# between them is owned by this module and may be rewritten on every sync;
# user-authored content outside the fence is never touched.
MCP_SYNC_START = "<!-- MCP-SYNCED START -->"
MCP_SYNC_END = "<!-- MCP-SYNCED END -->"

# Line budget: native auto memory loads the first 200 lines of MEMORY.md,
# so cap our writes at 180 to leave 20 lines of headroom.
MAX_NATIVE_LINES = 180

# Tag attached to memories imported from native MEMORY.md (Direction B)
# so their origin is identifiable in the MCP DB.
NATIVE_SOURCE_TAG = "source=native_memory_md"
|
|
56
|
+
|
|
57
|
+
|
|
58
|
+
def _content_hash(text: str) -> str:
|
|
59
|
+
"""Generate a short hash for dedup tracking."""
|
|
60
|
+
return hashlib.md5(text.strip().encode("utf-8")).hexdigest()[:16]
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
# ── Direction A: MCP -> Native ────────────────────────────────────────────
|
|
64
|
+
|
|
65
|
+
|
|
66
|
+
async def sync_mcp_to_native(
    db,
    project_path: str,
    min_importance: int = 7,
) -> Dict[str, Any]:
    """Sync high-importance MCP memories into the native MEMORY.md fenced section.

    1. Query MCP DB for important memories for this project
    2. Skip already-synced (via markdown_syncs with file_type='mcp_to_native')
    3. Read native MEMORY.md, check line budget
    4. Replace content between MCP-SYNCED markers (non-destructive)
    5. Record synced entries in markdown_syncs

    Args:
        db: DatabaseService instance
        project_path: Absolute project path (e.g. C:\\xampp\\htdocs\\server)
        min_importance: Minimum importance threshold (default 7)

    Returns:
        Dict with sync results
    """
    from services.database import normalize_path
    norm_path = normalize_path(project_path)

    _ensure_markdown_syncs_table(db.conn)
    cursor = db.conn.cursor()

    # 1. Query high-importance decisions, preferences, and successful errors.
    # Rows with NULL project_path are treated as global and qualify everywhere.
    try:
        cursor.execute("""
            SELECT id, type, content, importance, success, created_at
            FROM memories
            WHERE importance >= ?
              AND (project_path = ? OR project_path IS NULL)
              AND (
                  type IN ('decision', 'preference')
                  OR (type = 'error' AND success = 1)
              )
            ORDER BY importance DESC, created_at DESC
            LIMIT 30
        """, (min_importance, norm_path))
        memories = [dict(row) for row in cursor.fetchall()]
    except Exception as e:
        logger.error(f"MCP->Native: failed to query memories: {e}")
        return {"success": False, "error": str(e)}

    if not memories:
        return {"success": True, "synced": 0, "reason": "no qualifying memories"}

    # 2. Check which are already synced (by memory id).
    already_synced_ids = set()
    try:
        cursor.execute("""
            SELECT memory_id FROM markdown_syncs
            WHERE file_type = 'mcp_to_native'
              AND project_path = ?
        """, (norm_path,))
        already_synced_ids = {row["memory_id"] for row in cursor.fetchall()}
    except Exception as e:
        logger.warning(f"MCP->Native: failed to check synced IDs: {e}")

    # Also get all synced content hashes for this direction (catches
    # identical content stored under a different memory id).
    already_synced_hashes = set()
    try:
        cursor.execute("""
            SELECT content_hash FROM markdown_syncs
            WHERE file_type = 'mcp_to_native'
              AND project_path = ?
        """, (norm_path,))
        already_synced_hashes = {row["content_hash"] for row in cursor.fetchall()}
    except Exception:
        pass

    # Filter to new memories only.
    new_memories = []
    for mem in memories:
        h = _content_hash(mem["content"])
        if mem["id"] not in already_synced_ids and h not in already_synced_hashes:
            new_memories.append(mem)

    if not new_memories:
        return {"success": True, "synced": 0, "reason": "all already synced"}

    # 3. Read native MEMORY.md (may not exist yet).
    native_md_path = get_native_memory_md(project_path)

    if native_md_path.exists():
        existing_content = native_md_path.read_text(encoding="utf-8")
    else:
        existing_content = ""

    # Count lines outside the MCP-synced section — those belong to the user.
    user_content = _strip_mcp_section(existing_content)
    user_line_count = len(user_content.splitlines())

    if user_line_count >= MAX_NATIVE_LINES:
        logger.warning(
            f"MCP->Native: MEMORY.md already at {user_line_count} lines "
            f"(budget {MAX_NATIVE_LINES}), skipping sync"
        )
        return {
            "success": True,
            "synced": 0,
            "reason": f"line budget exceeded ({user_line_count}/{MAX_NATIVE_LINES})",
        }

    # 4. Build the fenced section content.
    # Include previously synced memories too (rebuild the full section).
    all_for_section = memories  # all qualifying, not just new
    section_lines = _build_mcp_section(all_for_section)

    # Check combined line count against the budget.
    total_lines = user_line_count + len(section_lines)
    if total_lines > MAX_NATIVE_LINES:
        budget = MAX_NATIVE_LINES - user_line_count
        if budget < 5:
            return {
                "success": True,
                "synced": 0,
                "reason": "not enough line budget for MCP section",
            }
        # BUGFIX: a plain section_lines[:budget] could slice off the
        # MCP_SYNC_END marker, leaving an unterminated fence that later
        # _strip_mcp_section calls cannot remove. Trim the entries but
        # always keep the closing marker as the last line.
        section_lines = section_lines[:budget - 1] + [MCP_SYNC_END]

    # 5. Replace or append the fenced section.
    section_text = "\n".join(section_lines)
    updated_content = _replace_mcp_section(user_content, section_text)

    # Write back (create parent dirs on first sync).
    native_md_path.parent.mkdir(parents=True, exist_ok=True)
    native_md_path.write_text(updated_content, encoding="utf-8")

    # 6. Record in markdown_syncs so these memories are not re-counted.
    now = datetime.now().isoformat()
    synced_count = 0
    for mem in new_memories:
        h = _content_hash(mem["content"])
        try:
            cursor.execute("""
                INSERT INTO markdown_syncs (file_type, file_path, memory_id, project_path, synced_at, content_hash)
                VALUES ('mcp_to_native', ?, ?, ?, ?, ?)
            """, (str(native_md_path), mem["id"], norm_path, now, h))
            synced_count += 1
        except Exception as e:
            logger.warning(f"MCP->Native: failed to record sync for memory {mem['id']}: {e}")

    db.conn.commit()

    return {
        "success": True,
        "synced": synced_count,
        "total_in_section": len(all_for_section),
        "file": str(native_md_path),
        "user_lines": user_line_count,
        "total_lines": len(updated_content.splitlines()),
    }
|
|
222
|
+
|
|
223
|
+
|
|
224
|
+
def _build_mcp_section(memories: list) -> List[str]:
    """Render the fenced MCP-SYNCED block as a list of markdown lines."""
    rendered = [
        MCP_SYNC_START,
        "## Synced from MCP Memory DB",
        "",
    ]
    for item in memories:
        kind = item.get("type", "chunk")
        body = item.get("content", "").replace("\n", " ").strip()
        if len(body) > 200:
            # Keep each entry on a single short line; full text lives in the DB.
            body = body[:197] + "..."
        weight = item.get("importance", 5)
        rendered.append(f"- [{kind}] {body} (importance: {weight})")

    rendered.append("")
    rendered.append(MCP_SYNC_END)
    return rendered
|
|
243
|
+
|
|
244
|
+
|
|
245
|
+
def _strip_mcp_section(content: str) -> str:
    """Return *content* with the MCP-SYNCED fenced block removed."""
    fence = re.compile(
        re.escape(MCP_SYNC_START) + r".*?" + re.escape(MCP_SYNC_END),
        re.DOTALL,
    )
    remainder = fence.sub("", content)
    # Collapse runs of blank lines the removal may have left behind.
    remainder = re.sub(r"\n{3,}", "\n\n", remainder)
    if not remainder.strip():
        return ""
    return remainder.rstrip("\n") + "\n"
|
|
255
|
+
|
|
256
|
+
|
|
257
|
+
def _replace_mcp_section(user_content: str, section_text: str) -> str:
|
|
258
|
+
"""Append (or replace) the MCP section at the end of user content."""
|
|
259
|
+
# Ensure user content ends with a newline
|
|
260
|
+
if user_content and not user_content.endswith("\n"):
|
|
261
|
+
user_content += "\n"
|
|
262
|
+
|
|
263
|
+
return user_content + "\n" + section_text + "\n"
|
|
264
|
+
|
|
265
|
+
|
|
266
|
+
# ── Direction B: Native -> MCP ────────────────────────────────────────────
|
|
267
|
+
|
|
268
|
+
|
|
269
|
+
async def sync_native_to_mcp(
    db,
    embeddings,
    project_path: str,
) -> Dict[str, Any]:
    """Sync native MEMORY.md content into the MCP vector DB.

    1. Read native MEMORY.md + topic files
    2. Parse into entries (## sections or bullet groups)
    3. Skip the MCP-SYNCED section (avoid circular sync)
    4. Hash each entry, check markdown_syncs for file_type='native_to_mcp'
    5. For new/changed entries: generate embedding, store in MCP DB
    6. Record in markdown_syncs

    Note: entry dicts from _parse_markdown_entries are mutated in place here
    (a "hash" key is added). The returned "errors" list mixes two shapes:
    50-char content previews for embedding failures, and exception strings
    for storage failures.

    Args:
        db: DatabaseService instance
        embeddings: EmbeddingService instance
        project_path: Absolute project path

    Returns:
        Dict with sync results
    """
    from services.database import normalize_path
    norm_path = normalize_path(project_path)

    _ensure_markdown_syncs_table(db.conn)

    all_files = list_native_memory_files(project_path)
    if not all_files:
        return {"success": True, "synced": 0, "reason": "no native memory files"}

    # 1. Read and parse all files
    entries: List[Dict[str, Any]] = []
    for fpath in all_files:
        try:
            raw = fpath.read_text(encoding="utf-8")
        except Exception as e:
            # Best-effort: an unreadable file is skipped, not fatal.
            logger.warning(f"Native->MCP: failed to read {fpath}: {e}")
            continue

        # Strip the MCP-synced section to avoid circular import
        clean = _strip_mcp_section(raw)

        parsed = _parse_markdown_entries(clean, source_file=fpath.name)
        entries.extend(parsed)

    if not entries:
        return {"success": True, "synced": 0, "reason": "no parseable entries"}

    # 2. Check what's already synced (dedup is hash-based in this direction)
    cursor = db.conn.cursor()
    already_synced_hashes = set()
    try:
        cursor.execute("""
            SELECT content_hash FROM markdown_syncs
            WHERE file_type = 'native_to_mcp'
              AND project_path = ?
        """, (norm_path,))
        already_synced_hashes = {row["content_hash"] for row in cursor.fetchall()}
    except Exception as e:
        logger.warning(f"Native->MCP: failed to check synced hashes: {e}")

    # 3. Filter to new/changed entries
    new_entries = []
    for entry in entries:
        h = _content_hash(entry["content"])
        if h not in already_synced_hashes:
            entry["hash"] = h
            new_entries.append(entry)

    if not new_entries:
        return {"success": True, "synced": 0, "reason": "all already synced"}

    # 4. Generate embeddings and store
    now = datetime.now().isoformat()
    synced_count = 0
    errors: List[str] = []

    for entry in new_entries:
        try:
            # Generate embedding
            # NOTE(review): generate_embedding appears to return either a
            # result object exposing .ok/.error_message/.embedding or a raw
            # vector — the hasattr checks below handle both; confirm against
            # EmbeddingService.
            emb_result = await embeddings.generate_embedding(entry["content"])
            if hasattr(emb_result, "ok") and not emb_result.ok:
                logger.warning(f"Native->MCP: embedding failed for entry: {emb_result.error_message}")
                errors.append(entry["content"][:50])
                continue

            # Extract the embedding vector
            embedding = emb_result.embedding if hasattr(emb_result, "embedding") else emb_result

            # Build tags
            tags = [NATIVE_SOURCE_TAG]
            if entry.get("source_file"):
                tags.append(f"file={entry['source_file']}")
            if entry.get("section"):
                tags.append(f"section={entry['section']}")

            # Store in MCP DB
            import json
            # Conditional chain handles plain lists, numpy-style arrays
            # (via .tolist()), and any other iterable.
            embedding_json = json.dumps(
                embedding if isinstance(embedding, list) else embedding.tolist()
                if hasattr(embedding, "tolist") else list(embedding)
            )

            # Use only columns guaranteed to exist in the active DB schema
            cursor.execute("""
                INSERT INTO memories (type, content, embedding, project_path, importance, tags, created_at)
                VALUES ('chunk', ?, ?, ?, 6, ?, ?)
            """, (
                entry["content"],
                embedding_json,
                norm_path,
                json.dumps(tags),
                now,
            ))
            memory_id = cursor.lastrowid

            # Record in markdown_syncs
            cursor.execute("""
                INSERT INTO markdown_syncs (file_type, file_path, memory_id, project_path, synced_at, content_hash)
                VALUES ('native_to_mcp', ?, ?, ?, ?, ?)
            """, (
                entry.get("source_file", "MEMORY.md"),
                memory_id,
                norm_path,
                now,
                entry["hash"],
            ))
            synced_count += 1

        except Exception as e:
            logger.error(f"Native->MCP: failed to sync entry: {e}")
            errors.append(str(e))

    # Single commit covers all per-entry inserts above.
    db.conn.commit()

    return {
        "success": True,
        "synced": synced_count,
        "total_entries": len(entries),
        "new_entries": len(new_entries),
        "errors": errors if errors else None,
    }
|
|
412
|
+
|
|
413
|
+
|
|
414
|
+
def _parse_markdown_entries(content: str, source_file: str = "MEMORY.md") -> List[Dict[str, Any]]:
|
|
415
|
+
"""Parse markdown into discrete entries for import.
|
|
416
|
+
|
|
417
|
+
Splits on ## headers. Each section becomes one entry.
|
|
418
|
+
Bullet groups under a section are kept together.
|
|
419
|
+
Very short entries (< 20 chars) are skipped.
|
|
420
|
+
"""
|
|
421
|
+
if not content.strip():
|
|
422
|
+
return []
|
|
423
|
+
|
|
424
|
+
entries = []
|
|
425
|
+
lines = content.splitlines()
|
|
426
|
+
|
|
427
|
+
current_section = ""
|
|
428
|
+
current_lines = []
|
|
429
|
+
|
|
430
|
+
for line in lines:
|
|
431
|
+
if line.startswith("## "):
|
|
432
|
+
# Flush previous section
|
|
433
|
+
if current_lines:
|
|
434
|
+
text = "\n".join(current_lines).strip()
|
|
435
|
+
if len(text) >= 20:
|
|
436
|
+
entries.append({
|
|
437
|
+
"content": text,
|
|
438
|
+
"section": current_section,
|
|
439
|
+
"source_file": source_file,
|
|
440
|
+
})
|
|
441
|
+
current_section = line[3:].strip()
|
|
442
|
+
current_lines = [line]
|
|
443
|
+
elif line.startswith("# ") and not current_lines:
|
|
444
|
+
# Top-level heading, skip (it's the file title)
|
|
445
|
+
continue
|
|
446
|
+
else:
|
|
447
|
+
current_lines.append(line)
|
|
448
|
+
|
|
449
|
+
# Flush last section
|
|
450
|
+
if current_lines:
|
|
451
|
+
text = "\n".join(current_lines).strip()
|
|
452
|
+
if len(text) >= 20:
|
|
453
|
+
entries.append({
|
|
454
|
+
"content": text,
|
|
455
|
+
"section": current_section,
|
|
456
|
+
"source_file": source_file,
|
|
457
|
+
})
|
|
458
|
+
|
|
459
|
+
return entries
|
|
460
|
+
|
|
461
|
+
|
|
462
|
+
# ── Combined sync ─────────────────────────────────────────────────────────
|
|
463
|
+
|
|
464
|
+
|
|
465
|
+
async def sync_bidirectional(
    db,
    embeddings,
    project_path: str,
) -> Dict[str, Any]:
    """Run both sync directions. Used at session end.

    Args:
        db: DatabaseService instance
        embeddings: EmbeddingService instance (needed for native->MCP)
        project_path: Absolute project path

    Returns:
        Dict with results from both directions
    """
    outcome: Dict[str, Any] = {}

    # Direction A first: cheap, no embedding calls involved.
    try:
        outcome["mcp_to_native"] = await sync_mcp_to_native(db, project_path)
    except Exception as e:
        logger.error(f"Bidirectional sync MCP->Native failed: {e}")
        outcome["mcp_to_native"] = {"success": False, "error": str(e)}

    # Direction B second: requires the embedding service.
    try:
        outcome["native_to_mcp"] = await sync_native_to_mcp(db, embeddings, project_path)
    except Exception as e:
        logger.error(f"Bidirectional sync Native->MCP failed: {e}")
        outcome["native_to_mcp"] = {"success": False, "error": str(e)}

    return outcome
|
|
@@ -0,0 +1,183 @@
|
|
|
1
|
+
"""Response size management with progressive degradation.
|
|
2
|
+
|
|
3
|
+
Ensures MCP tool responses stay within Claude Code's token limits
|
|
4
|
+
by applying increasingly aggressive size reduction strategies.
|
|
5
|
+
"""
|
|
6
|
+
import json
|
|
7
|
+
import logging
|
|
8
|
+
from typing import Any, Dict, List, Optional
|
|
9
|
+
|
|
10
|
+
from config import config
|
|
11
|
+
|
|
12
|
+
logger = logging.getLogger(__name__)
|
|
13
|
+
|
|
14
|
+
# Fields added by graph enrichment that are safe to strip when a response
# must shrink: dropping them loses supplementary context, not core results.
GRAPH_ENRICHMENT_FIELDS = frozenset({
    "known_fixes", "rationale", "consequences",
    "contradictions", "causal_chain",
})

# Keys in result dicts that hold lists of memory items — the lists that
# _halve_result_lists is allowed to shorten under size pressure.
RESULT_LIST_KEYS = (
    "results", "memories", "patterns", "decisions",
    "code_patterns", "relevant_to_query", "matches",
)
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
def _json_size(data: Any, indent: Optional[int] = 2) -> int:
|
|
28
|
+
"""Return the character count of JSON-serialized data."""
|
|
29
|
+
return len(json.dumps(data, indent=indent, default=str))
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
def _strip_graph_fields(data: Any) -> Any:
|
|
33
|
+
"""Recursively remove graph enrichment fields from dicts/lists."""
|
|
34
|
+
if isinstance(data, dict):
|
|
35
|
+
return {
|
|
36
|
+
k: _strip_graph_fields(v)
|
|
37
|
+
for k, v in data.items()
|
|
38
|
+
if k not in GRAPH_ENRICHMENT_FIELDS
|
|
39
|
+
}
|
|
40
|
+
if isinstance(data, list):
|
|
41
|
+
return [_strip_graph_fields(item) for item in data]
|
|
42
|
+
return data
|
|
43
|
+
|
|
44
|
+
|
|
45
|
+
def _truncate_content_fields(data: Any, max_len: int) -> Any:
|
|
46
|
+
"""Truncate string values in 'content', 'outcome', 'solution' fields."""
|
|
47
|
+
truncatable = {"content", "outcome", "solution", "description"}
|
|
48
|
+
if isinstance(data, dict):
|
|
49
|
+
result = {}
|
|
50
|
+
for k, v in data.items():
|
|
51
|
+
if k in truncatable and isinstance(v, str) and len(v) > max_len:
|
|
52
|
+
result[k] = v[:max_len] + "..."
|
|
53
|
+
else:
|
|
54
|
+
result[k] = _truncate_content_fields(v, max_len)
|
|
55
|
+
return result
|
|
56
|
+
if isinstance(data, list):
|
|
57
|
+
return [_truncate_content_fields(item, max_len) for item in data]
|
|
58
|
+
return data
|
|
59
|
+
|
|
60
|
+
|
|
61
|
+
def _halve_result_lists(data: Any, min_count: int) -> Any:
|
|
62
|
+
"""Reduce list-type result fields to at most half their size (min min_count)."""
|
|
63
|
+
if not isinstance(data, dict):
|
|
64
|
+
return data
|
|
65
|
+
result = {}
|
|
66
|
+
for k, v in data.items():
|
|
67
|
+
if k in RESULT_LIST_KEYS and isinstance(v, list) and len(v) > min_count:
|
|
68
|
+
new_len = max(len(v) // 2, min_count)
|
|
69
|
+
result[k] = v[:new_len]
|
|
70
|
+
else:
|
|
71
|
+
result[k] = _halve_result_lists(v, min_count)
|
|
72
|
+
return result
|
|
73
|
+
|
|
74
|
+
|
|
75
|
+
def fit_response(
    data: Any,
    max_chars: Optional[int] = None,
) -> str:
    """Serialize data to JSON, applying progressive degradation if too large.

    Degradation levels:
        0 - Full response with indent=2
        1 - Compact JSON (no indent)
        2 - Strip graph enrichment fields
        3 - Truncate content fields to CONTENT_TRUNCATE_LENGTH
        4 - Halve result list counts (min MIN_RESULT_COUNT)
        5 - Emergency hard truncation

    Args:
        data: JSON-serializable payload (non-serializable values are
            stringified via default=str).
        max_chars: Size cap; defaults to config.MAX_RESPONSE_CHARS.

    Returns:
        JSON string no longer than max_chars (assuming max_chars leaves room
        for the metadata object itself). At level 5 the payload portion is
        cut mid-stream and is NOT valid JSON on its own; the trailing
        metadata object flags this via "truncated": true.
    """
    if max_chars is None:
        max_chars = config.MAX_RESPONSE_CHARS

    working = data

    # Level 0: full pretty-printed JSON.
    output = json.dumps(working, indent=2, default=str)
    if len(output) <= max_chars:
        return output

    # Level 1: compact JSON.
    level = 1
    output = json.dumps(working, default=str)
    if len(output) <= max_chars:
        return _with_meta(output, working, level, max_chars)

    # Level 2: strip graph enrichment fields.
    level = 2
    working = _strip_graph_fields(working)
    output = json.dumps(working, default=str)
    if len(output) <= max_chars:
        return _with_meta(output, working, level, max_chars)

    # Level 3: truncate content fields.
    level = 3
    working = _truncate_content_fields(working, config.CONTENT_TRUNCATE_LENGTH)
    output = json.dumps(working, default=str)
    if len(output) <= max_chars:
        return _with_meta(output, working, level, max_chars)

    # Level 4: halve result counts.
    level = 4
    working = _halve_result_lists(working, config.MIN_RESULT_COUNT)
    output = json.dumps(working, default=str)
    if len(output) <= max_chars:
        return _with_meta(output, working, level, max_chars)

    # Level 5: emergency hard truncation.
    level = 5
    logger.warning(
        "Response required emergency truncation: %d -> %d chars",
        len(output), max_chars,
    )
    # BUGFIX: build the metadata suffix FIRST so the truncation point can
    # account for its actual size. The old fixed 100-char reserve was
    # smaller than the metadata object, so the result could exceed
    # max_chars despite the documented guarantee.
    meta = json.dumps({
        "_response_meta": {
            "degradation_level": level,
            "truncated": True,
            "original_chars": _json_size(data, indent=None),
            "note": "Response was emergency-truncated. Use specific queries to retrieve full data.",
        }
    })
    keep = max(max_chars - len(meta) - 1, 0)  # -1 for the joining newline
    return output[:keep] + "\n" + meta
|
|
147
|
+
|
|
148
|
+
|
|
149
|
+
def _with_meta(
|
|
150
|
+
compact_json: str,
|
|
151
|
+
working_data: Any,
|
|
152
|
+
level: int,
|
|
153
|
+
max_chars: int,
|
|
154
|
+
) -> str:
|
|
155
|
+
"""Inject _response_meta into the serialized response."""
|
|
156
|
+
if not isinstance(working_data, dict):
|
|
157
|
+
return compact_json
|
|
158
|
+
|
|
159
|
+
meta = {
|
|
160
|
+
"degradation_level": level,
|
|
161
|
+
"truncated": False,
|
|
162
|
+
"note": _level_description(level),
|
|
163
|
+
}
|
|
164
|
+
working_data["_response_meta"] = meta
|
|
165
|
+
output = json.dumps(working_data, default=str)
|
|
166
|
+
|
|
167
|
+
# If adding meta pushes us over, return without meta
|
|
168
|
+
if len(output) > max_chars:
|
|
169
|
+
del working_data["_response_meta"]
|
|
170
|
+
return compact_json
|
|
171
|
+
|
|
172
|
+
return output
|
|
173
|
+
|
|
174
|
+
|
|
175
|
+
def _level_description(level: int) -> str:
|
|
176
|
+
descriptions = {
|
|
177
|
+
1: "Compact JSON (whitespace removed)",
|
|
178
|
+
2: "Graph enrichment fields stripped",
|
|
179
|
+
3: "Content fields truncated",
|
|
180
|
+
4: "Result counts reduced",
|
|
181
|
+
5: "Emergency truncation applied",
|
|
182
|
+
}
|
|
183
|
+
return descriptions.get(level, "Unknown degradation")
|