PyPI - agent-cli - Versions diffs - 0.70.5__py3-none-any.whl - Mend

agent-cli 0.70.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (196) hide show

agent_cli/__init__.py +5 -0
agent_cli/__main__.py +6 -0
agent_cli/_extras.json +14 -0
agent_cli/_requirements/.gitkeep +0 -0
agent_cli/_requirements/audio.txt +79 -0
agent_cli/_requirements/faster-whisper.txt +215 -0
agent_cli/_requirements/kokoro.txt +425 -0
agent_cli/_requirements/llm.txt +183 -0
agent_cli/_requirements/memory.txt +355 -0
agent_cli/_requirements/mlx-whisper.txt +222 -0
agent_cli/_requirements/piper.txt +176 -0
agent_cli/_requirements/rag.txt +402 -0
agent_cli/_requirements/server.txt +154 -0
agent_cli/_requirements/speed.txt +77 -0
agent_cli/_requirements/vad.txt +155 -0
agent_cli/_requirements/wyoming.txt +71 -0
agent_cli/_tools.py +368 -0
agent_cli/agents/__init__.py +23 -0
agent_cli/agents/_voice_agent_common.py +136 -0
agent_cli/agents/assistant.py +383 -0
agent_cli/agents/autocorrect.py +284 -0
agent_cli/agents/chat.py +496 -0
agent_cli/agents/memory/__init__.py +31 -0
agent_cli/agents/memory/add.py +190 -0
agent_cli/agents/memory/proxy.py +160 -0
agent_cli/agents/rag_proxy.py +128 -0
agent_cli/agents/speak.py +209 -0
agent_cli/agents/transcribe.py +671 -0
agent_cli/agents/transcribe_daemon.py +499 -0
agent_cli/agents/voice_edit.py +291 -0
agent_cli/api.py +22 -0
agent_cli/cli.py +106 -0
agent_cli/config.py +503 -0
agent_cli/config_cmd.py +307 -0
agent_cli/constants.py +27 -0
agent_cli/core/__init__.py +1 -0
agent_cli/core/audio.py +461 -0
agent_cli/core/audio_format.py +299 -0
agent_cli/core/chroma.py +88 -0
agent_cli/core/deps.py +191 -0
agent_cli/core/openai_proxy.py +139 -0
agent_cli/core/process.py +195 -0
agent_cli/core/reranker.py +120 -0
agent_cli/core/sse.py +87 -0
agent_cli/core/transcription_logger.py +70 -0
agent_cli/core/utils.py +526 -0
agent_cli/core/vad.py +175 -0
agent_cli/core/watch.py +65 -0
agent_cli/dev/__init__.py +14 -0
agent_cli/dev/cli.py +1588 -0
agent_cli/dev/coding_agents/__init__.py +19 -0
agent_cli/dev/coding_agents/aider.py +24 -0
agent_cli/dev/coding_agents/base.py +167 -0
agent_cli/dev/coding_agents/claude.py +39 -0
agent_cli/dev/coding_agents/codex.py +24 -0
agent_cli/dev/coding_agents/continue_dev.py +15 -0
agent_cli/dev/coding_agents/copilot.py +24 -0
agent_cli/dev/coding_agents/cursor_agent.py +48 -0
agent_cli/dev/coding_agents/gemini.py +28 -0
agent_cli/dev/coding_agents/opencode.py +15 -0
agent_cli/dev/coding_agents/registry.py +49 -0
agent_cli/dev/editors/__init__.py +19 -0
agent_cli/dev/editors/base.py +89 -0
agent_cli/dev/editors/cursor.py +15 -0
agent_cli/dev/editors/emacs.py +46 -0
agent_cli/dev/editors/jetbrains.py +56 -0
agent_cli/dev/editors/nano.py +31 -0
agent_cli/dev/editors/neovim.py +33 -0
agent_cli/dev/editors/registry.py +59 -0
agent_cli/dev/editors/sublime.py +20 -0
agent_cli/dev/editors/vim.py +42 -0
agent_cli/dev/editors/vscode.py +15 -0
agent_cli/dev/editors/zed.py +20 -0
agent_cli/dev/project.py +568 -0
agent_cli/dev/registry.py +52 -0
agent_cli/dev/skill/SKILL.md +141 -0
agent_cli/dev/skill/examples.md +571 -0
agent_cli/dev/terminals/__init__.py +19 -0
agent_cli/dev/terminals/apple_terminal.py +82 -0
agent_cli/dev/terminals/base.py +56 -0
agent_cli/dev/terminals/gnome.py +51 -0
agent_cli/dev/terminals/iterm2.py +84 -0
agent_cli/dev/terminals/kitty.py +77 -0
agent_cli/dev/terminals/registry.py +48 -0
agent_cli/dev/terminals/tmux.py +58 -0
agent_cli/dev/terminals/warp.py +132 -0
agent_cli/dev/terminals/zellij.py +78 -0
agent_cli/dev/worktree.py +856 -0
agent_cli/docs_gen.py +417 -0
agent_cli/example-config.toml +185 -0
agent_cli/install/__init__.py +5 -0
agent_cli/install/common.py +89 -0
agent_cli/install/extras.py +174 -0
agent_cli/install/hotkeys.py +48 -0
agent_cli/install/services.py +87 -0
agent_cli/memory/__init__.py +7 -0
agent_cli/memory/_files.py +250 -0
agent_cli/memory/_filters.py +63 -0
agent_cli/memory/_git.py +157 -0
agent_cli/memory/_indexer.py +142 -0
agent_cli/memory/_ingest.py +408 -0
agent_cli/memory/_persistence.py +182 -0
agent_cli/memory/_prompt.py +91 -0
agent_cli/memory/_retrieval.py +294 -0
agent_cli/memory/_store.py +169 -0
agent_cli/memory/_streaming.py +44 -0
agent_cli/memory/_tasks.py +48 -0
agent_cli/memory/api.py +113 -0
agent_cli/memory/client.py +272 -0
agent_cli/memory/engine.py +361 -0
agent_cli/memory/entities.py +43 -0
agent_cli/memory/models.py +112 -0
agent_cli/opts.py +433 -0
agent_cli/py.typed +0 -0
agent_cli/rag/__init__.py +3 -0
agent_cli/rag/_indexer.py +67 -0
agent_cli/rag/_indexing.py +226 -0
agent_cli/rag/_prompt.py +30 -0
agent_cli/rag/_retriever.py +156 -0
agent_cli/rag/_store.py +48 -0
agent_cli/rag/_utils.py +218 -0
agent_cli/rag/api.py +175 -0
agent_cli/rag/client.py +299 -0
agent_cli/rag/engine.py +302 -0
agent_cli/rag/models.py +55 -0
agent_cli/scripts/.runtime/.gitkeep +0 -0
agent_cli/scripts/__init__.py +1 -0
agent_cli/scripts/check_plugin_skill_sync.py +50 -0
agent_cli/scripts/linux-hotkeys/README.md +63 -0
agent_cli/scripts/linux-hotkeys/toggle-autocorrect.sh +45 -0
agent_cli/scripts/linux-hotkeys/toggle-transcription.sh +58 -0
agent_cli/scripts/linux-hotkeys/toggle-voice-edit.sh +58 -0
agent_cli/scripts/macos-hotkeys/README.md +45 -0
agent_cli/scripts/macos-hotkeys/skhd-config-example +5 -0
agent_cli/scripts/macos-hotkeys/toggle-autocorrect.sh +12 -0
agent_cli/scripts/macos-hotkeys/toggle-transcription.sh +37 -0
agent_cli/scripts/macos-hotkeys/toggle-voice-edit.sh +37 -0
agent_cli/scripts/nvidia-asr-server/README.md +99 -0
agent_cli/scripts/nvidia-asr-server/pyproject.toml +27 -0
agent_cli/scripts/nvidia-asr-server/server.py +255 -0
agent_cli/scripts/nvidia-asr-server/shell.nix +32 -0
agent_cli/scripts/nvidia-asr-server/uv.lock +4654 -0
agent_cli/scripts/run-openwakeword.sh +11 -0
agent_cli/scripts/run-piper-windows.ps1 +30 -0
agent_cli/scripts/run-piper.sh +24 -0
agent_cli/scripts/run-whisper-linux.sh +40 -0
agent_cli/scripts/run-whisper-macos.sh +6 -0
agent_cli/scripts/run-whisper-windows.ps1 +51 -0
agent_cli/scripts/run-whisper.sh +9 -0
agent_cli/scripts/run_faster_whisper_server.py +136 -0
agent_cli/scripts/setup-linux-hotkeys.sh +72 -0
agent_cli/scripts/setup-linux.sh +108 -0
agent_cli/scripts/setup-macos-hotkeys.sh +61 -0
agent_cli/scripts/setup-macos.sh +76 -0
agent_cli/scripts/setup-windows.ps1 +63 -0
agent_cli/scripts/start-all-services-windows.ps1 +53 -0
agent_cli/scripts/start-all-services.sh +178 -0
agent_cli/scripts/sync_extras.py +138 -0
agent_cli/server/__init__.py +3 -0
agent_cli/server/cli.py +721 -0
agent_cli/server/common.py +222 -0
agent_cli/server/model_manager.py +288 -0
agent_cli/server/model_registry.py +225 -0
agent_cli/server/proxy/__init__.py +3 -0
agent_cli/server/proxy/api.py +444 -0
agent_cli/server/streaming.py +67 -0
agent_cli/server/tts/__init__.py +3 -0
agent_cli/server/tts/api.py +335 -0
agent_cli/server/tts/backends/__init__.py +82 -0
agent_cli/server/tts/backends/base.py +139 -0
agent_cli/server/tts/backends/kokoro.py +403 -0
agent_cli/server/tts/backends/piper.py +253 -0
agent_cli/server/tts/model_manager.py +201 -0
agent_cli/server/tts/model_registry.py +28 -0
agent_cli/server/tts/wyoming_handler.py +249 -0
agent_cli/server/whisper/__init__.py +3 -0
agent_cli/server/whisper/api.py +413 -0
agent_cli/server/whisper/backends/__init__.py +89 -0
agent_cli/server/whisper/backends/base.py +97 -0
agent_cli/server/whisper/backends/faster_whisper.py +225 -0
agent_cli/server/whisper/backends/mlx.py +270 -0
agent_cli/server/whisper/languages.py +116 -0
agent_cli/server/whisper/model_manager.py +157 -0
agent_cli/server/whisper/model_registry.py +28 -0
agent_cli/server/whisper/wyoming_handler.py +203 -0
agent_cli/services/__init__.py +343 -0
agent_cli/services/_wyoming_utils.py +64 -0
agent_cli/services/asr.py +506 -0
agent_cli/services/llm.py +228 -0
agent_cli/services/tts.py +450 -0
agent_cli/services/wake_word.py +142 -0
agent_cli-0.70.5.dist-info/METADATA +2118 -0
agent_cli-0.70.5.dist-info/RECORD +196 -0
agent_cli-0.70.5.dist-info/WHEEL +4 -0
agent_cli-0.70.5.dist-info/entry_points.txt +4 -0
agent_cli-0.70.5.dist-info/licenses/LICENSE +21 -0

agent_cli/memory/_git.py ADDED Viewed

@@ -0,0 +1,157 @@
+"""Git integration for memory versioning."""
+from __future__ import annotations
+import asyncio
+import logging
+import shutil
+import subprocess
+from typing import TYPE_CHECKING, NamedTuple
+if TYPE_CHECKING:
+    from pathlib import Path
+# Module-level logger, named after this module.
+LOGGER = logging.getLogger(__name__)
+class GitCommandResult(NamedTuple):
+    """Result of a git command execution.
+
+    Returned by both the synchronous and asynchronous git runners in this module.
+    """
+    # Exit status of the git process.
+    returncode: int
+    # Captured standard output, decoded to text.
+    stdout: str
+    # Captured standard error, decoded to text.
+    stderr: str
+def _is_git_installed() -> bool:
+    """Check if git is available in the path."""
+    return shutil.which("git") is not None
+def _run_git_sync(
+    args: list[str],
+    cwd: Path,
+    check: bool = True,
+) -> GitCommandResult:
+    """Run a git command synchronously."""
+    proc = subprocess.run(
+        ["git", *args],  # noqa: S607
+        cwd=cwd,
+        check=check,
+        capture_output=True,
+        text=True,
+        encoding="utf-8",
+        errors="replace",
+    )
+    return GitCommandResult(proc.returncode, proc.stdout, proc.stderr)
+async def _run_git_async(
+    args: list[str],
+    cwd: Path,
+    check: bool = True,
+) -> GitCommandResult:
+    """Run a git command asynchronously."""
+    proc = await asyncio.create_subprocess_exec(
+        "git",
+        *args,
+        cwd=cwd,
+        stdout=asyncio.subprocess.PIPE,
+        stderr=asyncio.subprocess.PIPE,
+    )
+    stdout, stderr = await proc.communicate()
+    assert proc.returncode is not None
+    stdout_text = stdout.decode("utf-8", errors="replace")
+    stderr_text = stderr.decode("utf-8", errors="replace")
+    if check and proc.returncode != 0:
+        raise subprocess.CalledProcessError(
+            proc.returncode,
+            ["git", *args],
+            output=stdout_text,
+            stderr=stderr_text,
+        )
+    return GitCommandResult(proc.returncode, stdout_text, stderr_text)
+def init_repo(path: Path) -> None:
+    """Initialize a git repository if one does not exist."""
+    if not _is_git_installed():
+        LOGGER.warning("Git is not installed; skipping repository initialization.")
+        return
+    if (path / ".git").exists():
+        return
+    try:
+        LOGGER.info("Initializing git repository in %s", path)
+        _run_git_sync(["init"], cwd=path)
+        # Configure local user if not set (to avoid commit errors)
+        try:
+            _run_git_sync(["config", "user.email"], cwd=path)
+        except subprocess.CalledProcessError:
+            # No email configured, set local config
+            _run_git_sync(["config", "user.email", "agent-cli@local"], cwd=path)
+            _run_git_sync(["config", "user.name", "Agent CLI"], cwd=path)
+        # Create .gitignore to exclude derived data (vector db, cache)
+        gitignore_path = path / ".gitignore"
+        if not gitignore_path.exists():
+            gitignore_content = "chroma/\nmemory_index.json\n__pycache__/\n*.tmp\n.DS_Store\n"
+            gitignore_path.write_text(gitignore_content, encoding="utf-8")
+        # Create README.md
+        readme_path = path / "README.md"
+        if not readme_path.exists():
+            readme_content = (
+                "# Agent Memory Store\n\n"
+                "This repository contains the long-term memory for the Agent CLI.\n"
+                "Files are automatically managed and versioned by the memory proxy.\n\n"
+                "- `entries/`: Markdown files containing facts and conversation logs.\n"
+                "- `deleted/`: Soft-deleted memories (tombstones).\n"
+            )
+            readme_path.write_text(readme_content, encoding="utf-8")
+        # Initial commit
+        _run_git_sync(["add", "."], cwd=path)
+        _run_git_sync(
+            ["commit", "--allow-empty", "-m", "Initial commit"],
+            cwd=path,
+            check=False,
+        )
+    except subprocess.CalledProcessError:
+        LOGGER.exception("Failed to initialize git repo")
+async def commit_changes(path: Path, message: str) -> None:
+    """Stage and commit all changes in the given path."""
+    if not _is_git_installed():
+        return
+    if not (path / ".git").exists():
+        LOGGER.warning("Not a git repository: %s", path)
+        return
+    try:
+        # Check if there are changes
+        status = await _run_git_async(
+            ["status", "--porcelain"],
+            cwd=path,
+            check=False,
+        )
+        if status.returncode != 0:
+            LOGGER.error("Failed to check git status")
+            return
+        if not status.stdout.strip():
+            return  # Nothing to commit
+        LOGGER.info("Committing changes to memory store: %s", message)
+        await _run_git_async(["add", "."], cwd=path)
+        await _run_git_async(["commit", "-m", message], cwd=path)
+    except Exception:
+        LOGGER.exception("Failed to commit changes")

agent_cli/memory/_indexer.py ADDED Viewed

@@ -0,0 +1,142 @@
+"""File watcher and indexing for file-backed memories."""
+from __future__ import annotations
+import logging
+from dataclasses import dataclass, field
+from typing import TYPE_CHECKING
+from agent_cli.core.watch import watch_directory
+from agent_cli.memory._files import (
+    _DELETED_DIRNAME,
+    MemoryFileRecord,
+    ensure_store_dirs,
+    load_memory_files,
+    load_snapshot,
+    read_memory_file,
+    write_snapshot,
+)
+from agent_cli.memory._store import delete_entries, upsert_memories
+if TYPE_CHECKING:
+    from pathlib import Path
+    from chromadb import Collection
+    from watchfiles import Change
+# Module-level logger, named after this module.
+LOGGER = logging.getLogger(__name__)
+@dataclass
+class MemoryIndex:
+    """In-memory view of memory files plus a JSON snapshot on disk."""
+    entries: dict[str, MemoryFileRecord] = field(default_factory=dict)
+    snapshot_path: Path | None = None
+    @classmethod
+    def from_snapshot(cls, snapshot_path: Path) -> MemoryIndex:
+        """Restore index state from a snapshot file if present."""
+        return cls(entries=load_snapshot(snapshot_path), snapshot_path=snapshot_path)
+    def replace(self, records: list[MemoryFileRecord]) -> None:
+        """Replace the in-memory index with the given records."""
+        self.entries = {rec.id: rec for rec in records}
+        self._persist()
+    def upsert(self, record: MemoryFileRecord) -> None:
+        """Insert or update a record and persist the snapshot."""
+        self.entries[record.id] = record
+        self._persist()
+    def remove(self, doc_id: str) -> None:
+        """Remove a record by id and persist the snapshot."""
+        self.entries.pop(doc_id, None)
+        self._persist()
+    def find_id_by_path(self, path: Path) -> str | None:
+        """Find a record id by its file path, if present."""
+        for doc_id, record in self.entries.items():
+            if record.path == path:
+                return doc_id
+        return None
+    def _persist(self) -> None:
+        if self.snapshot_path:
+            write_snapshot(self.snapshot_path, self.entries.values())
+def initial_index(collection: Collection, root: Path, *, index: MemoryIndex) -> None:
+    """Load memory files, reconcile against snapshot, and index into Chroma."""
+    entries_dir, snapshot_path = ensure_store_dirs(root)
+    if index.snapshot_path is None:
+        index.snapshot_path = snapshot_path
+    records = load_memory_files(root)
+    current_ids = {rec.id for rec in records}
+    # Remove stale docs that were present in last snapshot but missing now
+    stale_ids = set(index.entries) - current_ids
+    if stale_ids:
+        LOGGER.info("Removing %d stale memory docs from index", len(stale_ids))
+        delete_entries(collection, list(stale_ids))
+    if records:
+        ids = [rec.id for rec in records]
+        docs = [rec.content for rec in records]
+        metas = [rec.metadata for rec in records]
+        upsert_memories(collection, ids=ids, contents=docs, metadatas=metas)
+        LOGGER.info("Indexed %d memory docs from %s", len(records), entries_dir)
+    else:
+        LOGGER.info("No memory files found in %s", entries_dir)
+    index.replace(records)
+async def watch_memory_store(collection: Collection, root: Path, *, index: MemoryIndex) -> None:
+    """Watch the memory entries folder and keep Chroma in sync."""
+    entries_dir, snapshot_path = ensure_store_dirs(root)
+    if index.snapshot_path is None:
+        index.snapshot_path = snapshot_path
+    LOGGER.info("📁 Watching memory store: %s", entries_dir)
+    await watch_directory(
+        entries_dir,
+        lambda change, path: _handle_change(change, path, collection, index),
+    )
+def _handle_change(change: Change, path: Path, collection: Collection, index: MemoryIndex) -> None:
+    from watchfiles import Change  # noqa: PLC0415
+    if path.suffix == ".tmp":
+        return
+    if _DELETED_DIRNAME in path.parts:
+        return
+    if change == Change.deleted:
+        doc_id = index.find_id_by_path(path)
+        if not doc_id:
+            # Fallback: try to parse ID from filename (timestamp__uuid.md)
+            parts = path.stem.split("__")
+            doc_id = parts[-1] if len(parts) > 1 else path.stem
+        LOGGER.info("[deleted] %s", path.name)
+        delete_entries(collection, [doc_id])
+        index.remove(doc_id)
+        return
+    if change in {Change.added, Change.modified}:
+        action = "added" if change == Change.added else "modified"
+        LOGGER.info("[%s] %s", action, path.name)
+        record = read_memory_file(path)
+        if not record:
+            return
+        upsert_memories(
+            collection,
+            ids=[record.id],
+            contents=[record.content],
+            metadatas=[record.metadata],
+        )
+        index.upsert(record)

agent_cli/memory/_ingest.py ADDED Viewed

@@ -0,0 +1,408 @@
+"""Ingestion logic for memory (LLM Extraction, Reconciliation, Summarization)."""
+from __future__ import annotations
+import json
+import logging
+from datetime import UTC, datetime
+from time import perf_counter
+from typing import TYPE_CHECKING
+from uuid import uuid4
+from agent_cli.memory._git import commit_changes
+from agent_cli.memory._persistence import delete_memory_files, persist_entries, persist_summary
+from agent_cli.memory._prompt import (
+    FACT_INSTRUCTIONS,
+    FACT_SYSTEM_PROMPT,
+    SUMMARY_PROMPT,
+    UPDATE_MEMORY_PROMPT,
+)
+from agent_cli.memory._retrieval import gather_relevant_existing_memories
+from agent_cli.memory._store import delete_entries, get_summary_entry
+from agent_cli.memory.entities import Fact, Summary
+from agent_cli.memory.models import (
+    MemoryAdd,
+    MemoryDecision,
+    MemoryDelete,
+    MemoryIgnore,
+    MemoryUpdate,
+    SummaryOutput,
+)
+if TYPE_CHECKING:
+    from pathlib import Path
+    from chromadb import Collection
+# Module-level logger, named after this module.
+LOGGER = logging.getLogger(__name__)
+# Role value passed to get_summary_entry when looking up a conversation's stored summary.
+_SUMMARY_ROLE = "summary"
+def _elapsed_ms(start: float) -> float:
+    """Return elapsed milliseconds since start."""
+    return (perf_counter() - start) * 1000
+async def extract_salient_facts(
+    *,
+    user_message: str | None,
+    assistant_message: str | None,
+    openai_base_url: str,
+    api_key: str | None,
+    model: str,
+) -> list[str]:
+    """Run an LLM agent to extract facts from the transcript."""
+    if not user_message and not assistant_message:
+        return []
+    import httpx  # noqa: PLC0415
+    from pydantic_ai import Agent  # noqa: PLC0415
+    from pydantic_ai.exceptions import AgentRunError, UnexpectedModelBehavior  # noqa: PLC0415
+    from pydantic_ai.models.openai import OpenAIChatModel  # noqa: PLC0415
+    from pydantic_ai.providers.openai import OpenAIProvider  # noqa: PLC0415
+    # Extract facts from the latest user turn only (ignore assistant/system).
+    transcript = user_message or ""
+    LOGGER.info("Extracting facts from transcript: %r", transcript)
+    provider = OpenAIProvider(api_key=api_key or "dummy", base_url=openai_base_url)
+    model_cfg = OpenAIChatModel(model_name=model, provider=provider)
+    agent = Agent(
+        model=model_cfg,
+        system_prompt=FACT_SYSTEM_PROMPT,
+        output_type=list[str],
+        retries=2,
+    )
+    instructions = FACT_INSTRUCTIONS
+    try:
+        facts = await agent.run(transcript, instructions=instructions)
+        LOGGER.info("Raw fact extraction output: %s", facts.output)
+        return facts.output
+    except (httpx.HTTPError, AgentRunError, UnexpectedModelBehavior):
+        LOGGER.warning("PydanticAI fact extraction transient failure", exc_info=True)
+        return []
+    except Exception:
+        LOGGER.exception("PydanticAI fact extraction internal error")
+        raise
+def process_reconciliation_decisions(
+    decisions: list[MemoryDecision],
+    id_map: dict[int, str],
+    conversation_id: str,
+    source_id: str,
+    created_at: datetime,
+) -> tuple[list[Fact], list[str], dict[str, str]]:
+    """Process LLM decisions into actionable changes."""
+    to_add: list[Fact] = []
+    to_delete: list[str] = []
+    replacement_map: dict[str, str] = {}
+    LOGGER.info(
+        "Reconcile decisions raw: %s",
+        [d.model_dump() for d in decisions],
+    )
+    for dec in decisions:
+        if isinstance(dec, MemoryAdd):
+            text = dec.text.strip()
+            if text:
+                to_add.append(
+                    Fact(
+                        id=str(uuid4()),
+                        conversation_id=conversation_id,
+                        content=text,
+                        source_id=source_id,
+                        created_at=created_at,
+                    ),
+                )
+        elif isinstance(dec, MemoryUpdate):
+            text = dec.text.strip()
+            if text:
+                # Update existing memory: delete old, add new
+                orig = id_map[dec.id]  # Guaranteed valid by output_validator
+                new_id = str(uuid4())
+                to_delete.append(orig)
+                to_add.append(
+                    Fact(
+                        id=new_id,
+                        conversation_id=conversation_id,
+                        content=text,
+                        source_id=source_id,
+                        created_at=created_at,
+                    ),
+                )
+                replacement_map[orig] = new_id
+        elif isinstance(dec, MemoryDelete):
+            to_delete.append(id_map[dec.id])  # Guaranteed valid by output_validator
+        elif isinstance(dec, MemoryIgnore):
+            pass  # NONE ignored
+    return to_add, to_delete, replacement_map
+async def reconcile_facts(
+    collection: Collection,
+    conversation_id: str,
+    new_facts: list[str],
+    source_id: str,
+    created_at: datetime,
+    *,
+    openai_base_url: str,
+    api_key: str | None,
+    model: str,
+) -> tuple[list[Fact], list[str], dict[str, str]]:
+    """Use an LLM to decide add/update/delete/none for facts, with id remapping."""
+    if not new_facts:
+        return [], [], {}
+    existing = gather_relevant_existing_memories(collection, conversation_id, new_facts)
+    LOGGER.info("Reconcile: Found %d existing memories for new facts %s", len(existing), new_facts)
+    if not existing:
+        LOGGER.info("Reconcile: no existing memory facts; defaulting to add all new facts")
+        entries = [
+            Fact(
+                id=str(uuid4()),
+                conversation_id=conversation_id,
+                content=f,
+                source_id=source_id,
+                created_at=created_at,
+            )
+            for f in new_facts
+            if f.strip()
+        ]
+        return entries, [], {}
+    import httpx  # noqa: PLC0415
+    from pydantic_ai import Agent, ModelRetry, PromptedOutput  # noqa: PLC0415
+    from pydantic_ai.exceptions import AgentRunError, UnexpectedModelBehavior  # noqa: PLC0415
+    from pydantic_ai.models.openai import OpenAIChatModel  # noqa: PLC0415
+    from pydantic_ai.providers.openai import OpenAIProvider  # noqa: PLC0415
+    from pydantic_ai.settings import ModelSettings  # noqa: PLC0415
+    id_map: dict[int, str] = {idx: mem.id for idx, mem in enumerate(existing)}
+    existing_json = [{"id": idx, "text": mem.content} for idx, mem in enumerate(existing)]
+    existing_ids = set(id_map.keys())
+    provider = OpenAIProvider(api_key=api_key or "dummy", base_url=openai_base_url)
+    model_cfg = OpenAIChatModel(
+        model_name=model,
+        provider=provider,
+        settings=ModelSettings(temperature=0.0, max_tokens=512),
+    )
+    agent = Agent(
+        model=model_cfg,
+        system_prompt=UPDATE_MEMORY_PROMPT,
+        output_type=PromptedOutput(list[MemoryDecision]),  # JSON mode instead of tool calls
+        retries=3,
+    )
+    @agent.output_validator
+    def validate_decisions(decisions: list[MemoryDecision]) -> list[MemoryDecision]:
+        """Validate LLM decisions and provide feedback for retry."""
+        errors = []
+        for dec in decisions:
+            if (
+                isinstance(dec, (MemoryUpdate, MemoryDelete, MemoryIgnore))
+                and dec.id not in existing_ids
+            ):
+                if isinstance(dec, MemoryUpdate):
+                    errors.append(
+                        f"UPDATE with id={dec.id} is invalid: that ID doesn't exist. "
+                        f"Valid existing IDs are: {sorted(existing_ids)}. "
+                        f"For NEW facts, use ADD with a new ID.",
+                    )
+                elif isinstance(dec, MemoryDelete):
+                    errors.append(f"DELETE with id={dec.id} is invalid: that ID doesn't exist.")
+                else:  # MemoryIgnore (NONE)
+                    errors.append(f"NONE with id={dec.id} is invalid: that ID doesn't exist.")
+        if errors:
+            msg = "Invalid memory decisions:\n" + "\n".join(f"- {e}" for e in errors)
+            raise ModelRetry(msg)
+        return decisions
+    # Format with separate sections for existing and new facts
+    existing_str = json.dumps(existing_json, ensure_ascii=False, indent=2)
+    new_facts_str = json.dumps(new_facts, ensure_ascii=False, indent=2)
+    payload = f"""Current memory:
+```
+{existing_str}
+```
+New facts to process:
+```
+{new_facts_str}
+```"""
+    LOGGER.info("Reconcile payload: %s", payload)
+    try:
+        result = await agent.run(payload)
+        decisions = result.output
+    except (httpx.HTTPError, AgentRunError, UnexpectedModelBehavior):
+        LOGGER.warning(
+            "Update memory agent transient failure; defaulting to add all new facts",
+            exc_info=True,
+        )
+        entries = [
+            Fact(
+                id=str(uuid4()),
+                conversation_id=conversation_id,
+                content=f,
+                source_id=source_id,
+                created_at=created_at,
+            )
+            for f in new_facts
+            if f.strip()
+        ]
+        return entries, [], {}
+    except Exception:
+        LOGGER.exception("Update memory agent internal error")
+        raise
+    to_add, to_delete, replacement_map = process_reconciliation_decisions(
+        decisions,
+        id_map,
+        conversation_id=conversation_id,
+        source_id=source_id,
+        created_at=created_at,
+    )
+    LOGGER.info(
+        "Reconcile decisions: add=%d, delete=%d, events=%s",
+        len(to_add),
+        len(to_delete),
+        [dec.event for dec in decisions],
+    )
+    return to_add, to_delete, replacement_map
+async def update_summary(
+    *,
+    prior_summary: str | None,
+    new_facts: list[str],
+    openai_base_url: str,
+    api_key: str | None,
+    model: str,
+    max_tokens: int = 256,
+) -> str | None:
+    """Update the conversation summary based on new facts."""
+    if not new_facts:
+        return prior_summary
+    from pydantic_ai import Agent  # noqa: PLC0415
+    from pydantic_ai.models.openai import OpenAIChatModel  # noqa: PLC0415
+    from pydantic_ai.providers.openai import OpenAIProvider  # noqa: PLC0415
+    from pydantic_ai.settings import ModelSettings  # noqa: PLC0415
+    system_prompt = SUMMARY_PROMPT
+    user_parts: list[str] = []
+    if prior_summary:
+        user_parts.append(f"Previous summary:\n{prior_summary}")
+    user_parts.append("New facts:\n" + "\n".join(f"- {fact}" for fact in new_facts))
+    prompt_text = "\n\n".join(user_parts)
+    provider = OpenAIProvider(api_key=api_key or "dummy", base_url=openai_base_url)
+    model_cfg = OpenAIChatModel(
+        model_name=model,
+        provider=provider,
+        settings=ModelSettings(temperature=0.2, max_tokens=max_tokens),
+    )
+    agent = Agent(model=model_cfg, system_prompt=system_prompt, output_type=SummaryOutput)
+    result = await agent.run(prompt_text)
+    return result.output.summary or prior_summary
+async def extract_and_store_facts_and_summaries(
+    *,
+    collection: Collection,
+    memory_root: Path,
+    conversation_id: str,
+    user_message: str | None,
+    assistant_message: str | None,
+    openai_base_url: str,
+    api_key: str | None,
+    model: str,
+    enable_git_versioning: bool = False,
+    source_id: str | None = None,
+    enable_summarization: bool = True,
+) -> None:
+    """Run fact extraction and summary updates, persisting results."""
+    fact_start = perf_counter()
+    effective_source_id = source_id or str(uuid4())
+    fact_created_at = datetime.now(UTC)
+    facts = await extract_salient_facts(
+        user_message=user_message,
+        assistant_message=assistant_message,
+        openai_base_url=openai_base_url,
+        api_key=api_key,
+        model=model,
+    )
+    LOGGER.info(
+        "Fact extraction produced %d facts in %.1f ms (conversation=%s)",
+        len(facts),
+        _elapsed_ms(fact_start),
+        conversation_id,
+    )
+    to_add, to_delete, replacement_map = await reconcile_facts(
+        collection,
+        conversation_id,
+        facts,
+        source_id=effective_source_id,
+        created_at=fact_created_at,
+        openai_base_url=openai_base_url,
+        api_key=api_key,
+        model=model,
+    )
+    if to_delete:
+        delete_entries(collection, ids=list(to_delete))
+        delete_memory_files(
+            memory_root,
+            conversation_id,
+            list(to_delete),
+            replacement_map=replacement_map,
+        )
+    if to_add:
+        persist_entries(
+            collection,
+            memory_root=memory_root,
+            conversation_id=conversation_id,
+            entries=list(to_add),
+        )
+    if enable_summarization:
+        prior_summary_entry = get_summary_entry(
+            collection,
+            conversation_id,
+            role=_SUMMARY_ROLE,
+        )
+        prior_summary = prior_summary_entry.content if prior_summary_entry else None
+        summary_start = perf_counter()
+        new_summary = await update_summary(
+            prior_summary=prior_summary,
+            new_facts=facts,
+            openai_base_url=openai_base_url,
+            api_key=api_key,
+            model=model,
+        )
+        LOGGER.info(
+            "Summary update completed in %.1f ms (conversation=%s)",
+            _elapsed_ms(summary_start),
+            conversation_id,
+        )
+        if new_summary:
+            summary_obj = Summary(
+                conversation_id=conversation_id,
+                content=new_summary,
+                created_at=datetime.now(UTC),
+            )
+            persist_summary(
+                collection,
+                memory_root=memory_root,
+                summary=summary_obj,
+            )
+    if enable_git_versioning:
+        await commit_changes(memory_root, f"Add facts to conversation {conversation_id}")