PyPI - ata-coder - Versions diffs - 2.4.2__py3-none-any.whl - Mend

ata-coder 2.4.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (118) hide show

ata_coder/__init__.py +1 -0
ata_coder/agent.py +874 -0
ata_coder/agent_compact.py +190 -0
ata_coder/agent_controller.py +218 -0
ata_coder/agent_extension.py +69 -0
ata_coder/agent_routing.py +105 -0
ata_coder/agent_subsystems.py +72 -0
ata_coder/agent_tools.py +318 -0
ata_coder/agent_undo.py +63 -0
ata_coder/anthropic_client.py +465 -0
ata_coder/change_tracker.py +368 -0
ata_coder/clawd_integration.py +574 -0
ata_coder/commands/__init__.py +128 -0
ata_coder/commands/_core.py +184 -0
ata_coder/commands/_safety.py +95 -0
ata_coder/commands/_settings.py +241 -0
ata_coder/commands/_workflow.py +451 -0
ata_coder/commands.py +974 -0
ata_coder/config.py +257 -0
ata_coder/core/__init__.py +35 -0
ata_coder/core/events.py +73 -0
ata_coder/core/queue.py +85 -0
ata_coder/core/state.py +17 -0
ata_coder/event_queue.py +5 -0
ata_coder/extension.py +654 -0
ata_coder/extensions/__init__.py +1 -0
ata_coder/extensions/hello_skill.py +47 -0
ata_coder/fool_proof.py +295 -0
ata_coder/git_workflow.py +371 -0
ata_coder/gui.py +511 -0
ata_coder/llm_client.py +543 -0
ata_coder/main.py +814 -0
ata_coder/mcp_client.py +1095 -0
ata_coder/memory.py +539 -0
ata_coder/model_registry.py +134 -0
ata_coder/model_router.py +105 -0
ata_coder/permissions.py +274 -0
ata_coder/privilege.py +464 -0
ata_coder/project.py +273 -0
ata_coder/prompt_template.py +423 -0
ata_coder/prompts/auto-mode.md +7 -0
ata_coder/prompts/coding-rules.md +40 -0
ata_coder/prompts/execution-guardrails.md +14 -0
ata_coder/prompts/memory-system.md +24 -0
ata_coder/prompts/output-style.md +23 -0
ata_coder/prompts/safety.md +17 -0
ata_coder/prompts/slash-commands.md +24 -0
ata_coder/prompts/sub-agents.md +38 -0
ata_coder/prompts/system-reminders.md +17 -0
ata_coder/prompts/system.md +105 -0
ata_coder/prompts/tool-policy.md +46 -0
ata_coder/repl_theme.py +99 -0
ata_coder/repl_tracker.py +89 -0
ata_coder/repl_ui.py +1214 -0
ata_coder/safety_guard.py +434 -0
ata_coder/self_correct.py +346 -0
ata_coder/server.py +882 -0
ata_coder/server_session.py +159 -0
ata_coder/server_shell.py +129 -0
ata_coder/session.py +431 -0
ata_coder/settings.py +439 -0
ata_coder/setup_wizard.py +136 -0
ata_coder/skill_extension.py +92 -0
ata_coder/skills/architect/SKILL.md +42 -0
ata_coder/skills/code-reviewer/SKILL.md +37 -0
ata_coder/skills/codecraft/SKILL.md +452 -0
ata_coder/skills/debugger/SKILL.md +45 -0
ata_coder/skills/doc-writer/SKILL.md +36 -0
ata_coder/skills/general-coder/SKILL.md +76 -0
ata_coder/skills/math-calculator/README.md +40 -0
ata_coder/skills/math-calculator/SKILL.md +59 -0
ata_coder/skills/math-calculator/handler.py +103 -0
ata_coder/skills/math-calculator/prompts/system.md +8 -0
ata_coder/skills/math-calculator/requirements.txt +2 -0
ata_coder/skills/math-calculator/resources/constants.json +8 -0
ata_coder/skills/math-calculator/tests/test_handler.py +53 -0
ata_coder/skills/security-auditor/SKILL.md +40 -0
ata_coder/skills/test-writer/SKILL.md +36 -0
ata_coder/skills/weather-skill/README.md +45 -0
ata_coder/skills/weather-skill/handler.py +76 -0
ata_coder/skills/weather-skill/manifest.json +48 -0
ata_coder/skills/weather-skill/prompts/system_prompt.txt +9 -0
ata_coder/skills/weather-skill/prompts/user_prompt_template.txt +3 -0
ata_coder/skills/weather-skill/requirements.txt +1 -0
ata_coder/skills/weather-skill/resources/city_list.json +17 -0
ata_coder/skills/weather-skill/resources/error_messages.json +7 -0
ata_coder/skills/weather-skill/tests/test_handler.py +28 -0
ata_coder/skills/weather-skill/weather_utils.py +50 -0
ata_coder/skills.py +1014 -0
ata_coder/sub_agent.py +273 -0
ata_coder/sub_agent_manager.py +203 -0
ata_coder/system_prompt_builder.py +146 -0
ata_coder/task_planner.py +391 -0
ata_coder/terminal.py +318 -0
ata_coder/test_runner.py +219 -0
ata_coder/thread_supervisor.py +195 -0
ata_coder/tool_defs.py +335 -0
ata_coder/tools/__init__.py +11 -0
ata_coder/tools/definitions.py +335 -0
ata_coder/tools/executor.py +1036 -0
ata_coder/tools/result.py +26 -0
ata_coder/tools/subagent.py +332 -0
ata_coder/tools/web.py +361 -0
ata_coder/tools.py +1576 -0
ata_coder/types.py +92 -0
ata_coder/utils.py +113 -0
ata_coder/web/css/style.css +180 -0
ata_coder/web/index.html +84 -0
ata_coder/web/js/app.js +489 -0
ata_coder/web/package-lock.json +25 -0
ata_coder/web/package.json +10 -0
ata_coder/web/tsconfig.json +13 -0
ata_coder-2.4.2.dist-info/METADATA +799 -0
ata_coder-2.4.2.dist-info/RECORD +118 -0
ata_coder-2.4.2.dist-info/WHEEL +5 -0
ata_coder-2.4.2.dist-info/entry_points.txt +2 -0
ata_coder-2.4.2.dist-info/licenses/LICENSE +21 -0
ata_coder-2.4.2.dist-info/top_level.txt +1 -0

ata_coder/memory.py ADDED Viewed

@@ -0,0 +1,539 @@
+"""
+Persistent memory system for ATA Coder.
+Stores facts, user preferences, feedback, and project context across sessions.
+Uses a file-based approach:
+- memory/MEMORY.md — index of all memories (loaded on startup)
+- memory/<slug>.md — individual memory files with YAML frontmatter
+Memory types:
+- user: who the user is, their preferences, expertise
+- feedback: user guidance on how the agent should work
+- project: ongoing goals, constraints, architecture decisions
+- reference: pointers to external resources (URLs, docs, etc.)
+"""
+import json
+import logging
+import os
+import re
+import threading
+from dataclasses import dataclass, field
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Any
+from .utils import try_import_yaml
+logger = logging.getLogger(__name__)
+_yaml_mod, HAS_YAML = try_import_yaml()
+# ── Memory data model ────────────────────────────────────────────────────────
+@dataclass
+class Memory:
+    """A single memory entry, persisted as a markdown file with a frontmatter header.
+    The header is YAML when a YAML module was imported and JSON otherwise; the
+    text after the closing ``---`` fence is the memory body.
+    """
+    name: str                          # kebab-case slug, used as filename
+    description: str                   # one-line summary (used for relevance)
+    content: str                       # the memory body
+    metadata: dict[str, Any] = field(default_factory=dict)  # type, tags, etc.
+    created: str = ""                  # ISO timestamp
+    updated: str = ""                  # ISO timestamp
+    @property
+    def memory_type(self) -> str:
+        """Return ``metadata["type"]``, or ``"reference"`` when it is not set."""
+        return self.metadata.get("type", "reference")
+    @property
+    def file_path(self) -> str:
+        """Return the file name this memory is stored under (``<name>.md``)."""
+        return f"{self.name}.md"
+    def to_frontmatter(self) -> str:
+        """Serialize to a markdown document with a frontmatter header.
+        ``updated`` is always written as the current UTC time and ``created``
+        falls back to the current time when it is empty.  The instance itself
+        is not modified.
+        """
+        now = datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
+        meta = {
+            "name": self.name,
+            "description": self.description,
+            "metadata": self.metadata,
+            "created": self.created or now,
+            "updated": now,
+        }
+        if _yaml_mod is not None:
+            header = _yaml_mod.dump(meta, default_flow_style=False, allow_unicode=True, sort_keys=False)
+        else:
+            header = json.dumps(meta, indent=2, ensure_ascii=False)
+        # The closing fence must start on its own line or from_frontmatter()
+        # cannot find it; json.dumps() output never ends with a newline.
+        if not header.endswith("\n"):
+            header += "\n"
+        return f"---\n{header}---\n\n{self.content}"
+    @classmethod
+    def from_frontmatter(cls, raw: str) -> "Memory | None":
+        """Parse a markdown document with a frontmatter header into a Memory.
+        Returns ``None`` when the ``---`` fences are missing, the header cannot
+        be parsed, or the parsed header is not a mapping.  Missing keys fall
+        back to ``"unknown"`` (name), ``""`` (description, created, updated)
+        and ``{}`` (metadata).
+        """
+        match = re.match(r"^---\s*\n(.*?)\n---\s*\n(.*)", raw, re.DOTALL)
+        if not match:
+            return None
+        front_str, content = match.group(1), match.group(2).strip()
+        try:
+            if _yaml_mod is not None:
+                meta = _yaml_mod.safe_load(front_str)
+            else:
+                meta = json.loads(front_str)
+        except Exception as e:
+            logger.warning("Failed to parse frontmatter: %s", e)
+            return None
+        if not isinstance(meta, dict):
+            return None
+        # A header such as "metadata:" (null) or a scalar would otherwise
+        # break memory_type, which calls .get() on this value.
+        metadata = meta.get("metadata")
+        if not isinstance(metadata, dict):
+            metadata = {}
+        return cls(
+            name=meta.get("name", "unknown"),
+            description=meta.get("description", ""),
+            content=content,
+            metadata=metadata,
+            created=meta.get("created", ""),
+            updated=meta.get("updated", ""),
+        )
+# ── Memory store ─────────────────────────────────────────────────────────────
+class MemoryStore:
+    """
+    Persistent file-based memory store.
+    On initialization, reads MEMORY.md for the index, then loads individual
+    memory files on demand or all at once.
+    """
+    def __init__(self, memory_dir: str | Path | None = None):
+        """Open the store rooted at *memory_dir* and load everything in it.
+        When *memory_dir* is None the directory comes from
+        ``get_settings().memory_dir``; if that lookup fails for any reason,
+        ``~/.ata_coder/memory`` is used.  The directory is created if missing.
+        """
+        # In-memory state; none of it depends on where the directory lives.
+        self._lock = threading.RLock()  # protect concurrent read/write
+        self._memories: dict[str, Memory] = {}
+        self._index_entries: list[str] = []  # lines from MEMORY.md
+        # IDF cache — invalidated on add/delete
+        self._idf_cache: dict[str, float] | None = None
+        self._idf_doc_count: int = 0
+        root = memory_dir
+        if root is None:
+            try:
+                from .settings import get_settings
+                root = get_settings().memory_dir
+            except Exception:
+                root = Path.home() / ".ata_coder" / "memory"
+        self.memory_dir = Path(root)
+        self.memory_dir.mkdir(parents=True, exist_ok=True)
+        self._index_path = self.memory_dir / "MEMORY.md"
+        # Index first, then the individual memory files.
+        self._load_index()
+        self._load_all()
+    # ── Loading ───────────────────────────────────────────────────────────
+    def _load_index(self) -> None:
+        """Read MEMORY.md into ``self._index_entries`` (stripped, non-blank lines).
+        If the file does not exist an empty index is written instead.  A read
+        failure is logged and leaves the entry list empty.
+        """
+        if not self._index_path.exists():
+            # Create empty index
+            self._write_index()
+            return
+        try:
+            with open(self._index_path, "r", encoding="utf-8") as handle:
+                stripped = (raw_line.strip() for raw_line in handle)
+                self._index_entries = [text for text in stripped if text]
+            logger.debug("Loaded MEMORY.md: %d entries", len(self._index_entries))
+        except Exception as e:
+            logger.warning("Failed to load MEMORY.md: %s", e)
+            self._index_entries = []
+    def _load_all(self) -> None:
+        """Parse every ``*.md`` file in the directory (except MEMORY.md) into memory.
+        Entries are keyed by the ``name`` found in the file's frontmatter.
+        Files that cannot be read or parsed are logged and skipped.
+        """
+        if not self.memory_dir.exists():
+            return
+        for md_file in self.memory_dir.glob("*.md"):
+            if md_file.name == "MEMORY.md":
+                continue
+            try:
+                with open(md_file, "r", encoding="utf-8") as handle:
+                    text = handle.read()
+                parsed = Memory.from_frontmatter(text)
+                if not parsed:
+                    logger.warning("Failed to parse memory file: %s", md_file.name)
+                    continue
+                self._memories[parsed.name] = parsed
+            except Exception as e:
+                logger.warning("Failed to read memory file %s: %s", md_file.name, e)
+        logger.debug("Loaded %d memories from disk", len(self._memories))
+    def _write_index(self) -> None:
+        """Write ``self._index_entries`` to the index file via a temp file.
+        Entries are written one per line to ``MEMORY.tmp`` next to the index,
+        which is then moved over the index.  Failures are logged, not raised,
+        and the temp file is removed so a failed write leaves nothing behind.
+        """
+        tmp = self._index_path.with_suffix(".tmp")
+        try:
+            with open(tmp, "w", encoding="utf-8") as f:
+                f.writelines(f"{entry}\n" for entry in self._index_entries)
+            # os.replace overwrites an existing destination on both POSIX and
+            # Windows (a plain rename fails on Windows when the target exists).
+            os.replace(tmp, self._index_path)
+        except Exception as e:
+            logger.warning("Failed to write MEMORY.md: %s", e)
+            try:
+                os.unlink(tmp)
+            except OSError:
+                pass  # temp file was never created or is already gone
+    # ── CRUD operations ──────────────────────────────────────────────────
+    def add(self, memory: Memory) -> Memory:
+        """
+        Persist *memory*, replacing any stored entry that has the same name.
+        An update keeps the stored entry's ``created`` value; a new entry keeps
+        a caller-supplied ``created`` or gets the current UTC time.  ``updated``
+        is always set to the current time.  The memory file is written first
+        (a write error is logged and re-raised), then the index line for the
+        file is replaced or appended and the index rewritten.
+        """
+        with self._lock:
+            self._idf_cache = None  # invalidate IDF cache
+            stamp = datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
+            previous = self._memories.get(memory.name)
+            memory.created = previous.created if previous else (memory.created or stamp)
+            memory.updated = stamp
+            # Write memory file
+            target = self.memory_dir / memory.file_path
+            try:
+                with open(target, "w", encoding="utf-8") as out:
+                    out.write(memory.to_frontmatter())
+            except Exception as e:
+                logger.error("Failed to write memory file %s: %s", target, e)
+                raise
+            self._memories[memory.name] = memory
+            # Update index: the link target identifies this memory's line
+            entry = f"- [{memory.description}]({memory.file_path})"
+            marker = f"]({memory.file_path})"
+            slot = next(
+                (i for i, line in enumerate(self._index_entries) if marker in line),
+                None,
+            )
+            if slot is None:
+                self._index_entries.append(entry)
+            else:
+                self._index_entries[slot] = entry
+            self._write_index()
+        logger.info("Saved memory: %s", memory.name)
+        return memory
+    def save_batch(self, memories: list[Memory]) -> list[Memory]:
+        """Save multiple memories efficiently — writes index only once.
+        Each memory is stamped the same way ``add`` does it (``created`` kept
+        from an existing entry of the same name or defaulted to now,
+        ``updated`` set to now) so the in-memory objects agree with what is
+        written to disk.  A memory whose file cannot be written is logged and
+        skipped; the rest are still saved.  Returns the input list unchanged
+        in length and order.
+        """
+        saved = 0
+        with self._lock:
+            self._idf_cache = None
+            now = datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
+            for memory in memories:
+                existing = self._memories.get(memory.name)
+                memory.created = existing.created if existing else (memory.created or now)
+                memory.updated = now
+                file_path = self.memory_dir / memory.file_path
+                try:
+                    with open(file_path, "w", encoding="utf-8") as f:
+                        f.write(memory.to_frontmatter())
+                except Exception as e:
+                    logger.error("Failed to write memory file %s: %s", file_path, e)
+                    continue
+                self._memories[memory.name] = memory
+                saved += 1
+            # Rebuild and write index once
+            self._rebuild_index()
+        # Report what was actually written, not what was requested.
+        logger.info("Batch saved %d memories", saved)
+        return memories
+    def _rebuild_index(self) -> None:
+        """Regenerate every index line from the loaded memories and write the index."""
+        rebuilt: list[str] = []
+        for mem in self._memories.values():
+            rebuilt.append(f"- [{mem.description}]({mem.file_path})")
+        self._index_entries = rebuilt
+        self._write_index()
+    def flush(self) -> None:
+        """Force-write the index to disk (call before shutdown).
+        Holds the store lock while rebuilding, like add/save_batch/delete do,
+        because the rebuild iterates the memories and replaces the index list.
+        """
+        with self._lock:
+            self._rebuild_index()
+    def get(self, name: str) -> Memory | None:
+        """Return the loaded memory whose name (slug) is *name*, or None."""
+        loaded = self._memories
+        return loaded.get(name)
+    def delete(self, name: str) -> bool:
+        """Remove the memory called *name*; return False when no such memory is loaded.
+        Removes the memory's file if it exists (a failure there is only logged),
+        drops its line from the index and rewrites the index.
+        """
+        with self._lock:
+            self._idf_cache = None
+            removed = self._memories.pop(name, None)
+            if removed is None:
+                return False
+            target = self.memory_dir / removed.file_path
+            if target.exists():
+                try:
+                    target.unlink()
+                except Exception as e:
+                    logger.warning("Failed to delete memory file: %s", e)
+            # Index lines are identified by their link target.
+            marker = f"]({removed.file_path})"
+            kept: list[str] = []
+            for line in self._index_entries:
+                if marker not in line:
+                    kept.append(line)
+            self._index_entries = kept
+            self._write_index()
+        logger.info("Deleted memory: %s", name)
+        return True
+    def list_all(self, memory_type: str | None = None) -> list[Memory]:
+        """Return memories newest-first by ``updated``, optionally only those of *memory_type*."""
+        if memory_type:
+            selected = [m for m in self._memories.values() if m.memory_type == memory_type]
+        else:
+            selected = list(self._memories.values())
+        # str() keeps the comparison valid when ``updated`` is not a string.
+        selected.sort(key=lambda m: str(m.updated or ""), reverse=True)
+        return selected
+    def search(self, query: str) -> list[Memory]:
+        """Return the memories that score against *query*, best match first.
+        Scoring is delegated to ``_search_scored``; only the memories are returned.
+        """
+        ranked: list[Memory] = []
+        for _score, hit in self._search_scored(query):
+            ranked.append(hit)
+        return ranked
+    def _search_scored(self, query: str) -> list[tuple[float, Memory]]:
+        """
+        Score every memory against *query* and return ``(score, memory)`` pairs,
+        highest score first.  Memories that match nothing are omitted.
+        Scoring:
+        - phrase bonus when the whole (stripped, lower-cased) query is a
+          substring of the name (+15), description (+8) or content (+4);
+        - per query token, an IDF-weighted bonus when the token is a word of
+          the name (x6, hyphens split), description (x3) or content (x1.5);
+        - +2 for a memory that already matched and was updated in the last hour.
+        A blank query returns ``[]``.
+        """
+        import math as _math
+        from datetime import timedelta
+        if not self._memories:
+            return []
+        query_lower = query.strip().lower()
+        query_tokens = set(query_lower.split())
+        if not query_tokens:
+            # "" is a substring of every field, so a blank query would hand
+            # every memory the full phrase bonus.
+            return []
+        # ── Pre-compute document frequencies for IDF weighting ──────────
+        # Use cached IDF when available; rebuild only when memories change.
+        doc_count = len(self._memories)
+        if self._idf_cache is None or self._idf_doc_count != doc_count:
+            token_df: dict[str, int] = {}
+            for m in self._memories.values():
+                text = f"{m.name} {m.description} {m.content}".lower()
+                # set(): each document counts once per distinct word
+                for word in set(text.split()):
+                    token_df[word] = token_df.get(word, 0) + 1
+            self._idf_cache = {
+                t: _math.log((doc_count + 1) / (df + 1)) + 1.0
+                for t, df in token_df.items()
+            }
+            self._idf_doc_count = doc_count
+        idf_map = self._idf_cache
+        recent_cutoff = datetime.now(timezone.utc) - timedelta(hours=1)
+        # ── Score each memory ──────────────────────────────────────────
+        results: list[tuple[float, Memory]] = []
+        for memory in self._memories.values():
+            score = 0.0
+            name_lower = memory.name.lower()
+            desc_lower = memory.description.lower()
+            content_lower = memory.content.lower()
+            # Phrase bonus: full query appears as substring
+            if query_lower in name_lower:
+                score += 15.0
+            if query_lower in desc_lower:
+                score += 8.0
+            if query_lower in content_lower:
+                score += 4.0
+            # Token-level IDF-weighted match; word sets are built once per memory
+            name_words = set(name_lower.replace("-", " ").split())
+            desc_words = set(desc_lower.split())
+            content_words = set(content_lower.split())
+            for token in query_tokens:
+                w = idf_map.get(token, 1.0)  # unseen tokens get neutral weight
+                if token in name_words:
+                    score += 6.0 * w   # name match — highest signal
+                if token in desc_words:
+                    score += 3.0 * w   # description match — medium signal
+                if token in content_words:
+                    score += 1.5 * w   # content match — lower signal
+            if score <= 0:
+                # No textual match: recency alone must not turn this into a hit.
+                continue
+            # Recency boost: matching memories touched in the last hour get +2
+            try:
+                updated = memory.updated or ""
+                if updated:
+                    dt = datetime.fromisoformat(updated.replace("Z", "+00:00"))
+                    if dt > recent_cutoff:
+                        score += 2.0
+            except (ValueError, TypeError):
+                pass  # unparseable, naive or non-string timestamp: no boost
+            results.append((score, memory))
+        results.sort(key=lambda x: x[0], reverse=True)
+        return results
+    # ── Recall for context ───────────────────────────────────────────────
+    def recall_context(self, user_input: str, max_memories: int = 5,
+                       min_score: float = 3.0) -> str:
+        """
+        Build a "Relevant Memories" markdown section for *user_input*.
+        Takes the scored search results, keeps those with a score of at least
+        *min_score* and cuts the list to *max_memories*.  Each kept memory has
+        ``last_accessed`` and ``access_count`` updated in its metadata (in
+        memory only).  Content longer than 500 characters is truncated with
+        "...", and any [[wiki-style]] links are listed on a "Related:" line.
+        Returns "" when nothing qualifies.
+        """
+        if not self._memories:
+            return ""
+        # Re-use the scored search
+        qualifying: list[Memory] = []
+        for score, candidate in self._search_scored(user_input):
+            if score >= min_score:
+                qualifying.append(candidate)
+        relevant = qualifying[:max_memories]
+        if not relevant:
+            return ""
+        # Bump access tracking
+        stamp = datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
+        for mem in relevant:
+            mem.metadata["last_accessed"] = stamp
+            mem.metadata["access_count"] = mem.metadata.get("access_count", 0) + 1
+        sections = ["\n## Relevant Memories"]
+        for mem in relevant:
+            body = mem.content if len(mem.content) <= 500 else mem.content[:500] + "..."
+            sections.append(f"\n### {mem.description}")
+            sections.append(body)
+            # Links are taken from the full content, not the truncated body.
+            links = self._extract_links(mem.content)
+            if links:
+                sections.append(f"Related: {', '.join(links)}")
+        return "\n".join(sections)
+    def _extract_links(self, content: str) -> list[str]:
+        """Return the targets of all [[wiki-style]] links in *content*, in order."""
+        targets: list[str] = []
+        for link in re.finditer(r"\[\[([^\]]+)\]\]", content):
+            targets.append(link.group(1))
+        return targets
+    def get_memory_context(self, max_total: int = 8) -> str:
+        """
+        Build a "Persistent Memory" markdown section from the most recently
+        updated memories.
+        The *max_total* newest memories are grouped by type and listed under
+        User, Project, Feedback and Reference headings (in that order), at
+        most three descriptions per heading.  Memories of any other type are
+        not listed.  Returns "" when the store is empty.
+        """
+        if not self._memories:
+            return ""
+        newest_first = sorted(
+            self._memories.values(),
+            key=lambda m: str(m.updated or ""),
+            reverse=True,
+        )
+        recent = newest_first[:max_total]
+        if not recent:
+            return ""
+        grouped: dict[str, list[Memory]] = {}
+        for m in recent:
+            grouped.setdefault(m.memory_type, []).append(m)
+        out = ["\n## Persistent Memory"]
+        for mtype in ("user", "project", "feedback", "reference"):
+            bucket = grouped.get(mtype)
+            if not bucket:
+                continue
+            out.append(f"\n### {mtype.title()}")
+            out.extend(f"- {m.description}" for m in bucket[:3])
+        return "\n".join(out)
+    # ── Auto-suggest from conversation ──────────────────────────────────
+    def suggest_from_conversation(self, user_messages: list[str],
+                                  file_ops: list[str] | None = None,
+                                  tool_errors: list[str] | None = None) -> list[str]:
+        """Scan recent messages and tool errors for facts worth saving as memories.
+        Four heuristics run in order, each appending human-readable suggestions:
+        explicit "remember"-style requests, mentions of known embedded
+        toolchains, serial/device port names, and tool errors that point at a
+        blocked or missing command.  At most the first five suggestions are
+        returned.  *file_ops* is accepted but not used.
+        """
+        import re as _re
+        remember_cues = ("remember", "save this", "don't forget",
+                         "记", "记住", "备忘")
+        toolchains = ("idf.py", "esp-idf", "esptool", "cmake", "platformio",
+                      "arduino", "stm32", "nrf", "zephyr")
+        port_pattern = _re.compile(r'COM\d+|/dev/tty\w+')
+        quoted_word = _re.compile(r"'(\w+)'")
+        found: list[str] = []
+        # Heuristic 1: explicit "remember …" or "save …" directives
+        found.extend(
+            f"User asked to remember: {msg[:120]}"
+            for msg in user_messages
+            if any(cue in msg.lower() for cue in remember_cues)
+        )
+        # Heuristic 2: first known toolchain keyword per message
+        for msg in user_messages:
+            haystack = msg.lower()
+            first = next((kw for kw in toolchains if kw.lower() in haystack), None)
+            if first is not None:
+                found.append(f"Project uses {first}: {msg[:120]}")
+        # Heuristic 3: device ports / serial config
+        for msg in user_messages:
+            port = port_pattern.search(msg)
+            if port:
+                found.append(f"Device port {port.group()}: {msg[:120]}")
+        # Heuristic 4: operational learnings from tool errors
+        for err in tool_errors or ():
+            text = err.lower()
+            if "not in the allowed list" in text:
+                found.append(
+                    "ops: Some shell commands are blocked by the whitelist. "
+                    "Use python -c \"import subprocess; subprocess.run([...], cwd='...')\" "
+                    "as a workaround for tools not on PATH."
+                )
+                break  # one whitelist hint is enough; later errors are ignored
+            if "command not found" in text or "not recognized" in text:
+                # Extract the command name from the first quoted word, if any
+                named = quoted_word.search(err)
+                cmd = named.group(1) if named else "?"
+                found.append(
+                    f"ops: Command '{cmd}' not found — use full path or "
+                    f"python subprocess wrapper."
+                )
+        return found[:5]  # cap to avoid overwhelming the user
+# ── Convenience functions ────────────────────────────────────────────────────
+def create_memory(
+    name: str,
+    description: str,
+    content: str,
+    memory_type: str = "reference",
+    store: MemoryStore | None = None,
+) -> Memory:
+    """Build a Memory from the given fields and save it through a store.
+    *memory_type* is recorded as ``metadata["type"]``.  When *store* is None
+    the store returned by ``get_memory_store()`` is used.  Returns whatever
+    ``store.add`` returns.
+    """
+    target_store = store if store is not None else get_memory_store()
+    return target_store.add(
+        Memory(
+            name=name,
+            description=description,
+            content=content,
+            metadata={"type": memory_type},
+        )
+    )
+# ── Global instance ──────────────────────────────────────────────────────────
+_memory_store: MemoryStore | None = None
+def get_memory_store(memory_dir: str | None = None) -> MemoryStore:
+    """Return the module-wide MemoryStore, creating it on the first call.
+    *memory_dir* is only used when the store is created; on later calls it
+    is ignored and the existing store is returned.
+    """
+    global _memory_store
+    store = _memory_store
+    if store is None:
+        store = MemoryStore(memory_dir)
+        _memory_store = store
+    return store

ata_coder/model_registry.py ADDED Viewed

@@ -0,0 +1,134 @@
+"""
+Shared model metadata — single source of truth for pricing, URL building,
+and model info. Eliminates the duplicated price tables and URL construction
+that were scattered across commands.py, repl_ui.py, main.py, and llm_client.py.
+"""
+from dataclasses import dataclass
+@dataclass(frozen=True)
+class ModelInfo:
+    """Immutable metadata for a known model.
+    Holds the model identifier, its input and output token prices, and the
+    provider label.  The dataclass is frozen, so fields cannot be reassigned
+    after construction.
+    """
+    model_id: str                # identifier used as the registry key / lookup string
+    input_price_per_1m: float   # USD per 1M input tokens
+    output_price_per_1m: float   # USD per 1M output tokens
+    provider: str = ""           # "openai" | "deepseek" | "anthropic" | "local"
+# ── Registry ─────────────────────────────────────────────────────────────────
+# Known models keyed by model id.  Each entry is
+# ModelInfo(model_id, input USD per 1M tokens, output USD per 1M tokens, provider).
+# NOTE(review): prices are hard-coded here — confirm against current provider price lists.
+MODEL_REGISTRY: dict[str, ModelInfo] = {
+    "gpt-4o":              ModelInfo("gpt-4o",              2.50,  10.00, "openai"),
+    "gpt-4o-mini":         ModelInfo("gpt-4o-mini",         0.15,   0.60, "openai"),
+    "gpt-4-turbo":         ModelInfo("gpt-4-turbo",        10.00,  30.00, "openai"),
+    "gpt-4":               ModelInfo("gpt-4",              30.00,  60.00, "openai"),
+    "deepseek-chat":       ModelInfo("deepseek-chat",       0.14,   0.28, "deepseek"),
+    "deepseek-coder":      ModelInfo("deepseek-coder",      0.14,   0.28, "deepseek"),
+    "deepseek-v4-pro":     ModelInfo("deepseek-v4-pro",     0.14,   0.28, "deepseek"),
+    "deepseek-v4-flash":   ModelInfo("deepseek-v4-flash",   0.14,   0.28, "deepseek"),
+    "claude-sonnet-4-6":   ModelInfo("claude-sonnet-4-6",   3.00,  15.00, "anthropic"),
+    "claude-opus-4-8":     ModelInfo("claude-opus-4-8",    15.00,  75.00, "anthropic"),
+    "qwen2.5-coder-14b":   ModelInfo("qwen2.5-coder-14b",   0.00,   0.00, "local"),
+}
+# Fallback prices (USD per 1M tokens) used when a model is not in the registry
+_FALLBACK_INPUT_PRICE = 1.00
+_FALLBACK_OUTPUT_PRICE = 5.00
+def get_model_info(model_id: str) -> ModelInfo:
+    """Resolve *model_id* to a ModelInfo, falling back to default prices.
+    Lookup steps, first hit wins:
+    1. *model_id* is a registry key.
+    2. *model_id* with any ``[...]`` part removed (e.g. ``[1m]``) is a registry key.
+    3. Some registry key occurs inside *model_id*; keys are tried longest
+       first so that "gpt-4o" is preferred over "gpt-4".
+    Otherwise a ModelInfo with the fallback prices and provider "unknown"
+    is returned.
+    """
+    import re
+    known = MODEL_REGISTRY.get(model_id)
+    if known is not None:
+        return known
+    # Strip common suffixes that providers append: "[1m]", "[context]", etc.
+    stripped = re.sub(r'\[.*\]', '', model_id).strip()
+    known = MODEL_REGISTRY.get(stripped)
+    if known is not None:
+        return known
+    longest_first = sorted(MODEL_REGISTRY, key=len, reverse=True)
+    contained = next((key for key in longest_first if key in model_id), None)
+    if contained is not None:
+        return MODEL_REGISTRY[contained]
+    return ModelInfo(model_id, _FALLBACK_INPUT_PRICE, _FALLBACK_OUTPUT_PRICE, "unknown")
+def get_model_cost(model_id: str) -> tuple[float, float]:
+    """Return the ``(input, output)`` prices in USD per 1M tokens for *model_id*."""
+    resolved = get_model_info(model_id)
+    prices = (resolved.input_price_per_1m, resolved.output_price_per_1m)
+    return prices
+def estimate_cost(token_count: int, model_id: str,
+                  input_ratio: float = 0.7) -> float:
+    """
+    Estimate the USD cost of *token_count* tokens on *model_id*.
+    The count is split into input tokens (``int(token_count * input_ratio)``,
+    70% by default) and output tokens (the remainder), and each part is
+    priced at the model's per-1M-token rate.
+    """
+    inp_price, out_price = get_model_cost(model_id)
+    input_tokens = int(token_count * input_ratio)
+    output_tokens = token_count - input_tokens
+    input_cost = (input_tokens / 1_000_000) * inp_price
+    output_cost = (output_tokens / 1_000_000) * out_price
+    return input_cost + output_cost
+# ── URL building ─────────────────────────────────────────────────────────────
+def build_api_url(base_url: str, endpoint: str = "chat/completions") -> str:
+    """
+    Join *base_url* and *endpoint* into an OpenAI-compatible API URL.
+    Trailing slashes on the base are dropped, and "/v1" is appended when the
+    base contains no "/v<digits>" segment:
+        https://api.openai.com          → https://api.openai.com/v1/chat/completions
+        https://api.deepseek.com/v1     → https://api.deepseek.com/v1/chat/completions
+        https://api.deepseek.com/v2     → https://api.deepseek.com/v2/chat/completions
+    With endpoint="" only the versioned base is returned.
+    """
+    import re
+    versioned = base_url.rstrip("/")
+    has_version = re.search(r'/v\d+', versioned) is not None
+    if not has_version:
+        versioned = versioned + "/v1"
+    if not endpoint:
+        return versioned
+    return f"{versioned}/{endpoint.lstrip('/')}"
+def build_models_url(base_url: str) -> str:
+    """Build the /models endpoint URL from a base URL.
+    Trailing slashes are dropped.  A base that already contains a
+    "/v<digits>" segment gets "/models" appended; any other base gets
+    "/v1/models".  The version test is the same one build_api_url uses, so
+    bases such as ".../v3" are not given a second "/v1".
+    """
+    import re
+    base = base_url.rstrip("/")
+    if re.search(r'/v\d+', base):
+        return f"{base}/models"
+    return f"{base}/v1/models"
+# ── Model list from API ──────────────────────────────────────────────────────
+def fetch_available_models(base_url: str, api_key: str, timeout: float = 10.0) -> list[str]:
+    """
+    Ask the API's /models endpoint which models are available.
+    Sends a bearer-authenticated GET and returns the ``id`` of every entry
+    under the response's ``data`` key ("" for an entry without an id).  Any
+    error during the request or while reading the response yields ``[]``.
+    .. note::
+       The request is a synchronous ``httpx.get()``.  Callers inside an async
+       event loop should use ``asyncio.to_thread(fetch_available_models, ...)``
+       to avoid blocking the loop.
+    """
+    import httpx
+    endpoint = build_models_url(base_url)
+    auth = {"Authorization": f"Bearer {api_key}"}
+    try:
+        response = httpx.get(endpoint, headers=auth, timeout=timeout)
+        response.raise_for_status()
+        listing = response.json().get("data", [])
+        ids = []
+        for item in listing:
+            ids.append(item.get("id", ""))
+        return ids
+    except Exception:
+        return []