PyPI - llmcode-cli - Versions diffs - 1.0.0__py3-none-any.whl - Mend

llmcode-cli 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (212) hide show

llm_code/__init__.py +2 -0
llm_code/analysis/__init__.py +6 -0
llm_code/analysis/cache.py +33 -0
llm_code/analysis/engine.py +256 -0
llm_code/analysis/go_rules.py +114 -0
llm_code/analysis/js_rules.py +84 -0
llm_code/analysis/python_rules.py +311 -0
llm_code/analysis/rules.py +140 -0
llm_code/analysis/rust_rules.py +108 -0
llm_code/analysis/universal_rules.py +111 -0
llm_code/api/__init__.py +0 -0
llm_code/api/client.py +90 -0
llm_code/api/errors.py +73 -0
llm_code/api/openai_compat.py +390 -0
llm_code/api/provider.py +35 -0
llm_code/api/sse.py +52 -0
llm_code/api/types.py +140 -0
llm_code/cli/__init__.py +0 -0
llm_code/cli/commands.py +70 -0
llm_code/cli/image.py +122 -0
llm_code/cli/render.py +214 -0
llm_code/cli/status_line.py +79 -0
llm_code/cli/streaming.py +92 -0
llm_code/cli/tui_main.py +220 -0
llm_code/computer_use/__init__.py +11 -0
llm_code/computer_use/app_detect.py +49 -0
llm_code/computer_use/app_tier.py +57 -0
llm_code/computer_use/coordinator.py +99 -0
llm_code/computer_use/input_control.py +71 -0
llm_code/computer_use/screenshot.py +93 -0
llm_code/cron/__init__.py +13 -0
llm_code/cron/parser.py +145 -0
llm_code/cron/scheduler.py +135 -0
llm_code/cron/storage.py +126 -0
llm_code/enterprise/__init__.py +1 -0
llm_code/enterprise/audit.py +59 -0
llm_code/enterprise/auth.py +26 -0
llm_code/enterprise/oidc.py +95 -0
llm_code/enterprise/rbac.py +65 -0
llm_code/harness/__init__.py +5 -0
llm_code/harness/config.py +33 -0
llm_code/harness/engine.py +129 -0
llm_code/harness/guides.py +41 -0
llm_code/harness/sensors.py +68 -0
llm_code/harness/templates.py +84 -0
llm_code/hida/__init__.py +1 -0
llm_code/hida/classifier.py +187 -0
llm_code/hida/engine.py +49 -0
llm_code/hida/profiles.py +95 -0
llm_code/hida/types.py +28 -0
llm_code/ide/__init__.py +1 -0
llm_code/ide/bridge.py +80 -0
llm_code/ide/detector.py +76 -0
llm_code/ide/server.py +169 -0
llm_code/logging.py +29 -0
llm_code/lsp/__init__.py +0 -0
llm_code/lsp/client.py +298 -0
llm_code/lsp/detector.py +42 -0
llm_code/lsp/manager.py +56 -0
llm_code/lsp/tools.py +288 -0
llm_code/marketplace/__init__.py +0 -0
llm_code/marketplace/builtin_registry.py +102 -0
llm_code/marketplace/installer.py +162 -0
llm_code/marketplace/plugin.py +78 -0
llm_code/marketplace/registry.py +360 -0
llm_code/mcp/__init__.py +0 -0
llm_code/mcp/bridge.py +87 -0
llm_code/mcp/client.py +117 -0
llm_code/mcp/health.py +120 -0
llm_code/mcp/manager.py +214 -0
llm_code/mcp/oauth.py +219 -0
llm_code/mcp/transport.py +254 -0
llm_code/mcp/types.py +53 -0
llm_code/remote/__init__.py +0 -0
llm_code/remote/client.py +136 -0
llm_code/remote/protocol.py +22 -0
llm_code/remote/server.py +275 -0
llm_code/remote/ssh_proxy.py +56 -0
llm_code/runtime/__init__.py +0 -0
llm_code/runtime/auto_commit.py +56 -0
llm_code/runtime/auto_diagnose.py +62 -0
llm_code/runtime/checkpoint.py +70 -0
llm_code/runtime/checkpoint_recovery.py +142 -0
llm_code/runtime/compaction.py +35 -0
llm_code/runtime/compressor.py +415 -0
llm_code/runtime/config.py +533 -0
llm_code/runtime/context.py +49 -0
llm_code/runtime/conversation.py +921 -0
llm_code/runtime/cost_tracker.py +126 -0
llm_code/runtime/dream.py +127 -0
llm_code/runtime/file_protection.py +150 -0
llm_code/runtime/hardware.py +85 -0
llm_code/runtime/hooks.py +223 -0
llm_code/runtime/indexer.py +230 -0
llm_code/runtime/knowledge_compiler.py +232 -0
llm_code/runtime/memory.py +132 -0
llm_code/runtime/memory_layers.py +467 -0
llm_code/runtime/memory_lint.py +252 -0
llm_code/runtime/model_aliases.py +37 -0
llm_code/runtime/ollama.py +93 -0
llm_code/runtime/overlay.py +124 -0
llm_code/runtime/permissions.py +200 -0
llm_code/runtime/plan.py +45 -0
llm_code/runtime/prompt.py +238 -0
llm_code/runtime/repo_map.py +174 -0
llm_code/runtime/sandbox.py +116 -0
llm_code/runtime/session.py +268 -0
llm_code/runtime/skill_resolver.py +61 -0
llm_code/runtime/skills.py +133 -0
llm_code/runtime/speculative.py +75 -0
llm_code/runtime/streaming_executor.py +216 -0
llm_code/runtime/telemetry.py +196 -0
llm_code/runtime/token_budget.py +26 -0
llm_code/runtime/vcr.py +142 -0
llm_code/runtime/vision.py +102 -0
llm_code/swarm/__init__.py +1 -0
llm_code/swarm/backend_subprocess.py +108 -0
llm_code/swarm/backend_tmux.py +103 -0
llm_code/swarm/backend_worktree.py +306 -0
llm_code/swarm/checkpoint.py +74 -0
llm_code/swarm/coordinator.py +236 -0
llm_code/swarm/mailbox.py +88 -0
llm_code/swarm/manager.py +202 -0
llm_code/swarm/memory_sync.py +80 -0
llm_code/swarm/recovery.py +21 -0
llm_code/swarm/team.py +67 -0
llm_code/swarm/types.py +31 -0
llm_code/task/__init__.py +16 -0
llm_code/task/diagnostics.py +93 -0
llm_code/task/manager.py +162 -0
llm_code/task/types.py +112 -0
llm_code/task/verifier.py +104 -0
llm_code/tools/__init__.py +0 -0
llm_code/tools/agent.py +145 -0
llm_code/tools/agent_roles.py +82 -0
llm_code/tools/base.py +94 -0
llm_code/tools/bash.py +565 -0
llm_code/tools/computer_use_tools.py +278 -0
llm_code/tools/coordinator_tool.py +75 -0
llm_code/tools/cron_create.py +90 -0
llm_code/tools/cron_delete.py +49 -0
llm_code/tools/cron_list.py +51 -0
llm_code/tools/deferred.py +92 -0
llm_code/tools/dump.py +116 -0
llm_code/tools/edit_file.py +282 -0
llm_code/tools/git_tools.py +531 -0
llm_code/tools/glob_search.py +112 -0
llm_code/tools/grep_search.py +144 -0
llm_code/tools/ide_diagnostics.py +59 -0
llm_code/tools/ide_open.py +58 -0
llm_code/tools/ide_selection.py +52 -0
llm_code/tools/memory_tools.py +138 -0
llm_code/tools/multi_edit.py +143 -0
llm_code/tools/notebook_edit.py +107 -0
llm_code/tools/notebook_read.py +81 -0
llm_code/tools/parsing.py +63 -0
llm_code/tools/read_file.py +154 -0
llm_code/tools/registry.py +58 -0
llm_code/tools/search_backends/__init__.py +56 -0
llm_code/tools/search_backends/brave.py +56 -0
llm_code/tools/search_backends/duckduckgo.py +129 -0
llm_code/tools/search_backends/searxng.py +71 -0
llm_code/tools/search_backends/tavily.py +73 -0
llm_code/tools/swarm_create.py +109 -0
llm_code/tools/swarm_delete.py +95 -0
llm_code/tools/swarm_list.py +44 -0
llm_code/tools/swarm_message.py +109 -0
llm_code/tools/task_close.py +79 -0
llm_code/tools/task_plan.py +79 -0
llm_code/tools/task_verify.py +90 -0
llm_code/tools/tool_search.py +65 -0
llm_code/tools/web_common.py +258 -0
llm_code/tools/web_fetch.py +223 -0
llm_code/tools/web_search.py +280 -0
llm_code/tools/write_file.py +118 -0
llm_code/tui/__init__.py +1 -0
llm_code/tui/app.py +2432 -0
llm_code/tui/chat_view.py +82 -0
llm_code/tui/chat_widgets.py +309 -0
llm_code/tui/header_bar.py +46 -0
llm_code/tui/input_bar.py +349 -0
llm_code/tui/keybindings.py +142 -0
llm_code/tui/marketplace.py +210 -0
llm_code/tui/status_bar.py +72 -0
llm_code/tui/theme.py +96 -0
llm_code/utils/__init__.py +0 -0
llm_code/utils/diff.py +111 -0
llm_code/utils/errors.py +70 -0
llm_code/utils/hyperlink.py +73 -0
llm_code/utils/notebook.py +179 -0
llm_code/utils/search.py +69 -0
llm_code/utils/text_normalize.py +28 -0
llm_code/utils/version_check.py +62 -0
llm_code/vim/__init__.py +4 -0
llm_code/vim/engine.py +51 -0
llm_code/vim/motions.py +172 -0
llm_code/vim/operators.py +183 -0
llm_code/vim/text_objects.py +139 -0
llm_code/vim/transitions.py +279 -0
llm_code/vim/types.py +68 -0
llm_code/voice/__init__.py +1 -0
llm_code/voice/languages.py +43 -0
llm_code/voice/recorder.py +136 -0
llm_code/voice/stt.py +36 -0
llm_code/voice/stt_anthropic.py +66 -0
llm_code/voice/stt_google.py +32 -0
llm_code/voice/stt_whisper.py +52 -0
llmcode_cli-1.0.0.dist-info/METADATA +524 -0
llmcode_cli-1.0.0.dist-info/RECORD +212 -0
llmcode_cli-1.0.0.dist-info/WHEEL +4 -0
llmcode_cli-1.0.0.dist-info/entry_points.txt +2 -0
llmcode_cli-1.0.0.dist-info/licenses/LICENSE +21 -0

llm_code/tools/task_close.py ADDED Viewed

@@ -0,0 +1,79 @@
+"""TaskCloseTool: finalize a task, write summary, transition to DONE."""
+from __future__ import annotations
+from pydantic import BaseModel
+from llm_code.task.manager import TaskLifecycleManager
+from llm_code.task.types import TaskStatus
+from llm_code.tools.base import PermissionLevel, Tool, ToolResult
+class TaskCloseInput(BaseModel):
+    """Argument model for the ``task_close`` tool."""
+    # Identifier of the task to close (required).
+    task_id: str
+    # Optional completion summary; defaults to the empty string.
+    summary: str = ""
+class TaskCloseTool(Tool):
+    """Close a task: transition to DONE and write a completion summary."""
+    def __init__(self, manager: TaskLifecycleManager) -> None:
+        self._manager = manager
+    @property
+    def name(self) -> str:
+        return "task_close"
+    @property
+    def description(self) -> str:
+        return (
+            "Close a completed task. Transitions from CLOSE to DONE and writes "
+            "a completion summary. The task must be in CLOSE status."
+        )
+    @property
+    def input_schema(self) -> dict:
+        return {
+            "type": "object",
+            "properties": {
+                "task_id": {"type": "string", "description": "The task ID to close"},
+                "summary": {"type": "string", "description": "Completion summary"},
+            },
+            "required": ["task_id"],
+        }
+    @property
+    def required_permission(self) -> PermissionLevel:
+        return PermissionLevel.WORKSPACE_WRITE
+    @property
+    def input_model(self) -> type[TaskCloseInput]:
+        return TaskCloseInput
+    def execute(self, args: dict) -> ToolResult:
+        task_id = args["task_id"]
+        summary = args.get("summary", "")
+        task = self._manager.get_task(task_id)
+        if task is None:
+            return ToolResult(output=f"Task not found: {task_id}", is_error=True)
+        try:
+            self._manager.transition(task_id, TaskStatus.DONE)
+        except ValueError as exc:
+            return ToolResult(output=str(exc), is_error=True)
+        # Write summary to task
+        if summary:
+            self._manager.update_task(task_id, plan=f"{task.plan}\n\n## Summary\n{summary}")
+        closed = self._manager.get_task(task_id)
+        files = ", ".join(closed.files_modified) if closed and closed.files_modified else "(none)"
+        return ToolResult(
+            output=(
+                f"Task {task_id} closed successfully.\n"
+                f"Title: {task.title}\n"
+                f"Files modified: {files}\n"
+                f"Summary: {summary or '(no summary)'}"
+            )
+        )

llm_code/tools/task_plan.py ADDED Viewed

@@ -0,0 +1,79 @@
+"""TaskPlanTool: create a task with title, plan, and goals."""
+from __future__ import annotations
+from pydantic import BaseModel
+from llm_code.task.manager import TaskLifecycleManager
+from llm_code.tools.base import PermissionLevel, Tool, ToolResult
+class TaskPlanInput(BaseModel):
+    """Argument model for the ``task_plan`` tool."""
+    # Short task title (required).
+    title: str
+    # Free-form implementation plan; defaults to the empty string.
+    plan: str = ""
+    # Completion goals; defaults to an empty list.
+    goals: list[str] = []
+class TaskPlanTool(Tool):
+    """Create a new structured task with a plan and goals."""
+    def __init__(self, manager: TaskLifecycleManager, session_id: str = "") -> None:
+        self._manager = manager
+        self._session_id = session_id
+    @property
+    def name(self) -> str:
+        return "task_plan"
+    @property
+    def description(self) -> str:
+        return (
+            "Create a new structured task. Provide a title, an implementation plan, "
+            "and measurable goals. The task starts in PLAN status."
+        )
+    @property
+    def input_schema(self) -> dict:
+        return {
+            "type": "object",
+            "properties": {
+                "title": {"type": "string", "description": "Short task title"},
+                "plan": {"type": "string", "description": "Step-by-step implementation plan"},
+                "goals": {
+                    "type": "array",
+                    "items": {"type": "string"},
+                    "description": "Measurable completion goals",
+                },
+            },
+            "required": ["title"],
+        }
+    @property
+    def required_permission(self) -> PermissionLevel:
+        return PermissionLevel.WORKSPACE_WRITE
+    @property
+    def input_model(self) -> type[TaskPlanInput]:
+        return TaskPlanInput
+    def execute(self, args: dict) -> ToolResult:
+        title = args.get("title", "").strip()
+        if not title:
+            return ToolResult(output="Error: title is required", is_error=True)
+        plan = args.get("plan", "")
+        goals = tuple(args.get("goals", []))
+        task = self._manager.create_task(
+            title=title,
+            plan=plan,
+            goals=goals,
+            session_id=self._session_id,
+        )
+        return ToolResult(
+            output=(
+                f"Created task {task.id}: {task.title}\n"
+                f"Status: {task.status.value}\n"
+                f"Goals: {', '.join(task.goals) if task.goals else '(none)'}\n"
+                f"Plan:\n{task.plan or '(no plan set)'}"
+            )
+        )

llm_code/tools/task_verify.py ADDED Viewed

@@ -0,0 +1,90 @@
+"""TaskVerifyTool: run verification checks on a task."""
+from __future__ import annotations
+from pydantic import BaseModel
+from llm_code.task.diagnostics import DiagnosticsEngine
+from llm_code.task.manager import TaskLifecycleManager
+from llm_code.task.verifier import Verifier
+from llm_code.tools.base import PermissionLevel, Tool, ToolResult
+class TaskVerifyInput(BaseModel):
+    """Argument model for the ``task_verify`` tool."""
+    # Identifier of the task to verify (required).
+    task_id: str
+class TaskVerifyTool(Tool):
+    """Run automated verification checks (pytest, ruff, file_exists) on a task."""
+    def __init__(
+        self,
+        manager: TaskLifecycleManager,
+        verifier: Verifier,
+        diagnostics: DiagnosticsEngine,
+    ) -> None:
+        self._manager = manager
+        self._verifier = verifier
+        self._diagnostics = diagnostics
+    @property
+    def name(self) -> str:
+        return "task_verify"
+    @property
+    def description(self) -> str:
+        return (
+            "Run automated verification checks on a task: pytest, ruff, and file_exists. "
+            "Returns check results and a recommended action (continue/replan/escalate)."
+        )
+    @property
+    def input_schema(self) -> dict:
+        return {
+            "type": "object",
+            "properties": {
+                "task_id": {"type": "string", "description": "The task ID to verify"},
+            },
+            "required": ["task_id"],
+        }
+    @property
+    def required_permission(self) -> PermissionLevel:
+        return PermissionLevel.READ_ONLY
+    @property
+    def input_model(self) -> type[TaskVerifyInput]:
+        return TaskVerifyInput
+    def is_read_only(self, args: dict) -> bool:
+        return True
+    def execute(self, args: dict) -> ToolResult:
+        task_id = args["task_id"]
+        task = self._manager.get_task(task_id)
+        if task is None:
+            return ToolResult(output=f"Task not found: {task_id}", is_error=True)
+        # Run automated checks
+        verify_result = self._verifier.verify(task)
+        # Append result to task history
+        self._manager.append_verify_result(task_id, verify_result)
+        # Run diagnostics
+        report = self._diagnostics.analyze(task, verify_result)
+        # Format output
+        lines = [f"Verification for task {task_id}: {task.title}"]
+        lines.append(f"Overall: {'PASSED' if verify_result.all_passed else 'FAILED'}")
+        lines.append("")
+        for check in verify_result.checks:
+            icon = "PASS" if check.passed else "FAIL"
+            lines.append(f"  [{icon}] {check.check_name}: {check.output[:200]}")
+        lines.append("")
+        lines.append(f"Recommendation: {report.recommendation}")
+        if report.summary:
+            lines.append(f"Diagnostic: {report.summary}")
+        if report.report_path:
+            lines.append(f"Full report: {report.report_path}")
+        return ToolResult(output="\n".join(lines))

llm_code/tools/tool_search.py ADDED Viewed

@@ -0,0 +1,65 @@
+"""ToolSearchTool — lets the LLM discover and unlock deferred tools."""
+from __future__ import annotations
+from llm_code.tools.base import PermissionLevel, Tool, ToolResult
+if True:
+    # Avoid circular imports; DeferredToolManager is a pure data class
+    from llm_code.tools.deferred import DeferredToolManager
+class ToolSearchTool(Tool):
+    """Search deferred tools by name/description and unlock matching ones."""
+    def __init__(self, manager: "DeferredToolManager") -> None:
+        self._manager = manager
+    @property
+    def name(self) -> str:
+        return "tool_search"
+    @property
+    def description(self) -> str:
+        return (
+            "Search for additional tools that are not currently visible. "
+            "Provide a query string to find tools by name or description. "
+            "Matching tools will be unlocked and available in subsequent turns."
+        )
+    @property
+    def input_schema(self) -> dict:
+        return {
+            "type": "object",
+            "properties": {
+                "query": {
+                    "type": "string",
+                    "description": "Search query to match against tool names and descriptions.",
+                }
+            },
+            "required": ["query"],
+        }
+    @property
+    def required_permission(self) -> PermissionLevel:
+        return PermissionLevel.READ_ONLY
+    def execute(self, args: dict) -> ToolResult:
+        query = args.get("query", "")
+        deferred = self._manager._deferred
+        matches = self._manager.search_tools(query, deferred)
+        if not matches:
+            return ToolResult(
+                output=f"No tools found matching '{query}'. "
+                "Try a different search term or use a broader query.",
+            )
+        # Unlock all matching tools
+        for d in matches:
+            self._manager.unlock_tool(d.name)
+        lines = [f"Found {len(matches)} tool(s) matching '{query}' (now unlocked):"]
+        for d in matches:
+            lines.append(f"  - {d.name}: {d.description}")
+        return ToolResult(output="\n".join(lines))

llm_code/tools/web_common.py ADDED Viewed

@@ -0,0 +1,258 @@
+"""Shared utilities for web tools (URL safety, caching, extraction)."""
+from __future__ import annotations
+import dataclasses
+import ipaddress
+import json
+import re
+import time
+from collections import OrderedDict
+from urllib.parse import urlparse
+@dataclasses.dataclass(frozen=True)
+class UrlSafetyResult:
+    """Result of URL safety classification."""
+    classification: str
+    reasons: tuple[str, ...] = ()
+    @property
+    def is_safe(self) -> bool:
+        """Return True if URL is safe to fetch."""
+        return self.classification == "safe"
+    @property
+    def is_blocked(self) -> bool:
+        """Return True if URL should be blocked."""
+        return self.classification == "blocked"
+    @property
+    def needs_confirm(self) -> bool:
+        """Return True if URL needs user confirmation."""
+        return self.classification == "needs_confirm"
+def classify_url(url: str) -> UrlSafetyResult:
+    """Classify URL as safe, needs_confirm, or blocked.
+    Rules:
+    - blocked: file://, private IPs, cloud metadata, invalid URLs, unsupported schemes
+    - needs_confirm: localhost, 127.0.0.1, IP-only URLs, non-standard ports
+    - safe: standard HTTP/HTTPS URLs to regular hosts
+    """
+    reasons: list[str] = []
+    try:
+        parsed = urlparse(url)
+    except Exception:
+        return UrlSafetyResult(classification="blocked", reasons=("invalid URL",))
+    # Check scheme
+    if not parsed.scheme:
+        return UrlSafetyResult(classification="blocked", reasons=("missing scheme",))
+    if parsed.scheme == "file":
+        return UrlSafetyResult(
+            classification="blocked", reasons=("file scheme",)
+        )
+    if parsed.scheme not in ("http", "https"):
+        return UrlSafetyResult(
+            classification="blocked", reasons=("unsupported scheme",)
+        )
+    # Check host
+    if not parsed.hostname:
+        return UrlSafetyResult(classification="blocked", reasons=("missing host",))
+    host = parsed.hostname
+    # Check for cloud metadata hosts (must be before IP check)
+    if host in ("169.254.169.254", "metadata.google.internal", "metadata.azure.com"):
+        return UrlSafetyResult(
+            classification="blocked", reasons=("metadata",)
+        )
+    # Try to parse as IP address
+    is_ip = False
+    try:
+        ip = ipaddress.ip_address(host)
+        is_ip = True
+        # Check for loopback IPv6 (blocked)
+        if ip.version == 6 and ip.is_loopback:
+            return UrlSafetyResult(
+                classification="blocked", reasons=("loopback",)
+            )
+        # Check for loopback IPv4 first (needs confirm)
+        if ip.is_loopback:
+            return UrlSafetyResult(
+                classification="needs_confirm", reasons=("127.0.0.1",)
+            )
+        # Check for private IPs (blocked)
+        if ip.is_private:
+            return UrlSafetyResult(
+                classification="blocked", reasons=("private IP",)
+            )
+    except ValueError:
+        # Not an IP address, check for localhost string
+        pass
+    # Check for localhost name (needs confirm)
+    if host == "localhost":
+        return UrlSafetyResult(
+            classification="needs_confirm", reasons=("localhost",)
+        )
+    # Check port
+    port = parsed.port
+    if is_ip and port is None:
+        # IP-only URL without port (needs confirm)
+        return UrlSafetyResult(
+            classification="needs_confirm", reasons=("IP-only",)
+        )
+    if port is not None and port not in (80, 443):
+        # Non-standard port (needs confirm)
+        return UrlSafetyResult(
+            classification="needs_confirm", reasons=("non-standard port",)
+        )
+    # All checks passed
+    return UrlSafetyResult(classification="safe", reasons=())
+@dataclasses.dataclass(frozen=True)
+class CacheEntry:
+    """Cache entry with TTL support."""
+    content: str
+    fetched_at: float
+    ttl: float = 900.0
+    @property
+    def is_expired(self) -> bool:
+        """Return True if entry has expired based on TTL."""
+        return time.time() - self.fetched_at > self.ttl
+class UrlCache:
+    """LRU cache for URL content with TTL support."""
+    def __init__(self, max_entries: int = 50, ttl: float = 900.0) -> None:
+        """Initialize cache.
+        Args:
+            max_entries: Maximum number of entries before evicting oldest.
+            ttl: Time-to-live for entries in seconds.
+        """
+        self.max_entries = max_entries
+        self.ttl = ttl
+        self._cache: OrderedDict[str, CacheEntry] = OrderedDict()
+    def get(self, url: str) -> str | None:
+        """Get cached content for URL, return None if not found or expired."""
+        if url not in self._cache:
+            return None
+        entry = self._cache[url]
+        if entry.is_expired:
+            del self._cache[url]
+            return None
+        # Move to end (LRU)
+        self._cache.move_to_end(url)
+        return entry.content
+    def put(self, url: str, content: str) -> None:
+        """Store content in cache. Evicts oldest entry if cache is full."""
+        # If updating existing, remove it first
+        if url in self._cache:
+            del self._cache[url]
+        # Add new entry
+        entry = CacheEntry(content=content, fetched_at=time.time(), ttl=self.ttl)
+        self._cache[url] = entry
+        # Evict oldest if over capacity
+        if len(self._cache) > self.max_entries:
+            self._cache.popitem(last=False)
+    def clear(self) -> None:
+        """Clear all cached entries."""
+        self._cache.clear()
+def _html_to_markdown(html: str, use_readability: bool = True) -> str:
+    """Convert HTML to markdown using readability and html2text.
+    Falls back gracefully if dependencies are missing.
+    """
+    content = html
+    # Try readability first if requested
+    if use_readability:
+        try:
+            from readability import Document
+            doc = Document(content)
+            content = doc.summary()
+        except ImportError:
+            pass
+    # Try html2text
+    try:
+        import html2text
+        converter = html2text.HTML2Text()
+        converter.ignore_links = False
+        return converter.handle(content)
+    except ImportError:
+        # Fallback: simple regex tag stripping
+        content = re.sub(r"<[^>]+>", "", content)
+        content = re.sub(r"\s+", " ", content).strip()
+        return content
+def extract_content(
+    body: str,
+    content_type: str,
+    raw: bool = False,
+    max_length: int = 50000,
+) -> str:
+    """Extract and format content based on content type.
+    Args:
+        body: Raw content body.
+        content_type: MIME type of content.
+        raw: If True, skip readability for HTML (just strip tags).
+        max_length: Maximum length before truncation.
+    Returns:
+        Formatted content, possibly truncated with "[truncated]" marker.
+    """
+    if not body:
+        return ""
+    result = ""
+    if content_type.startswith("application/json"):
+        try:
+            data = json.loads(body)
+            result = json.dumps(data, indent=2)
+        except json.JSONDecodeError:
+            result = body
+    elif "html" in content_type:
+        result = _html_to_markdown(body, use_readability=not raw)
+    else:
+        # Passthrough
+        result = body
+    # Truncate if needed
+    if len(result) > max_length:
+        truncated_marker = "\n\n[truncated]"
+        available = max_length - len(truncated_marker)
+        result = result[:available] + truncated_marker
+    return result