PyPI - aru-code - Versions diffs - 0.14.1__tar.gz → 0.16.0__tar.gz - Mend

aru-code 0.14.1__tar.gz → 0.16.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (58) hide show

{aru_code-0.14.1 → aru_code-0.16.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: aru-code
-Version: 0.14.1
+Version: 0.16.0
 Summary: A Claude Code clone built with Agno agents
 Author-email: Estevao <estevaofon@gmail.com>
 License-Expression: MIT
@@ -56,7 +56,7 @@ An intelligent coding assistant for the terminal, powered by LLMs and [Agno](htt
 - **Multi-Agent Architecture** — Specialized agents for planning, execution, and conversation
 - **Interactive CLI** — Streaming responses, multi-line paste, session management
 - **Image Support** — Attach images via `@` mentions for multimodal analysis (Claude, GPT-4o, Gemini)
-- **16 Integrated Tools** — File operations, code search, shell, web search, task delegation
+- **11 Integrated Tools** — File operations, code search, shell, web search, task delegation
 - **Task Planning** — Break down complex tasks into steps with automatic execution
 - **Multi-Provider** — Anthropic, OpenAI, Ollama, Groq, OpenRouter, DeepSeek, and others via custom configuration
 - **Custom Commands, Skills, and Agents** — Extend aru via the `.agents/` directory
@@ -369,7 +369,7 @@ Custom agents are Markdown files with YAML frontmatter stored in `.agents/agents
 name: Code Reviewer
 description: Review code for quality, bugs, and best practices
 model: anthropic/claude-sonnet-4-5
-tools: read_file, grep_search, glob_search, code_structure
+tools: read_file, grep_search, glob_search
 max_turns: 15
 mode: primary
 ---
@@ -479,19 +479,14 @@ Aru can load tools from MCP servers. Configure in `.aru/mcp_config.json`:
 ### File Operations
 - `read_file` — Reads files with line range support and binary detection
-- `read_file_smart` — Smart file reading focused on relevant snippets for the query
-- `write_file` / `write_files` — Writes single or batch files
-- `edit_file` / `edit_files` — Find-replace edits across multiple files
+- `read_file_smart` — Answers specific questions about a file without returning raw content
+- `write_file` — Writes content to files, creating directories as needed
+- `edit_file` — Find-and-replace edits on files
 ### Search & Discovery
 - `glob_search` — Find files by pattern (respects .gitignore)
 - `grep_search` — Content search with regex and file filtering
 - `list_directory` — Directory listing with gitignore filtering
-- `rank_files` — Multi-factor file relevance ranking (name, structure, recency)
-### Code Analysis
-- `code_structure` — Extracts classes, functions, imports via tree-sitter AST
-- `find_dependencies` — Analyzes import relationships between files
 ### Shell & Web
 - `bash` — Executes shell commands with permission gates
@@ -521,7 +516,7 @@ aru-code/
 │   │   ├── planner.py      # Planning agent
 │   │   └── executor.py     # Execution agent
 │   └── tools/
-│       ├── codebase.py     # 16 core tools
+│       ├── codebase.py     # 11 core tools
 │       ├── ast_tools.py    # Tree-sitter code analysis
 │       ├── ranker.py       # File relevance ranking
 │       ├── mcp_client.py   # MCP client

{aru_code-0.14.1 → aru_code-0.16.0}/README.md RENAMED Viewed

@@ -9,7 +9,7 @@ An intelligent coding assistant for the terminal, powered by LLMs and [Agno](htt
 - **Multi-Agent Architecture** — Specialized agents for planning, execution, and conversation
 - **Interactive CLI** — Streaming responses, multi-line paste, session management
 - **Image Support** — Attach images via `@` mentions for multimodal analysis (Claude, GPT-4o, Gemini)
-- **16 Integrated Tools** — File operations, code search, shell, web search, task delegation
+- **11 Integrated Tools** — File operations, code search, shell, web search, task delegation
 - **Task Planning** — Break down complex tasks into steps with automatic execution
 - **Multi-Provider** — Anthropic, OpenAI, Ollama, Groq, OpenRouter, DeepSeek, and others via custom configuration
 - **Custom Commands, Skills, and Agents** — Extend aru via the `.agents/` directory
@@ -322,7 +322,7 @@ Custom agents are Markdown files with YAML frontmatter stored in `.agents/agents
 name: Code Reviewer
 description: Review code for quality, bugs, and best practices
 model: anthropic/claude-sonnet-4-5
-tools: read_file, grep_search, glob_search, code_structure
+tools: read_file, grep_search, glob_search
 max_turns: 15
 mode: primary
 ---
@@ -432,19 +432,14 @@ Aru can load tools from MCP servers. Configure in `.aru/mcp_config.json`:
 ### File Operations
 - `read_file` — Reads files with line range support and binary detection
-- `read_file_smart` — Smart file reading focused on relevant snippets for the query
-- `write_file` / `write_files` — Writes single or batch files
-- `edit_file` / `edit_files` — Find-replace edits across multiple files
+- `read_file_smart` — Answers specific questions about a file without returning raw content
+- `write_file` — Writes content to files, creating directories as needed
+- `edit_file` — Find-and-replace edits on files
 ### Search & Discovery
 - `glob_search` — Find files by pattern (respects .gitignore)
 - `grep_search` — Content search with regex and file filtering
 - `list_directory` — Directory listing with gitignore filtering
-- `rank_files` — Multi-factor file relevance ranking (name, structure, recency)
-### Code Analysis
-- `code_structure` — Extracts classes, functions, imports via tree-sitter AST
-- `find_dependencies` — Analyzes import relationships between files
 ### Shell & Web
 - `bash` — Executes shell commands with permission gates
@@ -474,7 +469,7 @@ aru-code/
 │   │   ├── planner.py      # Planning agent
 │   │   └── executor.py     # Execution agent
 │   └── tools/
-│       ├── codebase.py     # 16 core tools
+│       ├── codebase.py     # 11 core tools
 │       ├── ast_tools.py    # Tree-sitter code analysis
 │       ├── ranker.py       # File relevance ranking
 │       ├── mcp_client.py   # MCP client

aru_code-0.16.0/aru/__init__.py ADDED Viewed

@@ -0,0 +1 @@
+__version__ = "0.16.0"

{aru_code-0.14.1 → aru_code-0.16.0}/aru/agent_factory.py RENAMED Viewed

@@ -21,12 +21,16 @@ def create_general_agent(
             in the system prompt. Placed in instructions so it's cacheable.
     """
     from agno.agent import Agent
-    from agno.compression.manager import CompressionManager
     from aru.tools.codebase import GENERAL_TOOLS
-    from aru.runtime import get_ctx
+    tools = GENERAL_TOOLS
-    extra = config.get_extra_instructions() if config else ""
+    # Only include AGENTS.md/project instructions on first turn to save ~1.6K tokens/turn
+    if config and not session.extra_instructions_sent:
+        extra = config.get_extra_instructions()
+        session.extra_instructions_sent = True
+    else:
+        extra = ""
     if env_context:
         extra = f"{extra}\n\n{env_context}" if extra else env_context
     model_ref = model_override or session.model_ref
@@ -34,15 +38,9 @@ def create_general_agent(
     return Agent(
         name="Aru",
         model=create_model(model_ref, max_tokens=8192),
-        tools=GENERAL_TOOLS,
+        tools=tools,
         instructions=_build_instructions("general", extra),
         markdown=True,
-        compress_tool_results=True,
-        compression_manager=CompressionManager(
-            model=create_model(get_ctx().small_model_ref, max_tokens=1024),
-            compress_tool_results=True,
-            compress_tool_results_limit=25,
-        ),
         tool_call_limit=20,
     )
@@ -52,10 +50,8 @@ def create_custom_agent_instance(agent_def: CustomAgent, session: Session,
                                   env_context: str = ""):
     """Create an Agno Agent from a CustomAgent definition."""
     from agno.agent import Agent
-    from agno.compression.manager import CompressionManager
     from aru.agents.base import BASE_INSTRUCTIONS
     from aru.tools.codebase import resolve_tools
-    from aru.runtime import get_ctx
     model_ref = agent_def.model or session.model_ref
     tools = resolve_tools(agent_def.tools)
@@ -74,11 +70,5 @@ def create_custom_agent_instance(agent_def: CustomAgent, session: Session,
         tools=tools,
         instructions=instructions,
         markdown=True,
-        compress_tool_results=True,
-        compression_manager=CompressionManager(
-            model=create_model(get_ctx().small_model_ref, max_tokens=1024),
-            compress_tool_results=True,
-            compress_tool_results_limit=25,
-        ),
         tool_call_limit=agent_def.max_turns or 20,
     )

{aru_code-0.14.1 → aru_code-0.16.0}/aru/agents/base.py RENAMED Viewed

@@ -35,7 +35,7 @@ PLANNER_ROLE = """\
 You are a software architect agent. Your job is to analyze codebases and create concise implementation plans.
 IMPORTANT: You are a READ-ONLY agent. You have NO tools to create, write, or edit files, or run shell commands. \
-Do NOT attempt to use write_file, edit_file, bash, run_command, or any write/exec tool — they do not exist in your toolkit. \
+Do NOT attempt to use write_file, edit_file, bash, or any write/exec tool — they do not exist in your toolkit. \
 To assess test coverage, read source files and test files directly — do NOT try to run pytest or any command. \
 Your sole output is the implementation plan. The executor agent will carry out the actual changes.
@@ -112,15 +112,12 @@ When all subtasks are done, STOP. Do not add extra actions beyond the task list.
 ## Subtask granularity — CRITICAL
 Each subtask should touch at most **3-4 files**. If the step involves many files, \
 split into subtasks grouped by concern (e.g. "Create model files", "Create route files", \
-"Update config and main"). Batch independent file writes using `write_files` or `edit_files` \
-to minimize tool calls. Batch independent file writes using `write_files` or `edit_files` to minimize tool calls.
+"Update config and main").
 ## Guidelines
 - Read files before editing them
 - Use edit_file for targeted changes (preferred over rewriting entire files)
 - Use write_file only for new files or complete rewrites
-- When creating or updating multiple independent files, use write_files to batch them
-- When making independent edits across files, use edit_files to batch them
 - Run existing tests after changes when applicable
 - **When adding or modifying unit tests, ALWAYS run them to verify they pass before finishing.**
 - Keep changes minimal and focused on the task
@@ -139,7 +136,7 @@ Use `context_lines=30` for full function bodies.
 **NEVER read the same file twice.** If you already have the file content in context, use it.
-**NEVER use bash/run_command to read files.** Always use `read_file` or `grep_search`.
+**NEVER use bash to read files.** Always use `read_file` or `grep_search`.
 **Batch independent tool calls**: emit ALL independent tool calls in a single response.
@@ -181,7 +178,7 @@ Every tool call accumulates its result in your context window. Use the minimum n
 **NEVER read the same file twice.** Check if you already have the content in context.
-**NEVER use bash/run_command to read files.** Always use `read_file` or `grep_search`.
+**NEVER use bash to read files.** Always use `read_file` or `grep_search`.
 **Batch independent tool calls**: emit ALL independent tool calls in a single response.
@@ -189,9 +186,7 @@ Every tool call accumulates its result in your context window. Use the minimum n
 **When adding or modifying unit tests, ALWAYS run them to verify they pass before finishing.**
-Use delegate_task to split work into independent subtasks for parallel execution.
-When creating or updating multiple independent files, use write_files to batch them.
-When making independent edits across files, use edit_files to batch them.\
+Use delegate_task to split work into independent subtasks for parallel execution.\
 """

aru_code-0.16.0/aru/cache_patch.py ADDED Viewed

@@ -0,0 +1,133 @@
+"""Monkey-patch Agno's model layer to reduce token consumption.
+Two optimizations:
+1. **Tool result pruning** (ALL providers): After each tool execution, old tool
+   results in the message list are truncated to a short summary. This prevents
+   O(n²) token growth where each API call re-sends all previous tool results.
+2. **Cache breakpoints** (Anthropic only): Marks the last 2 messages with
+   cache_control for Anthropic's prompt caching.
+These patches intercept Agno's internal loop so they work transparently
+regardless of which provider is used.
+"""
+from __future__ import annotations
+# Max chars to keep from old tool results
+_TOOL_RESULT_KEEP_CHARS = 200
+# Number of recent tool results to keep in full
+_KEEP_RECENT_RESULTS = 1
+def _prune_tool_messages(messages):
+    """Truncate old tool result content in the message list.
+    Keeps only the last N tool results in full. Older ones are truncated
+    to a short preview. This runs BEFORE each API call, so accumulated
+    tool results don't bloat the context on every re-send.
+    """
+    # Find all tool message indices
+    tool_indices = [
+        i for i, msg in enumerate(messages)
+        if getattr(msg, "role", None) == "tool"
+    ]
+    if len(tool_indices) <= _KEEP_RECENT_RESULTS:
+        return
+    # Prune all except the last N
+    for idx in tool_indices[:-_KEEP_RECENT_RESULTS]:
+        msg = messages[idx]
+        content = getattr(msg, "content", None)
+        if content is None:
+            continue
+        content_str = str(content)
+        if len(content_str) <= _TOOL_RESULT_KEEP_CHARS:
+            continue
+        truncated = content_str[:_TOOL_RESULT_KEEP_CHARS] + "\n[...truncated]"
+        try:
+            msg.content = truncated
+            if hasattr(msg, "compressed_content"):
+                msg.compressed_content = None
+        except (AttributeError, TypeError):
+            pass
+def apply_cache_patch():
+    """Apply all patches to reduce Agno's token consumption."""
+    _patch_tool_result_pruning()
+    _patch_claude_cache_breakpoints()
+def _patch_tool_result_pruning():
+    """Patch format_function_call_results to prune old tool results.
+    This is called after each tool execution, right before the next API call.
+    Works for ALL providers (Claude, OpenAI, Qwen, etc.) since it patches
+    the base Model class.
+    """
+    from agno.models.base import Model
+    _original_format_results = Model.format_function_call_results
+    def _patched_format_results(self, messages, function_call_results, **kwargs):
+        # First: prune old tool results already in messages
+        _prune_tool_messages(messages)
+        # Then: add new results normally
+        return _original_format_results(self, messages, function_call_results, **kwargs)
+    Model.format_function_call_results = _patched_format_results
+def _patch_claude_cache_breakpoints():
+    """Patch Claude's format_messages to add cache breakpoints.
+    Marks the last 2 messages with cache_control for Anthropic's prompt
+    caching. Non-Anthropic providers ignore these fields.
+    """
+    try:
+        import agno.utils.models.claude as claude_utils
+    except ImportError:
+        return
+    _original_format = claude_utils.format_messages
+    def _patched_format_messages(messages, compress_tool_results=False):
+        chat_messages, system_message = _original_format(
+            messages, compress_tool_results=compress_tool_results
+        )
+        if not chat_messages:
+            return chat_messages, system_message
+        # Add cache_control to last 2 messages
+        cache_marker = {"type": "ephemeral"}
+        marked = 0
+        for msg in reversed(chat_messages):
+            if marked >= 2:
+                break
+            content = msg.get("content")
+            if isinstance(content, list) and content:
+                last_item = content[-1]
+                if isinstance(last_item, dict):
+                    last_item["cache_control"] = cache_marker
+                    marked += 1
+                elif hasattr(last_item, "type"):
+                    try:
+                        as_dict = last_item.model_dump() if hasattr(last_item, "model_dump") else dict(last_item)
+                        as_dict["cache_control"] = cache_marker
+                        content[-1] = as_dict
+                        marked += 1
+                    except Exception:
+                        pass
+            elif isinstance(content, str):
+                msg["content"] = [{"type": "text", "text": content, "cache_control": cache_marker}]
+                marked += 1
+        return chat_messages, system_message
+    claude_utils.format_messages = _patched_format_messages

{aru_code-0.14.1 → aru_code-0.16.0}/aru/cli.py RENAMED Viewed

@@ -50,6 +50,7 @@ from aru.display import (  # noqa: F401
 from aru.completers import (  # noqa: F401
     AruCompleter,
     FileMentionCompleter,
+    MentionResult,
     PasteState,
     SlashCommandCompleter,
     TIPS,
@@ -110,6 +111,11 @@ async def run_cli(skip_permissions: bool = False, resume_id: str | None = None):
     from aru.permissions import parse_permission_config, reset_session as perm_reset_session
     from aru.tools.codebase import cleanup_processes
+    # Inject cache breakpoints into Agno's Claude API calls — reduces token
+    # consumption by ~40% on multi-tool-call interactions via prompt caching.
+    from aru.cache_patch import apply_cache_patch
+    apply_cache_patch()
     ctx = init_ctx(console=console, skip_permissions=skip_permissions)
     store = SessionStore()
@@ -253,16 +259,19 @@ async def run_cli(skip_permissions: bool = False, resume_id: str | None = None):
         # Resolve @file mentions (skip known agent names)
         _agent_names = set(config.custom_agents.keys()) if config.custom_agents else set()
-        resolved, injected, attached_images = _resolve_mentions(user_input, os.getcwd(), _agent_names)
-        if injected > 0:
+        mention_result = _resolve_mentions(user_input, os.getcwd(), _agent_names)
+        attached_images = mention_result.images
+        # File contents go into history as separate prunable messages (not inline)
+        mention_file_msgs = mention_result.file_messages
+        if mention_result.count > 0:
             parts = []
-            text_count = injected - len(attached_images)
+            text_count = mention_result.count - len(attached_images)
             if text_count > 0:
                 parts.append(f"{text_count} file(s)")
             if attached_images:
                 parts.append(f"{len(attached_images)} image(s)")
             console.print(f"[dim]Attached {', '.join(parts)} from @ mentions[/dim]")
-            user_input = resolved
+            user_input = mention_result.text
         if paste_state.pasted_content and user_text:
             console.print(
@@ -276,6 +285,14 @@ async def run_cli(skip_permissions: bool = False, resume_id: str | None = None):
         if not user_input:
             continue
+        # Inject @file contents as prunable history entries BEFORE the user message.
+        # These look like simulated read_file tool calls and can be pruned/compacted
+        # normally, unlike inline content which bloats the user message permanently.
+        if mention_file_msgs:
+            for msg in mention_file_msgs:
+                session.add_message(msg["role"], msg["content"])
+            mention_file_msgs = []  # consumed
         # Reset "allow all" approvals for each new user message
         perm_reset_session()

{aru_code-0.14.1 → aru_code-0.16.0}/aru/completers.py RENAMED Viewed

@@ -4,6 +4,7 @@ from __future__ import annotations
 import os
 import re
+from dataclasses import dataclass
 from prompt_toolkit import PromptSession
 from prompt_toolkit.completion import Completer, Completion
@@ -18,24 +19,36 @@ from aru.commands import SLASH_COMMANDS
 from aru.config import AgentConfig
 _MENTION_RE = re.compile(r'(?<!\S)@([a-zA-Z0-9_./\\:-]+)')
-_MENTION_MAX_SIZE = 30_000  # bytes, same limit as read_file
+_MENTION_MAX_SIZE = 10_000  # bytes — smaller to protect context (model uses read_file for large files)
 _IMAGE_EXTENSIONS = {".png", ".jpg", ".jpeg", ".gif", ".webp", ".bmp"}
 _IMAGE_MAX_SIZE = 20 * 1024 * 1024  # 20MB
-def _resolve_mentions(text: str, cwd: str, agent_names: set[str] | None = None) -> tuple[str, int, list[Image]]:
-    """Resolve @file mentions by appending file contents to the message.
+@dataclass
+class MentionResult:
+    """Result of resolving @file mentions."""
+    text: str                          # User text (without file contents)
+    file_messages: list[dict[str, str]]  # Simulated tool-call pairs for history
+    images: list[Image]
+    count: int                         # Total attached (files + images)
-    Image files (png, jpg, etc.) are returned as Image objects instead of text.
+def _resolve_mentions(text: str, cwd: str, agent_names: set[str] | None = None) -> MentionResult:
+    """Resolve @file mentions as simulated read_file tool calls.
+    Instead of inlining file contents into the user message (which bloats
+    history and can't be pruned), we return separate assistant+tool_result
+    message pairs that the session can prune/compact like normal tool outputs.
+    Image files are returned as Image objects.
     Skips @mentions that match known agent names.
-    Returns (resolved_text, number_of_files_attached, images).
     """
     agent_names = agent_names or set()
     matches = list(_MENTION_RE.finditer(text))
     if not matches:
-        return text, 0, []
+        return MentionResult(text=text, file_messages=[], images=[], count=0)
-    appendix_parts = []
+    file_messages: list[dict[str, str]] = []
     images: list[Image] = []
     seen = set()
     for m in matches:
@@ -64,21 +77,18 @@ def _resolve_mentions(text: str, cwd: str, agent_names: set[str] | None = None)
             size = os.path.getsize(abs_path)
             with open(abs_path, "r", encoding="utf-8", errors="replace") as f:
                 content = f.read(_MENTION_MAX_SIZE)
-            if size > _MENTION_MAX_SIZE:
-                appendix_parts.append(
-                    f"\n\n---\nContents of {rel_path} (truncated to {_MENTION_MAX_SIZE // 1000}KB):\n```\n{content}\n```"
-                )
-            else:
-                appendix_parts.append(
-                    f"\n\n---\nContents of {rel_path}:\n```\n{content}\n```"
-                )
+            truncated = size > _MENTION_MAX_SIZE
+            label = f"[read_file: {rel_path}]"
+            if truncated:
+                label += f" (truncated to {_MENTION_MAX_SIZE // 1000}KB of {size // 1000}KB — use read_file for the rest)"
+            # Simulated tool call pair — can be pruned like normal tool outputs
+            file_messages.append({"role": "assistant", "content": label})
+            file_messages.append({"role": "user", "content": content})
         except OSError:
             continue
-    attached = len(appendix_parts) + len(images)
-    if appendix_parts:
-        return text + "".join(appendix_parts), attached, images
-    return text, attached, images
+    count = len(file_messages) // 2 + len(images)
+    return MentionResult(text=text, file_messages=file_messages, images=images, count=count)
 def _extract_agent_mention(

aru-code 0.14.1__tar.gz → 0.16.0__tar.gz

aru-code 0.14.1__tar.gz → 0.16.0__tar.gz