PyPI - zrb - Versions diffs - 1.4.2__py3-none-any.whl → 1.5.0__py3-none-any.whl - Mend

zrb 1.4.2__py3-none-any.whl → 1.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

zrb/builtin/llm/llm_chat.py +8 -6
zrb/builtin/llm/tool/api.py +1 -1
zrb/builtin/llm/tool/file.py +471 -113
zrb/builtin/llm/tool/rag.py +28 -10
zrb/builtin/llm/tool/web.py +47 -15
zrb/builtin/todo.py +37 -12
zrb/config.py +4 -4
zrb/llm_config.py +41 -14
zrb/task/llm_task.py +29 -14
{zrb-1.4.2.dist-info → zrb-1.5.0.dist-info}/METADATA +64 -41
{zrb-1.4.2.dist-info → zrb-1.5.0.dist-info}/RECORD +13 -13
{zrb-1.4.2.dist-info → zrb-1.5.0.dist-info}/WHEEL +0 -0
{zrb-1.4.2.dist-info → zrb-1.5.0.dist-info}/entry_points.txt +0 -0

zrb/builtin/llm/llm_chat.py CHANGED Viewed

@@ -6,10 +6,11 @@ from zrb.builtin.group import llm_group
 from zrb.builtin.llm.tool.api import get_current_location, get_current_weather
 from zrb.builtin.llm.tool.cli import run_shell_command
 from zrb.builtin.llm.tool.file import (
+    apply_diff,
     list_files,
-    read_all_files,
-    read_text_file,
-    write_text_file,
+    read_from_file,
+    search_files,
+    write_to_file,
 )
 from zrb.builtin.llm.tool.web import (
     create_search_internet_tool,
@@ -161,10 +162,11 @@ llm_chat: LLMTask = llm_group.add_task(
 if LLM_ALLOW_ACCESS_LOCAL_FILE:
-    llm_chat.add_tool(read_all_files)
     llm_chat.add_tool(list_files)
-    llm_chat.add_tool(read_text_file)
-    llm_chat.add_tool(write_text_file)
+    llm_chat.add_tool(read_from_file)
+    llm_chat.add_tool(write_to_file)
+    llm_chat.add_tool(search_files)
+    llm_chat.add_tool(apply_diff)
 if LLM_ALLOW_ACCESS_SHELL:
     llm_chat.add_tool(run_shell_command)

zrb/builtin/llm/tool/api.py CHANGED Viewed

@@ -5,7 +5,7 @@ from typing import Annotated, Literal
 def get_current_location() -> (
     Annotated[str, "JSON string representing latitude and longitude"]
 ):  # noqa
-    """Get the user's current location."""
+    """Get the user's current location. This function take no argument."""
     import requests
     return json.dumps(requests.get("http://ip-api.com/json?fields=lat,lon").json())

zrb/builtin/llm/tool/file.py CHANGED Viewed

@@ -1,119 +1,125 @@
 import fnmatch
 import os
+import re
+from typing import Dict, List, Optional, Tuple, Union
-from zrb.util.file import read_file, write_file
-_INCLUDED_PATTERNS: list[str] = [
-    "*.py",  # Python
-    "*.go",  # Go
-    "*.rs",  # Rust
-    "*.js",  # JavaScript
-    "*.ts",  # TypeScript
-    "*.java",  # Java
-    "*.c",  # C
-    "*.cpp",  # C++
-    "*.cc",  # Alternative C++ extension
-    "*.cxx",  # Alternative C++ extension
-    "*.rb",  # Ruby
-    "*.swift",  # Swift
-    "*.kt",  # Kotlin
-    "*.php",  # PHP
-    "*.pl",  # Perl / Prolog
-    "*.pm",  # Perl module
-    "*.sh",  # Shell
-    "*.bat",  # Batch
-    "*.ps1",  # PowerShell
-    "*.R",  # R (capital)
-    "*.r",  # R (lowercase)
-    "*.scala",  # Scala
-    "*.hs",  # Haskell
-    "*.cs",  # C#
-    "*.fs",  # F#
-    "*.ex",  # Elixir
-    "*.exs",  # Elixir script
-    "*.erl",  # Erlang
-    "*.hrl",  # Erlang header
-    "*.dart",  # Dart
-    "*.m",  # Objective-C / Matlab (note: conflicts may arise)
-    "*.mm",  # Objective-C++
-    "*.lua",  # Lua
-    "*.jl",  # Julia
-    "*.groovy",  # Groovy
-    "*.clj",  # Clojure
-    "*.cljs",  # ClojureScript
-    "*.cljc",  # Clojure common
-    "*.vb",  # Visual Basic
-    "*.f90",  # Fortran
-    "*.f95",  # Fortran
-    "*.adb",  # Ada
-    "*.ads",  # Ada specification
-    "*.pas",  # Pascal
-    "*.pp",  # Pascal
-    "*.ml",  # OCaml
-    "*.mli",  # OCaml interface
-    "*.nim",  # Nim
-    "*.rkt",  # Racket
-    "*.d",  # D
-    "*.lisp",  # Common Lisp
-    "*.lsp",  # Lisp variant
-    "*.cl",  # Common Lisp
-    "*.scm",  # Scheme
-    "*.st",  # Smalltalk
-    "*.vhd",  # VHDL
-    "*.vhdl",  # VHDL
-    "*.v",  # Verilog
-    "*.asm",  # Assembly
-    "*.s",  # Assembly (alternative)
-    "*.sql",  # SQL (if desired)
-]
+from zrb.util.file import read_file as _read_file
+from zrb.util.file import write_file as _write_file
-# Extended list of directories and patterns to exclude.
-_EXCLUDED_PATTERNS: list[str] = [
-    "venv",  # Python virtual environments
+# Common directories and files to exclude from file operations
+_DEFAULT_EXCLUDES = [
+    # Version control
+    ".git",
+    ".svn",
+    ".hg",
+    # Dependencies and packages
+    "node_modules",
+    "venv",
     ".venv",
-    "node_modules",  # Node.js dependencies
-    ".git",  # Git repositories
-    "__pycache__",  # Python cache directories
-    "build",  # Build directories
-    "dist",  # Distribution directories
-    "target",  # Build output directories (Java, Rust, etc.)
-    "bin",  # Binary directories
-    "obj",  # Object files directories
-    ".idea",  # JetBrains IDEs
-    ".vscode",  # VS Code settings
-    ".eggs",  # Python eggs
+    "env",
+    ".env",
+    # Build and cache
+    "__pycache__",
+    "*.pyc",
+    "build",
+    "dist",
+    "target",
+    # IDE and editor files
+    ".idea",
+    ".vscode",
+    "*.swp",
+    "*.swo",
+    # OS-specific
+    ".DS_Store",
+    "Thumbs.db",
+    # Temporary and backup files
+    "*.tmp",
+    "*.bak",
+    "*.log",
 ]
+# Maximum number of lines to read before truncating
+_MAX_LINES_BEFORE_TRUNCATION = 1000
+# Number of context lines to show around method definitions when truncating
+_CONTEXT_LINES = 5
 def list_files(
-    directory: str = ".",
-    included_patterns: list[str] = _INCLUDED_PATTERNS,
-    excluded_patterns: list[str] = _EXCLUDED_PATTERNS,
+    path: str = ".",
+    recursive: bool = True,
+    file_pattern: Optional[str] = None,
+    excluded_patterns: list[str] = _DEFAULT_EXCLUDES,
 ) -> list[str]:
-    """List all files in a directory that match any of the included glob patterns
-    and do not reside in any directory matching an excluded pattern.
-    Patterns are evaluated using glob-style matching.
+    """
+    List files in a directory that match specified patterns.
+    Args:
+        path: The path of the directory to list contents for
+            (relative to the current working directory)
+        recursive: Whether to list files recursively.
+            Use True for recursive listing, False for top-level only.
+        file_pattern: Optional glob pattern to filter files.
+            None by default (all files will be included).
+        excluded_patterns: List of glob patterns to exclude. By default, contains sane values
+            to exclude common directories and files like version control, build artifacts,
+            and temporary files.
+    Returns:
+        A list of file paths matching the criteria
     """
     all_files: list[str] = []
-    for root, dirs, files in os.walk(directory):
-        for filename in files:
-            if any(fnmatch.fnmatch(filename, pat) for pat in included_patterns):
+    if recursive:
+        for root, dirs, files in os.walk(path):
+            # Filter out excluded directories to avoid descending into them
+            dirs[:] = [
+                d
+                for d in dirs
+                if not _should_exclude(os.path.join(root, d), excluded_patterns)
+            ]
+            for filename in files:
                 full_path = os.path.join(root, filename)
-                if _should_exclude(full_path, excluded_patterns):
-                    continue
-                all_files.append(full_path)
-    return all_files
+                # If file_pattern is None, include all files, otherwise match the pattern
+                if file_pattern is None or fnmatch.fnmatch(filename, file_pattern):
+                    if not _should_exclude(full_path, excluded_patterns):
+                        all_files.append(full_path)
+    else:
+        # Non-recursive listing (top-level only)
+        try:
+            for item in os.listdir(path):
+                full_path = os.path.join(path, item)
+                if os.path.isfile(full_path):
+                    # If file_pattern is None, include all files, otherwise match the pattern
+                    if file_pattern is None or fnmatch.fnmatch(item, file_pattern):
+                        if not _should_exclude(full_path, excluded_patterns):
+                            all_files.append(full_path)
+        except (FileNotFoundError, PermissionError) as e:
+            print(f"Error listing files in {path}: {e}")
+    return sorted(all_files)
-def _should_exclude(full_path: str, excluded_patterns: list[str]) -> bool:
+def _should_exclude(
+    full_path: str, excluded_patterns: list[str] = _DEFAULT_EXCLUDES
+) -> bool:
     """
     Return True if the file at full_path should be excluded based on
     the list of excluded_patterns. Patterns that include a path separator
     are applied to the full normalized path; otherwise they are matched
     against each individual component of the path.
+    Args:
+        full_path: The full path to check
+        excluded_patterns: List of patterns to exclude
+    Returns:
+        True if the path should be excluded, False otherwise
     """
     norm_path = os.path.normpath(full_path)
     path_parts = norm_path.split(os.sep)
     for pat in excluded_patterns:
         # If the pattern seems intended for full path matching (contains a separator)
         if os.sep in pat or "/" in pat:
@@ -123,30 +129,382 @@ def _should_exclude(full_path: str, excluded_patterns: list[str]) -> bool:
             # Otherwise check each part of the path
             if any(fnmatch.fnmatch(part, pat) for part in path_parts):
                 return True
+            # Also check the filename against the pattern
+            if os.path.isfile(full_path) and fnmatch.fnmatch(
+                os.path.basename(full_path), pat
+            ):
+                return True
     return False
-def read_text_file(file: str) -> str:
-    """Read a text file and return a string containing the file content."""
-    return read_file(os.path.abspath(file))
+def read_from_file(
+    path: str,
+    start_line: Optional[int] = None,
+    end_line: Optional[int] = None,
+    auto_truncate: bool = False,
+) -> str:
+    """
+    Read the contents of a file at the specified path.
+    Args:
+        path: The path of the file to read (relative to the current working directory)
+        start_line: The starting line number to read from (1-based).
+            If not provided, starts from the beginning.
+        end_line: The ending line number to read to (1-based, inclusive).
+            If not provided, reads to the end.
+        auto_truncate: Whether to automatically truncate large files when start_line
+            and end_line are not specified. If true and the file exceeds a certain
+            line threshold, it will return a subset of lines with information about
+            the total line count and method definitions. Default is False for backward
+            compatibility, but setting to True is recommended for large files.
+    Returns:
+        A string containing the file content, with line numbers prefixed to each line.
+        For truncated files, includes summary information.
+    """
+    try:
+        abs_path = os.path.abspath(path)
-def write_text_file(file: str, content: str):
-    """Write content to a text file"""
-    return write_file(os.path.abspath(file), content)
+        # Read the entire file content
+        content = _read_file(abs_path)
+        lines = content.splitlines()
+        total_lines = len(lines)
+        # Determine if we should truncate
+        should_truncate = (
+            auto_truncate
+            and start_line is None
+            and end_line is None
+            and total_lines > _MAX_LINES_BEFORE_TRUNCATION
+        )
-def read_all_files(
-    directory: str = ".",
-    included_patterns: list[str] = _INCLUDED_PATTERNS,
-    excluded_patterns: list[str] = _EXCLUDED_PATTERNS,
-) -> list[str]:
-    """Read all files in a directory that match any of the included glob patterns
-    and do not match any of the excluded glob patterns.
-    Patterns are evaluated using glob-style matching.
-    """
-    files = list_files(directory, included_patterns, excluded_patterns)
-    for index, file in enumerate(files):
-        content = read_text_file(file)
-        files[index] = f"# {file}\n```\n{content}\n```"
-    return files
+        # Adjust line indices (convert from 1-based to 0-based)
+        start_idx = (start_line - 1) if start_line is not None else 0
+        end_idx = end_line if end_line is not None else total_lines
+        # Validate indices
+        if start_idx < 0:
+            start_idx = 0
+        if end_idx > total_lines:
+            end_idx = total_lines
+        if should_truncate:
+            # Find method definitions and their line ranges
+            method_info = _find_method_definitions(lines)
+            # Create a truncated view with method definitions
+            result_lines = []
+            # Add file info header
+            result_lines.append(f"File: {path} (truncated, {total_lines} lines total)")
+            result_lines.append("")
+            # Add beginning of file (first 100 lines)
+            first_chunk = min(100, total_lines // 3)
+            for i in range(first_chunk):
+                result_lines.append(f"{i+1} | {lines[i]}")
+            result_lines.append("...")
+            omitted_msg = (
+                f"[{first_chunk+1} - {total_lines-100}] Lines omitted for brevity"
+            )
+            result_lines.append(omitted_msg)
+            result_lines.append("...")
+            # Add end of file (last 100 lines)
+            for i in range(max(first_chunk, total_lines - 100), total_lines):
+                result_lines.append(f"{i+1} | {lines[i]}")
+            # Add method definitions summary
+            if method_info:
+                result_lines.append("")
+                result_lines.append("Method definitions found:")
+                for method in method_info:
+                    method_line = (
+                        f"- {method['name']} "
+                        f"(lines {method['start_line']}-{method['end_line']})"
+                    )
+                    result_lines.append(method_line)
+            return "\n".join(result_lines)
+        else:
+            # Return the requested range with line numbers
+            result_lines = []
+            for i in range(start_idx, end_idx):
+                result_lines.append(f"{i+1} | {lines[i]}")
+            return "\n".join(result_lines)
+    except Exception as e:
+        return f"Error reading file {path}: {str(e)}"
+def _find_method_definitions(lines: List[str]) -> List[Dict[str, Union[str, int]]]:
+    """
+    Find method definitions in the given lines of code.
+    Args:
+        lines: List of code lines to analyze
+    Returns:
+        List of dictionaries containing method name, start line, and end line
+    """
+    method_info = []
+    # Simple regex patterns for common method/function definitions
+    patterns = [
+        # Python
+        r"^\s*def\s+([a-zA-Z0-9_]+)\s*\(",
+        # JavaScript/TypeScript
+        r"^\s*(function\s+([a-zA-Z0-9_]+)|([a-zA-Z0-9_]+)\s*=\s*function|"
+        r"\s*([a-zA-Z0-9_]+)\s*\([^)]*\)\s*{)",
+        # Java/C#/C++
+        r"^\s*(?:public|private|protected|static|final|abstract|synchronized)?"
+        r"\s+(?:[a-zA-Z0-9_<>[\]]+\s+)+([a-zA-Z0-9_]+)\s*\(",
+    ]
+    current_method = None
+    for i, line in enumerate(lines):
+        # Check if this line starts a method definition
+        for pattern in patterns:
+            match = re.search(pattern, line)
+            if match:
+                # If we were tracking a method, close it
+                if current_method:
+                    current_method["end_line"] = i
+                    method_info.append(current_method)
+                # Start tracking a new method
+                method_name = next(
+                    group for group in match.groups() if group is not None
+                )
+                current_method = {
+                    "name": method_name,
+                    "start_line": i + 1,  # 1-based line numbering
+                    "end_line": None,
+                }
+                break
+        # Check for method end (simplistic approach)
+        if current_method and line.strip() == "}":
+            current_method["end_line"] = i + 1
+            method_info.append(current_method)
+            current_method = None
+    # Close any open method at the end of the file
+    if current_method:
+        current_method["end_line"] = len(lines)
+        method_info.append(current_method)
+    return method_info
+def write_to_file(path: str, content: str) -> bool:
+    """
+    Write content to a file at the specified path.
+    Args:
+        path: The path of the file to write to (relative to the current working directory)
+        content: The content to write to the file
+    Returns:
+        True if successful, False otherwise
+    """
+    try:
+        # Ensure directory exists
+        directory = os.path.dirname(os.path.abspath(path))
+        if directory and not os.path.exists(directory):
+            os.makedirs(directory, exist_ok=True)
+        # Write the content
+        _write_file(os.path.abspath(path), content)
+        return True
+    except Exception as e:
+        print(f"Error writing to file {path}: {str(e)}")
+        return False
+def search_files(
+    path: str, regex: str, file_pattern: Optional[str] = None, context_lines: int = 2
+) -> str:
+    """
+    Search for a regex pattern across files in a specified directory.
+    Args:
+        path: The path of the directory to search in
+            (relative to the current working directory)
+        regex: The regular expression pattern to search for
+        file_pattern: Optional glob pattern to filter files.
+            Default is None, which includes all files. Only specify this if you need to
+            filter to specific file types (but in most cases, leaving as None is better).
+        context_lines: Number of context lines to show before and after each match.
+            Default is 2, which provides good context without overwhelming output.
+    Returns:
+        A string containing the search results with context
+    """
+    try:
+        # Compile the regex pattern
+        pattern = re.compile(regex)
+        # Get the list of files to search
+        files = list_files(path, recursive=True, file_pattern=file_pattern)
+        results = []
+        match_count = 0
+        for file_path in files:
+            try:
+                with open(file_path, "r", encoding="utf-8", errors="replace") as f:
+                    lines = f.readlines()
+                file_matches = []
+                for i, line in enumerate(lines):
+                    if pattern.search(line):
+                        # Determine context range
+                        start = max(0, i - context_lines)
+                        end = min(len(lines), i + context_lines + 1)
+                        # Add file header if this is the first match in the file
+                        if not file_matches:
+                            file_matches.append(
+                                f"\n{'-' * 80}\n{file_path}\n{'-' * 80}"
+                            )
+                        # Add separator if this isn't the first match and isn't contiguous
+                        # with previous
+                        if (
+                            file_matches
+                            and file_matches[-1] != f"Line {start+1}-{end}:"
+                        ):
+                            file_matches.append(f"\nLine {start+1}-{end}:")
+                        # Add context lines
+                        for j in range(start, end):
+                            prefix = ">" if j == i else " "
+                            file_matches.append(f"{prefix} {j+1}: {lines[j].rstrip()}")
+                        match_count += 1
+                if file_matches:
+                    results.extend(file_matches)
+            except Exception as e:
+                results.append(f"Error reading {file_path}: {str(e)}")
+        if not results:
+            return f"No matches found for pattern '{regex}' in {path}"
+        # Count unique files by counting headers
+        file_count = len([r for r in results if r.startswith("-" * 80)])
+        summary = f"Found {match_count} matches in {file_count} files:\n"
+        return summary + "\n".join(results)
+    except Exception as e:
+        return f"Error searching files: {str(e)}"
+def apply_diff(path: str, diff: str, start_line: int, end_line: int) -> bool:
+    """
+    Replace existing code using a search and replace block.
+    Args:
+        path: The path of the file to modify (relative to the current working directory)
+        diff: The search/replace block defining the changes
+        start_line: The line number where the search block starts (1-based)
+        end_line: The line number where the search block ends (1-based)
+    Returns:
+        True if successful, False otherwise
+    The diff format should be:
+    ```
+    <<<<<<< SEARCH
+    [exact content to find including whitespace]
+    =======
+    [new content to replace with]
+    >>>>>>> REPLACE
+    ```
+    """
+    try:
+        # Read the file
+        abs_path = os.path.abspath(path)
+        content = _read_file(abs_path)
+        lines = content.splitlines()
+        # Validate line numbers
+        if start_line < 1 or end_line > len(lines) or start_line > end_line:
+            print(
+                f"Invalid line range: {start_line}-{end_line} (file has {len(lines)} lines)"
+            )
+            return False
+        # Parse the diff
+        search_content, replace_content = _parse_diff(diff)
+        if search_content is None or replace_content is None:
+            print("Invalid diff format")
+            return False
+        # Extract the content to be replaced
+        original_content = "\n".join(lines[start_line - 1 : end_line])
+        # Verify the search content matches
+        if original_content != search_content:
+            print("Search content does not match the specified lines in the file")
+            return False
+        # Replace the content
+        new_lines = (
+            lines[: start_line - 1] + replace_content.splitlines() + lines[end_line:]
+        )
+        new_content = "\n".join(new_lines)
+        # Write the modified content back to the file
+        _write_file(abs_path, new_content)
+        return True
+    except Exception as e:
+        print(f"Error applying diff to {path}: {str(e)}")
+        return False
+def _parse_diff(diff: str) -> Tuple[Optional[str], Optional[str]]:
+    """
+    Parse a diff string to extract search and replace content.
+    Args:
+        diff: The diff string to parse
+    Returns:
+        A tuple of (search_content, replace_content), or (None, None) if parsing fails
+    """
+    try:
+        # Split the diff into sections
+        search_marker = "<<<<<<< SEARCH"
+        separator = "======="
+        replace_marker = ">>>>>>> REPLACE"
+        if (
+            search_marker not in diff
+            or separator not in diff
+            or replace_marker not in diff
+        ):
+            return None, None
+        # Extract search content
+        search_start = diff.index(search_marker) + len(search_marker)
+        search_end = diff.index(separator)
+        search_content = diff[search_start:search_end].strip()
+        # Extract replace content
+        replace_start = diff.index(separator) + len(separator)
+        replace_end = diff.index(replace_marker)
+        replace_content = diff[replace_start:replace_end].strip()
+        return search_content, replace_content
+    except Exception:
+        return None, None

zrb 1.4.2__py3-none-any.whl → 1.5.0__py3-none-any.whl

zrb 1.4.2__py3-none-any.whl → 1.5.0__py3-none-any.whl