PyPI - loom-code - Versions diffs - 0.1.1__py3-none-any.whl - Mend

loom-code 0.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (58) hide show

loom_code/__init__.py +22 -0
loom_code/_post_commit.py +119 -0
loom_code/agent.py +544 -0
loom_code/approval.py +616 -0
loom_code/browse/__init__.py +291 -0
loom_code/browse/act.py +467 -0
loom_code/browse/observe.py +249 -0
loom_code/browse/session.py +96 -0
loom_code/browse/verify.py +194 -0
loom_code/checkpoint.py +283 -0
loom_code/cli.py +495 -0
loom_code/code_index.py +703 -0
loom_code/compact.py +143 -0
loom_code/consent.py +47 -0
loom_code/credentials.py +527 -0
loom_code/edit_tool.py +635 -0
loom_code/extensions.py +522 -0
loom_code/file_history.py +322 -0
loom_code/file_tools.py +93 -0
loom_code/git_hook.py +200 -0
loom_code/grep_tool.py +430 -0
loom_code/hooks.py +297 -0
loom_code/loominit/__init__.py +23 -0
loom_code/loominit/_ast_walk.py +429 -0
loom_code/loominit/_files.py +284 -0
loom_code/loominit/_graph.py +141 -0
loom_code/loominit/_resolve.py +392 -0
loom_code/loominit/_tests_map.py +108 -0
loom_code/loominit/extractor.py +332 -0
loom_code/loominit/repomap.py +225 -0
loom_code/loominit/schema.py +242 -0
loom_code/lsp_tools.py +396 -0
loom_code/mcp_host.py +79 -0
loom_code/operator.py +449 -0
loom_code/paste.py +97 -0
loom_code/paths.py +52 -0
loom_code/permissions.py +177 -0
loom_code/project.py +104 -0
loom_code/prompts.py +451 -0
loom_code/render.py +783 -0
loom_code/repl.py +4080 -0
loom_code/rules.py +267 -0
loom_code/sandboxed_bash.py +176 -0
loom_code/scribe.py +88 -0
loom_code/skills/__init__.py +16 -0
loom_code/skills/graphify/SKILL.md +97 -0
loom_code/skills/graphify/tools.py +570 -0
loom_code/trust.py +216 -0
loom_code/turn.py +169 -0
loom_code/web_fetch.py +370 -0
loom_code/workers.py +758 -0
loom_code/worktree.py +134 -0
loom_code-0.1.1.dist-info/METADATA +224 -0
loom_code-0.1.1.dist-info/RECORD +58 -0
loom_code-0.1.1.dist-info/WHEEL +5 -0
loom_code-0.1.1.dist-info/entry_points.txt +2 -0
loom_code-0.1.1.dist-info/licenses/LICENSE +21 -0
loom_code-0.1.1.dist-info/top_level.txt +1 -0

loom_code/grep_tool.py ADDED Viewed

@@ -0,0 +1,430 @@
+"""Enhanced ``grep`` tool for loom-code agents.
+Same role as ``loomflow.tools.grep_tool`` — find regex matches under a
+working directory — but with structured output the agent can actually
+USE without N follow-up reads:
+* **Surrounding context** — ±N lines around each match so the agent
+  sees the match in context (loomflow's default is just the matching
+  line, which forces a separate ``read`` of every interesting hit).
+* **Grouped by file** — all matches for one file in a single block
+  with the path as a header. Easier to scan than 50 ``path:line:``
+  prefixes.
+* **Test-file collapsing** — hits in ``tests/`` / ``test_*.py`` /
+  ``*_test.py`` collapse into a one-line "+N matches in test files"
+  summary by default. Keeps prod code in focus; agent opts in to
+  test matches with ``include_tests=True``.
+* **Optional language filter** — ``type="py,ts"`` (a comma-separated
+  extension list) restricts the search to files with those extensions.
+Default behaviour is the enhanced form so the agent's default grep is
+the good one. Pass ``raw=True`` for the old flat-line format if a
+tight one-line-per-match shape is needed.
+Why this lives in loom-code (not loomflow): loom-code is opinionated
+about the SHAPE of grep output for coding-agent UX. The framework's
+``grep_tool`` is a sensible generic; this wrapper adds the loom-code
+ergonomics without forking the framework.
+"""
+from __future__ import annotations
+import json
+import re
+import shutil
+import subprocess
+from pathlib import Path
+from typing import Any
+from loomflow import tool
+from loomflow.tools.registry import Tool
+def _as_int(value: Any, default: int) -> int:
+    """Coerce a model-supplied value to int. The tool-call layer
+    often serialises ``context=2`` as the STRING ``"2"`` (and some
+    providers send floats), so a typed ``int`` param arrives as a
+    str and ``lineno - context`` crashes with 'int - str'. Coerce
+    leniently; fall back to ``default`` on anything unparseable."""
+    if isinstance(value, bool):
+        # bool is an int subclass — don't let True become 1 silently
+        # for a numeric arg; treat as default.
+        return default
+    if isinstance(value, int):
+        return value
+    try:
+        return int(str(value).strip())
+    except (TypeError, ValueError):
+        return default
+def _as_bool(value: Any, default: bool = False) -> bool:
+    """Coerce a model-supplied value to bool. Weak models send
+    ``ignore_case=true`` as the STRING ``"true"`` (or ``"1"`` /
+    ``"yes"``); a typed ``bool`` param then arrives truthy-non-empty
+    for ANY non-empty string including ``"false"``. Parse the
+    common truthy/falsy spellings explicitly."""
+    if isinstance(value, bool):
+        return value
+    if value is None:
+        return default
+    s = str(value).strip().lower()
+    if s in ("true", "1", "yes", "y", "on"):
+        return True
+    if s in ("false", "0", "no", "n", "off", ""):
+        return False
+    return default
+# Directory names that are never searched. Intended to mirror
+# loomflow's grep_tool noise list so behaviour around big
+# virtualenvs / build outputs matches the framework default (not
+# verifiable from this file — confirm against loomflow). Used twice
+# below: the pure-Python walk skips any path that has one of these
+# names as a component, and the ripgrep fast path passes each one as
+# a ``--glob '!**/<name>/**'`` exclude.
+_NOISE_DIRS = frozenset({
+    ".git", "node_modules", "__pycache__", ".venv", "venv",
+    ".env", ".tox", "dist", "build", ".pytest_cache", ".ruff_cache",
+    ".mypy_cache", "graphify-out", ".loom",
+})
+# Path components that mark a file as test code for the
+# "is this a test file?" heuristic: any path containing ``tests``,
+# ``test`` or ``__tests__``. File-name conventions (``test_*``,
+# ``*_test.py``, ``*.test.*``, ``*.spec.*``) are checked separately
+# in ``_is_test_path``.
+_TEST_DIR_NAMES = frozenset({"tests", "test", "__tests__"})
+def _is_test_path(rel: Path) -> bool:
+    """True if the relative path is a test file by directory or
+    filename convention."""
+    parts = set(rel.parts)
+    if parts & _TEST_DIR_NAMES:
+        return True
+    name = rel.name.lower()
+    if name.startswith("test_") or name.endswith("_test.py"):
+        return True
+    if ".test." in name or ".spec." in name:
+        return True
+    return False
+def _walk_files(
+    root: Path,
+    glob: str,
+    type_filter: tuple[str, ...] | None,
+) -> list[Path]:
+    """Walk ``root`` honouring ``_NOISE_DIRS`` + the user's glob +
+    optional extension allowlist. Returns absolute paths."""
+    out: list[Path] = []
+    for path in root.rglob(glob):
+        if not path.is_file():
+            continue
+        if any(p in _NOISE_DIRS for p in path.parts):
+            continue
+        if type_filter is not None:
+            suffix = path.suffix.lstrip(".").lower()
+            if suffix not in type_filter:
+                continue
+        out.append(path)
+    return out
+def _rg_path() -> str | None:
+    """Absolute path to the real ripgrep binary, or None if absent.
+    ``shutil.which`` finds the executable on PATH — not any shell
+    function shim (subprocess never sees shell functions anyway)."""
+    return shutil.which("rg")
+def _collect_with_ripgrep(
+    target: Path,
+    pattern: str,
+    *,
+    ignore_case: bool,
+    glob: str,
+    type_filter: tuple[str, ...] | None,
+    max_files: int,
+    max_per_file: int,
+) -> dict[Path, list[tuple[int, str]]] | None:
+    """Fast path: ripgrep does the matching; we parse its --json stream.
+    Returns ``matches_by_file`` (same shape the Python walk produces), or
+    ``None`` to signal "fall back to Python" — when rg is absent, the
+    pattern uses a feature rg's Rust regex rejects (lookahead /
+    backrefs → exit 2), or rg errors. Never raises, so the caller's
+    fallback stays a simple ``is None`` check.
+    rg respects .gitignore (correct for a code tool); we ALSO pass the
+    historical _NOISE_DIRS as --glob excludes so a non-git tree or an
+    un-ignored .venv stays quiet — a superset of the old walk, never a
+    regression."""
+    rg = _rg_path()
+    if rg is None:
+        return None
+    argv = [rg, "--json", "--no-messages"]
+    if ignore_case:
+        argv.append("--ignore-case")
+    if glob and glob != "*":
+        argv += ["--glob", glob]
+    for noise in _NOISE_DIRS:
+        argv += ["--glob", f"!**/{noise}/**"]
+    if type_filter:
+        # rg has no arbitrary-extension flag — express each as a glob.
+        for ext in type_filter:
+            argv += ["--glob", f"*.{ext}"]
+    argv += ["--regexp", pattern, str(target)]
+    try:
+        proc = subprocess.run(
+            argv, capture_output=True, text=True, timeout=30
+        )
+    except (OSError, subprocess.SubprocessError):
+        return None
+    # rg exit codes: 0 = matches, 1 = no matches (NOT an error),
+    # 2 = real error (bad/unsupported regex) → fall back to the Python
+    # engine, which may accept the pattern.
+    if proc.returncode == 2:
+        return None
+    matches_by_file: dict[Path, list[tuple[int, str]]] = {}
+    for raw_line in proc.stdout.splitlines():
+        if not raw_line:
+            continue
+        try:
+            evt = json.loads(raw_line)
+        except json.JSONDecodeError:
+            continue
+        if evt.get("type") != "match":
+            continue
+        data = evt["data"]
+        fpath = Path(data["path"]["text"])
+        lineno = int(data["line_number"])
+        text = str(data["lines"]["text"]).rstrip("\n")
+        bucket = matches_by_file.setdefault(fpath, [])
+        if len(bucket) < max_per_file:
+            bucket.append((lineno, text))
+    # Honour the file cap deterministically (rg emits in walk order).
+    if len(matches_by_file) > max_files:
+        keep = sorted(matches_by_file)[:max_files]
+        matches_by_file = {k: matches_by_file[k] for k in keep}
+    return matches_by_file
+def _render_grouped(
+    matches_by_file: dict[Path, list[tuple[int, str]]],
+    file_lines: dict[Path, list[str]],
+    *,
+    context: int,
+    root: Path,
+) -> str:
+    """Render the structured per-file output with context lines."""
+    if not matches_by_file:
+        return "no matches"
+    sections: list[str] = []
+    for path in sorted(matches_by_file):
+        hits = matches_by_file[path]
+        lines = file_lines[path]
+        rel = path.relative_to(root)
+        sections.append(
+            f"─ {rel} ({len(hits)} match{'es' if len(hits) != 1 else ''}) "
+            + "─" * max(0, 40 - len(str(rel)))
+        )
+        # For each hit, show context lines. If multiple hits are
+        # close together their context windows merge naturally —
+        # we DON'T deduplicate here because that'd hide hit
+        # boundaries; instead we render each hit's window. Agent
+        # gets a slight redundancy in exchange for clearer per-
+        # hit framing.
+        for lineno, _ in hits:
+            start = max(0, lineno - 1 - context)
+            end = min(len(lines), lineno + context)
+            for i in range(start, end):
+                marker = "▸ " if i + 1 == lineno else "  "
+                sections.append(
+                    f"  {marker}{i + 1:4d} │ {lines[i].rstrip()}"
+                )
+            sections.append("")  # blank line between hit windows
+        # Remove trailing blank for tidiness.
+        if sections and sections[-1] == "":
+            sections.pop()
+    return "\n".join(sections)
+def enhanced_grep_tool(
+    workdir: Path | str,
+    *,
+    max_files_with_matches: int = 30,
+    max_matches_per_file: int = 10,
+    default_context: int = 2,
+) -> Tool:
+    """Build the loom-code grep tool. Sees the model with:
+        grep(pattern, path=".", glob="*",
+             ignore_case=False, context=2,
+             include_tests=False, raw=False,
+             type="")
+    ``pattern`` is a Python regex. ``path`` is relative to the agent's
+    workdir. ``context`` is ±N lines around each match (default 2).
+    ``include_tests=True`` un-collapses test-file hits. ``raw=True``
+    drops the grouped/contextual rendering and falls back to flat
+    ``path:lineno: line`` lines (loomflow's classic shape) for
+    consumers that want one-line-per-match. ``type`` is a
+    comma-separated extension filter (e.g. ``"py,ts"``) — empty
+    means no filter.
+    """
+    root = Path(workdir).resolve()
+    async def grep(
+        pattern: str,
+        path: str = ".",
+        glob: str = "*",
+        ignore_case: bool = False,
+        context: int = default_context,
+        include_tests: bool = False,
+        raw: bool = False,
+        type: str = "",  # noqa: A002 — model-facing arg name; matches CLI ergonomics
+    ) -> str:
+        """Find regex matches under ``path`` and return grouped,
+        context-rich results. See module docstring for the full
+        contract."""
+        # Coerce model-supplied args defensively — the tool-call
+        # layer serialises typed params as strings ("2", "true"),
+        # which crashed the line-window math ('int - str') and
+        # made bool flags always-truthy. Same lenient coercion
+        # loomflow's plan_write does for weak-model serialisation.
+        context = _as_int(context, default_context)
+        ignore_case = _as_bool(ignore_case, default=False)
+        include_tests = _as_bool(include_tests, default=False)
+        raw = _as_bool(raw, default=False)
+        # Resolve and bounds-check ``path``. Must stay under root.
+        target = (root / path).resolve()
+        try:
+            target.relative_to(root)
+        except ValueError:
+            return f"grep: refusing to search outside workdir: {target}"
+        if not target.exists():
+            return f"grep: path not found: {path}"
+        # Pre-compile the pattern; surface regex errors to the agent
+        # so it can fix the call instead of getting empty output.
+        flags = re.IGNORECASE if ignore_case else 0
+        try:
+            regex = re.compile(pattern, flags)
+        except re.error as exc:
+            return f"grep: invalid regex {pattern!r}: {exc}"
+        # Normalise the type filter.
+        type_filter: tuple[str, ...] | None = None
+        if type:
+            type_filter = tuple(
+                t.strip().lower() for t in type.split(",") if t.strip()
+            )
+        # Collect raw per-file hits. FAST PATH: ripgrep (respects
+        # .gitignore, Rust-fast). FALLBACK: the pure-Python walk below,
+        # used when rg is absent or rejects the pattern (lookahead /
+        # backrefs) — so capability never regresses, only speed varies.
+        raw_hits: dict[Path, list[tuple[int, str]]] = {}
+        rg_result = _collect_with_ripgrep(
+            target,
+            pattern,
+            ignore_case=ignore_case,
+            glob=glob,
+            type_filter=type_filter,
+            max_files=max_files_with_matches * 4,
+            max_per_file=max_matches_per_file,
+        )
+        if rg_result is not None:
+            raw_hits = rg_result
+        else:
+            # Pure-Python walk: read every candidate file, regex each
+            # line. Identical regex dialect to the agent's `pattern`.
+            for fpath in _walk_files(target, glob, type_filter):
+                try:
+                    text = fpath.read_text(
+                        encoding="utf-8", errors="replace"
+                    )
+                except OSError:
+                    continue
+                hits: list[tuple[int, str]] = []
+                for i, line in enumerate(text.splitlines(), start=1):
+                    if regex.search(line):
+                        hits.append((i, line))
+                        if len(hits) >= max_matches_per_file:
+                            break
+                if hits:
+                    raw_hits[fpath] = hits
+        # Shared post-process: apply the test-file collapse + file cap +
+        # build the context cache. Runs identically for both paths so rg
+        # and Python output are byte-for-byte the same.
+        matches_by_file: dict[Path, list[tuple[int, str]]] = {}
+        file_lines_cache: dict[Path, list[str]] = {}
+        test_file_count = 0
+        test_match_count = 0
+        for fpath in sorted(raw_hits):
+            hits = raw_hits[fpath]
+            rel = fpath.relative_to(root)
+            if (not include_tests) and _is_test_path(rel):
+                test_file_count += 1
+                test_match_count += len(hits)
+                continue
+            try:
+                lines = fpath.read_text(
+                    encoding="utf-8", errors="replace"
+                ).splitlines()
+            except OSError:
+                continue
+            matches_by_file[fpath] = hits
+            file_lines_cache[fpath] = lines
+            if len(matches_by_file) >= max_files_with_matches:
+                break
+        if raw:
+            # Old flat shape — loomflow's classic output. Kept as
+            # an escape hatch for one-line-per-match consumers.
+            out: list[str] = []
+            for fpath in sorted(matches_by_file):
+                rel = fpath.relative_to(root)
+                for lineno, line in matches_by_file[fpath]:
+                    out.append(f"{rel}:{lineno}: {line}")
+            if test_match_count and not include_tests:
+                out.append(
+                    f"... +{test_match_count} match(es) in "
+                    f"{test_file_count} test file(s) "
+                    "(pass include_tests=True to show)"
+                )
+            return "\n".join(out) if out else "no matches"
+        # Default rendering: grouped + with context.
+        body = _render_grouped(
+            matches_by_file,
+            file_lines_cache,
+            context=context,
+            root=root,
+        )
+        if test_match_count and not include_tests:
+            body += (
+                f"\n\n+ {test_match_count} match(es) in "
+                f"{test_file_count} test file(s) — "
+                "pass include_tests=True to show"
+            )
+        return body
+    # Use the @tool decorator pattern by promoting the closure
+    # into a Tool with a manually-built schema. We can't use the
+    # bare @tool decorator on a nested function because the
+    # decorator-derived description would lose the loom-code-
+    # specific guidance the agent needs to pick the right args.
+    return tool(
+        name="grep",
+        description=(
+            "Search file contents for a regex. Returns grouped "
+            "results: one block per file, with ±2 lines of "
+            "context around each hit. Test-file matches are "
+            "collapsed by default — pass include_tests=True to "
+            "show. Args: pattern (regex), path='.', glob='*', "
+            "ignore_case=False, context=2 (±N lines), "
+            "include_tests=False, raw=False (raw=True for "
+            "flat one-line-per-match output), type='' "
+            "(comma-separated extensions e.g. 'py,ts')."
+        ),
+    )(grep)