PyPI - harnesskit - Versions diffs - 0.1.0__tar.gz - Mend

harnesskit 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

harnesskit-0.1.0/LICENSE +21 -0
harnesskit-0.1.0/PKG-INFO +169 -0
harnesskit-0.1.0/README.md +152 -0
harnesskit-0.1.0/harnesskit.egg-info/PKG-INFO +169 -0
harnesskit-0.1.0/harnesskit.egg-info/SOURCES.txt +9 -0
harnesskit-0.1.0/harnesskit.egg-info/dependency_links.txt +1 -0
harnesskit-0.1.0/harnesskit.egg-info/entry_points.txt +2 -0
harnesskit-0.1.0/harnesskit.egg-info/top_level.txt +1 -0
harnesskit-0.1.0/hk.py +419 -0
harnesskit-0.1.0/pyproject.toml +30 -0
harnesskit-0.1.0/setup.cfg +4 -0

harnesskit-0.1.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Alex Melges
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

harnesskit-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,169 @@
+Metadata-Version: 2.4
+Name: harnesskit
+Version: 0.1.0
+Summary: Fuzzy edit tool for LLM coding agents — never fail a str_replace again
+Author-email: Alex Melges <alex@melges.dev>
+License-Expression: MIT
+Project-URL: Homepage, https://github.com/alexmelges/harnesskit
+Project-URL: Repository, https://github.com/alexmelges/harnesskit
+Classifier: Development Status :: 3 - Alpha
+Classifier: Intended Audience :: Developers
+Classifier: Programming Language :: Python :: 3
+Classifier: Topic :: Software Development :: Libraries
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Dynamic: license-file
+# 🔧 HarnessKit
+> **Fuzzy edit tool for LLM coding agents — never fail a `str_replace` again.**
+[![License: MIT](https://img.shields.io/badge/License-MIT-blue.svg)](LICENSE)
+[![Python 3.8+](https://img.shields.io/badge/python-3.8+-green.svg)](https://python.org)
+[![Zero Dependencies](https://img.shields.io/badge/dependencies-zero-brightgreen.svg)](#)
+---
+## The Problem
+Every LLM coding agent has the same Achilles' heel: **edit application**.
+When Claude, GPT, or any model tries to modify code, it generates an `old_text` → `new_text` pair. The tool then does an exact string match to find where to apply the change. And it fails. A lot.
+- **Whitespace differences** — the model adds a space, drops a tab, or normalizes indentation
+- **Minor hallucinations** — a variable name is slightly off, a comment is paraphrased
+- **Format fragility** — diffs, patches, and line-number schemes all break in different ways
+The result? Up to **50% edit failure rates** on non-native models. Every failed edit wastes a tool call, burns tokens on retries, and breaks agent flow.
+## The Solution
+HarnessKit (`hk`) is a drop-in edit tool that **fuzzy-matches** the old text before replacing it. It uses a 4-stage matching cascade:
+1. **Exact match** — zero overhead when the model is precise
+2. **Normalized whitespace** — catches the most common failure mode
+3. **Sequence matching** — `difflib.SequenceMatcher` with configurable threshold (default 0.8)
+4. **Line-by-line fuzzy** — finds the best contiguous block match for heavily drifted edits
+Every edit returns a **confidence score** and **match type**, so your agent knows exactly how the edit was resolved.
+## Quick Start
+```bash
+pip install harnesskit
+```
+Or just copy `hk.py` into your project — it's a single file, stdlib only.
+### CLI Usage
+```bash
+# Direct arguments
+hk apply --file app.py --old "def hello():\n    print('hi')" --new "def hello():\n    print('hello world')"
+# JSON from stdin (perfect for tool_use integration)
+echo '{"file": "app.py", "old_text": "def hello():", "new_text": "def greet():"}' | hk apply --stdin
+# From a JSON file
+hk apply --edit changes.json
+# Dry run — see what would change without writing
+hk apply --file app.py --old "..." --new "..." --dry-run
+```
+### JSON Edit Format
+```json
+{
+  "file": "path/to/file.py",
+  "old_text": "def hello():\n    print('hi')",
+  "new_text": "def hello():\n    print('hello world')"
+}
+```
+Batch multiple edits:
+```json
+{
+  "edits": [
+    {"file": "a.py", "old_text": "...", "new_text": "..."},
+    {"file": "b.py", "old_text": "...", "new_text": "..."}
+  ]
+}
+```
+### Output
+```json
+{
+  "status": "applied",
+  "file": "app.py",
+  "match_type": "fuzzy",
+  "confidence": 0.92,
+  "matched_text": "def hello():\n    print( 'hi' )"
+}
+```
+### Exit Codes
+| Code | Meaning |
+|------|---------|
+| `0`  | Edit applied successfully |
+| `1`  | No match found, or an error occurred (e.g. file not found, invalid input) |
+| `2`  | Ambiguous — multiple matches |
+## Integration
+HarnessKit is designed to slot into any agent framework as the edit backend:
+```python
+import subprocess, json
+def apply_edit(file, old_text, new_text):
+    result = subprocess.run(
+        ["hk", "apply", "--stdin"],
+        input=json.dumps({"file": file, "old_text": old_text, "new_text": new_text}),
+        capture_output=True, text=True
+    )
+    return json.loads(result.stdout)
+```
+Or import directly:
+```python
+from hk import apply_edit
+result = apply_edit("app.py", old_text, new_text, threshold=0.8)
+```
+## Design Principles
+- **Single file, stdlib only** — copy it, vendor it, pip install it. No dependency hell.
+- **419 lines of Python** — small enough to audit in one sitting
+- **Graceful degradation** — exact match when possible, fuzzy only when needed
+- **Transparent** — every result tells you *how* it matched and *how confident* it is
+- **Model-agnostic** — works with any LLM that can produce old/new text pairs
+## Configuration
+| Flag | Default | Description |
+|------|---------|-------------|
+| `--threshold` | `0.8` | Minimum similarity score for fuzzy matching |
+| `--dry-run` | `false` | Preview changes without writing to disk |
+## Development
+```bash
+git clone https://github.com/alexmelges/harnesskit.git
+cd harnesskit
+python3 test_hk.py  # 39 tests, stdlib unittest
+```
+## License
+MIT — see [LICENSE](LICENSE).
+---
+**Built for the agents that build everything else.**

harnesskit-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,152 @@
+# 🔧 HarnessKit
+> **Fuzzy edit tool for LLM coding agents — never fail a `str_replace` again.**
+[![License: MIT](https://img.shields.io/badge/License-MIT-blue.svg)](LICENSE)
+[![Python 3.8+](https://img.shields.io/badge/python-3.8+-green.svg)](https://python.org)
+[![Zero Dependencies](https://img.shields.io/badge/dependencies-zero-brightgreen.svg)](#)
+---
+## The Problem
+Every LLM coding agent has the same Achilles' heel: **edit application**.
+When Claude, GPT, or any model tries to modify code, it generates an `old_text` → `new_text` pair. The tool then does an exact string match to find where to apply the change. And it fails. A lot.
+- **Whitespace differences** — the model adds a space, drops a tab, or normalizes indentation
+- **Minor hallucinations** — a variable name is slightly off, a comment is paraphrased
+- **Format fragility** — diffs, patches, and line-number schemes all break in different ways
+The result? Up to **50% edit failure rates** on non-native models. Every failed edit wastes a tool call, burns tokens on retries, and breaks agent flow.
+## The Solution
+HarnessKit (`hk`) is a drop-in edit tool that **fuzzy-matches** the old text before replacing it. It uses a 4-stage matching cascade:
+1. **Exact match** — zero overhead when the model is precise
+2. **Normalized whitespace** — catches the most common failure mode
+3. **Sequence matching** — `difflib.SequenceMatcher` with configurable threshold (default 0.8)
+4. **Line-by-line fuzzy** — finds the best contiguous block match for heavily drifted edits
+Every edit returns a **confidence score** and **match type**, so your agent knows exactly how the edit was resolved.
+## Quick Start
+```bash
+pip install harnesskit
+```
+Or just copy `hk.py` into your project — it's a single file, stdlib only.
+### CLI Usage
+```bash
+# Direct arguments
+hk apply --file app.py --old "def hello():\n    print('hi')" --new "def hello():\n    print('hello world')"
+# JSON from stdin (perfect for tool_use integration)
+echo '{"file": "app.py", "old_text": "def hello():", "new_text": "def greet():"}' | hk apply --stdin
+# From a JSON file
+hk apply --edit changes.json
+# Dry run — see what would change without writing
+hk apply --file app.py --old "..." --new "..." --dry-run
+```
+### JSON Edit Format
+```json
+{
+  "file": "path/to/file.py",
+  "old_text": "def hello():\n    print('hi')",
+  "new_text": "def hello():\n    print('hello world')"
+}
+```
+Batch multiple edits:
+```json
+{
+  "edits": [
+    {"file": "a.py", "old_text": "...", "new_text": "..."},
+    {"file": "b.py", "old_text": "...", "new_text": "..."}
+  ]
+}
+```
+### Output
+```json
+{
+  "status": "applied",
+  "file": "app.py",
+  "match_type": "fuzzy",
+  "confidence": 0.92,
+  "matched_text": "def hello():\n    print( 'hi' )"
+}
+```
+### Exit Codes
+| Code | Meaning |
+|------|---------|
+| `0`  | Edit applied successfully |
+| `1`  | No match found, or an error occurred (e.g. file not found, invalid input) |
+| `2`  | Ambiguous — multiple matches |
+## Integration
+HarnessKit is designed to slot into any agent framework as the edit backend:
+```python
+import subprocess, json
+def apply_edit(file, old_text, new_text):
+    result = subprocess.run(
+        ["hk", "apply", "--stdin"],
+        input=json.dumps({"file": file, "old_text": old_text, "new_text": new_text}),
+        capture_output=True, text=True
+    )
+    return json.loads(result.stdout)
+```
+Or import directly:
+```python
+from hk import apply_edit
+result = apply_edit("app.py", old_text, new_text, threshold=0.8)
+```
+## Design Principles
+- **Single file, stdlib only** — copy it, vendor it, pip install it. No dependency hell.
+- **419 lines of Python** — small enough to audit in one sitting
+- **Graceful degradation** — exact match when possible, fuzzy only when needed
+- **Transparent** — every result tells you *how* it matched and *how confident* it is
+- **Model-agnostic** — works with any LLM that can produce old/new text pairs
+## Configuration
+| Flag | Default | Description |
+|------|---------|-------------|
+| `--threshold` | `0.8` | Minimum similarity score for fuzzy matching |
+| `--dry-run` | `false` | Preview changes without writing to disk |
+## Development
+```bash
+git clone https://github.com/alexmelges/harnesskit.git
+cd harnesskit
+python3 test_hk.py  # 39 tests, stdlib unittest
+```
+## License
+MIT — see [LICENSE](LICENSE).
+---
+**Built for the agents that build everything else.**

harnesskit-0.1.0/harnesskit.egg-info/PKG-INFO ADDED Viewed

@@ -0,0 +1,169 @@
+Metadata-Version: 2.4
+Name: harnesskit
+Version: 0.1.0
+Summary: Fuzzy edit tool for LLM coding agents — never fail a str_replace again
+Author-email: Alex Melges <alex@melges.dev>
+License-Expression: MIT
+Project-URL: Homepage, https://github.com/alexmelges/harnesskit
+Project-URL: Repository, https://github.com/alexmelges/harnesskit
+Classifier: Development Status :: 3 - Alpha
+Classifier: Intended Audience :: Developers
+Classifier: Programming Language :: Python :: 3
+Classifier: Topic :: Software Development :: Libraries
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Dynamic: license-file
+# 🔧 HarnessKit
+> **Fuzzy edit tool for LLM coding agents — never fail a `str_replace` again.**
+[![License: MIT](https://img.shields.io/badge/License-MIT-blue.svg)](LICENSE)
+[![Python 3.8+](https://img.shields.io/badge/python-3.8+-green.svg)](https://python.org)
+[![Zero Dependencies](https://img.shields.io/badge/dependencies-zero-brightgreen.svg)](#)
+---
+## The Problem
+Every LLM coding agent has the same Achilles' heel: **edit application**.
+When Claude, GPT, or any model tries to modify code, it generates an `old_text` → `new_text` pair. The tool then does an exact string match to find where to apply the change. And it fails. A lot.
+- **Whitespace differences** — the model adds a space, drops a tab, or normalizes indentation
+- **Minor hallucinations** — a variable name is slightly off, a comment is paraphrased
+- **Format fragility** — diffs, patches, and line-number schemes all break in different ways
+The result? Up to **50% edit failure rates** on non-native models. Every failed edit wastes a tool call, burns tokens on retries, and breaks agent flow.
+## The Solution
+HarnessKit (`hk`) is a drop-in edit tool that **fuzzy-matches** the old text before replacing it. It uses a 4-stage matching cascade:
+1. **Exact match** — zero overhead when the model is precise
+2. **Normalized whitespace** — catches the most common failure mode
+3. **Sequence matching** — `difflib.SequenceMatcher` with configurable threshold (default 0.8)
+4. **Line-by-line fuzzy** — finds the best contiguous block match for heavily drifted edits
+Every edit returns a **confidence score** and **match type**, so your agent knows exactly how the edit was resolved.
+## Quick Start
+```bash
+pip install harnesskit
+```
+Or just copy `hk.py` into your project — it's a single file, stdlib only.
+### CLI Usage
+```bash
+# Direct arguments
+hk apply --file app.py --old "def hello():\n    print('hi')" --new "def hello():\n    print('hello world')"
+# JSON from stdin (perfect for tool_use integration)
+echo '{"file": "app.py", "old_text": "def hello():", "new_text": "def greet():"}' | hk apply --stdin
+# From a JSON file
+hk apply --edit changes.json
+# Dry run — see what would change without writing
+hk apply --file app.py --old "..." --new "..." --dry-run
+```
+### JSON Edit Format
+```json
+{
+  "file": "path/to/file.py",
+  "old_text": "def hello():\n    print('hi')",
+  "new_text": "def hello():\n    print('hello world')"
+}
+```
+Batch multiple edits:
+```json
+{
+  "edits": [
+    {"file": "a.py", "old_text": "...", "new_text": "..."},
+    {"file": "b.py", "old_text": "...", "new_text": "..."}
+  ]
+}
+```
+### Output
+```json
+{
+  "status": "applied",
+  "file": "app.py",
+  "match_type": "fuzzy",
+  "confidence": 0.92,
+  "matched_text": "def hello():\n    print( 'hi' )"
+}
+```
+### Exit Codes
+| Code | Meaning |
+|------|---------|
+| `0`  | Edit applied successfully |
+| `1`  | No match found, or an error occurred (e.g. file not found, invalid input) |
+| `2`  | Ambiguous — multiple matches |
+## Integration
+HarnessKit is designed to slot into any agent framework as the edit backend:
+```python
+import subprocess, json
+def apply_edit(file, old_text, new_text):
+    result = subprocess.run(
+        ["hk", "apply", "--stdin"],
+        input=json.dumps({"file": file, "old_text": old_text, "new_text": new_text}),
+        capture_output=True, text=True
+    )
+    return json.loads(result.stdout)
+```
+Or import directly:
+```python
+from hk import apply_edit
+result = apply_edit("app.py", old_text, new_text, threshold=0.8)
+```
+## Design Principles
+- **Single file, stdlib only** — copy it, vendor it, pip install it. No dependency hell.
+- **419 lines of Python** — small enough to audit in one sitting
+- **Graceful degradation** — exact match when possible, fuzzy only when needed
+- **Transparent** — every result tells you *how* it matched and *how confident* it is
+- **Model-agnostic** — works with any LLM that can produce old/new text pairs
+## Configuration
+| Flag | Default | Description |
+|------|---------|-------------|
+| `--threshold` | `0.8` | Minimum similarity score for fuzzy matching |
+| `--dry-run` | `false` | Preview changes without writing to disk |
+## Development
+```bash
+git clone https://github.com/alexmelges/harnesskit.git
+cd harnesskit
+python3 test_hk.py  # 39 tests, stdlib unittest
+```
+## License
+MIT — see [LICENSE](LICENSE).
+---
+**Built for the agents that build everything else.**

harnesskit-0.1.0/harnesskit.egg-info/SOURCES.txt ADDED Viewed

@@ -0,0 +1,9 @@
+LICENSE
+README.md
+hk.py
+pyproject.toml
+harnesskit.egg-info/PKG-INFO
+harnesskit.egg-info/SOURCES.txt
+harnesskit.egg-info/dependency_links.txt
+harnesskit.egg-info/entry_points.txt
+harnesskit.egg-info/top_level.txt

harnesskit-0.1.0/harnesskit.egg-info/dependency_links.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+

harnesskit-0.1.0/harnesskit.egg-info/entry_points.txt ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ [console_scripts]
2	+ hk = hk:main

harnesskit-0.1.0/harnesskit.egg-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ hk

harnesskit-0.1.0/hk.py ADDED Viewed

@@ -0,0 +1,419 @@
+#!/usr/bin/env python3
+"""HarnessKit — Fuzzy edit tool for LLM coding agents.
+A single-file CLI tool that applies edits to files using fuzzy matching.
+Accepts a simple, model-agnostic edit format and robustly applies changes
+even when the LLM's output isn't pixel-perfect.
+Algorithm:
+  1. Try exact match
+  2. Fall back to normalized whitespace match
+  3. Fall back to difflib.SequenceMatcher (configurable threshold)
+  4. Fall back to line-by-line fuzzy match (best contiguous block)
+Exit codes: 0=applied, 1=no match found or error, 2=ambiguous (multiple matches)
+"""
+import argparse
+import difflib
+import json
+import re
+import sys
+from dataclasses import dataclass
+from typing import List, Optional, Tuple
+@dataclass
+class MatchResult:
+    """One candidate span of the file content that matches the search text."""
+    start: int  # offset in the content where the span begins
+    end: int  # offset just past the span; content[start:end] is what gets replaced
+    matched_text: str  # text recorded for this candidate
+    match_type: str  # "exact", "whitespace", "fuzzy", "line_fuzzy"
+    confidence: float  # 1.0 for exact, 0.95 for whitespace, otherwise a rounded similarity score
+@dataclass
+class EditResult:
+    """Outcome of attempting one edit on one file."""
+    status: str  # "applied", "no_match", "ambiguous", "error"
+    file: str  # path of the target file, as passed in by the caller
+    match_type: Optional[str] = None  # strategy behind the match; apply_edit sets it for "applied" and "ambiguous"
+    confidence: Optional[float] = None  # confidence of that match; set alongside match_type
+    matched_text: Optional[str] = None  # text that was replaced; apply_edit sets it only for "applied"
+    error: Optional[str] = None  # human-readable reason; apply_edit sets it for every status except "applied"
+def normalize_whitespace(text: str) -> str:
+    """Collapse all runs of whitespace to single spaces and strip."""
+    return re.sub(r'\s+', ' ', text).strip()
+def find_exact_matches(content: str, old_text: str) -> List[MatchResult]:
+    """Find all exact occurrences of old_text in content."""
+    matches = []
+    start = 0
+    while True:
+        idx = content.find(old_text, start)
+        if idx == -1:
+            break
+        matches.append(MatchResult(
+            start=idx,
+            end=idx + len(old_text),
+            matched_text=old_text,
+            match_type="exact",
+            confidence=1.0,
+        ))
+        start = idx + 1
+    return matches
+def _strip_whitespace_with_map(text: str) -> Tuple[str, List[int]]:
+    """Strip all whitespace from text, returning (stripped, position_map).
+    position_map[i] = index in original text of the i-th non-ws char.
+    """
+    chars: List[str] = []
+    positions: List[int] = []
+    for i, ch in enumerate(text):
+        if not ch.isspace():
+            chars.append(ch)
+            positions.append(i)
+    return ''.join(chars), positions
+def find_whitespace_matches(content: str, old_text: str) -> List[MatchResult]:
+    """Find matches where the only differences are whitespace.
+    Strips all whitespace from both strings, finds substring matches
+    in the stripped content, then maps positions back to the original.
+    """
+    stripped_old, _ = _strip_whitespace_with_map(old_text)
+    if not stripped_old:
+        return []
+    stripped_content, content_pos_map = _strip_whitespace_with_map(content)
+    matches = []
+    start = 0
+    while True:
+        idx = stripped_content.find(stripped_old, start)
+        if idx == -1:
+            break
+        # Map back to original positions
+        orig_start = content_pos_map[idx]
+        orig_end_char = content_pos_map[idx + len(stripped_old) - 1]
+        orig_end = orig_end_char + 1
+        matched = content[orig_start:orig_end]
+        matches.append(MatchResult(
+            start=orig_start,
+            end=orig_end,
+            matched_text=matched,
+            match_type="whitespace",
+            confidence=0.95,
+        ))
+        start = idx + 1
+    return matches
+def find_fuzzy_matches(
+    content: str, old_text: str, threshold: float
+) -> List[MatchResult]:
+    """Find fuzzy matches using SequenceMatcher on sliding windows."""
+    if not old_text.strip():
+        return []
+    old_len = len(old_text)
+    best: List[MatchResult] = []
+    best_ratio = threshold
+    # Slide a window of varying sizes around the expected length
+    min_window = max(1, int(old_len * 0.7))
+    max_window = min(len(content), int(old_len * 1.3) + 1)
+    for window_size in range(min_window, max_window + 1):
+        for start in range(0, len(content) - window_size + 1):
+            candidate = content[start:start + window_size]
+            ratio = difflib.SequenceMatcher(
+                None, old_text, candidate
+            ).ratio()
+            if ratio > best_ratio:
+                best = [MatchResult(
+                    start=start,
+                    end=start + window_size,
+                    matched_text=candidate,
+                    match_type="fuzzy",
+                    confidence=round(ratio, 4),
+                )]
+                best_ratio = ratio
+            elif ratio == best_ratio and best:
+                # Check overlap — only add if non-overlapping
+                overlaps = any(
+                    not (start >= m.end or start + window_size <= m.start)
+                    for m in best
+                )
+                if not overlaps:
+                    best.append(MatchResult(
+                        start=start,
+                        end=start + window_size,
+                        matched_text=candidate,
+                        match_type="fuzzy",
+                        confidence=round(ratio, 4),
+                    ))
+    return best
+def find_line_fuzzy_matches(
+    content: str, old_text: str, threshold: float
+) -> List[MatchResult]:
+    """Find best contiguous block of lines matching old_text lines."""
+    content_lines = content.splitlines(keepends=True)
+    old_lines = old_text.splitlines(keepends=True)
+    if not old_lines or not content_lines:
+        return []
+    n_old = len(old_lines)
+    best_score = threshold
+    best_matches: List[Tuple[int, int, float]] = []  # (start_line, end_line, score)
+    for start_line in range(0, len(content_lines) - n_old + 1):
+        block = content_lines[start_line:start_line + n_old]
+        # Compare line by line
+        total = 0.0
+        for ol, cl in zip(old_lines, block):
+            total += difflib.SequenceMatcher(None, ol, cl).ratio()
+        avg = total / n_old
+        if avg > best_score:
+            best_score = avg
+            best_matches = [(start_line, start_line + n_old, avg)]
+        elif avg == best_score and best_matches:
+            best_matches.append((start_line, start_line + n_old, avg))
+    results = []
+    for start_line, end_line, score in best_matches:
+        block = content_lines[start_line:end_line]
+        matched_text = ''.join(block)
+        # Calculate char offsets
+        char_start = sum(len(l) for l in content_lines[:start_line])
+        char_end = char_start + len(matched_text)
+        results.append(MatchResult(
+            start=char_start,
+            end=char_end,
+            matched_text=matched_text,
+            match_type="line_fuzzy",
+            confidence=round(score, 4),
+        ))
+    return results
+def find_best_match(
+    content: str, old_text: str, threshold: float = 0.8
+) -> Optional[MatchResult]:
+    """Find the best match for old_text in content, trying strategies in order.
+    Returns None if no match meets the threshold, or if multiple ambiguous
+    matches are found (raises AmbiguousMatchError).
+    """
+    # Strategy 1: Exact match
+    matches = find_exact_matches(content, old_text)
+    if len(matches) == 1:
+        return matches[0]
+    if len(matches) > 1:
+        raise AmbiguousMatchError(matches)
+    # Strategy 2: Whitespace-normalized match
+    matches = find_whitespace_matches(content, old_text)
+    if len(matches) == 1:
+        return matches[0]
+    if len(matches) > 1:
+        raise AmbiguousMatchError(matches)
+    # Strategy 3: SequenceMatcher fuzzy match
+    matches = find_fuzzy_matches(content, old_text, threshold)
+    if len(matches) == 1:
+        return matches[0]
+    if len(matches) > 1:
+        raise AmbiguousMatchError(matches)
+    # Strategy 4: Line-by-line fuzzy match
+    matches = find_line_fuzzy_matches(content, old_text, threshold)
+    if len(matches) == 1:
+        return matches[0]
+    if len(matches) > 1:
+        raise AmbiguousMatchError(matches)
+    return None
+class AmbiguousMatchError(Exception):
+    """Raised when multiple equally-good matches are found."""
+    def __init__(self, matches: List[MatchResult]):
+        self.matches = matches
+        super().__init__(f"Found {len(matches)} ambiguous matches")
+def apply_edit(
+    file_path: str,
+    old_text: str,
+    new_text: str,
+    threshold: float = 0.8,
+    dry_run: bool = False,
+) -> EditResult:
+    """Apply a single edit to a file."""
+    try:
+        with open(file_path, 'r') as f:
+            content = f.read()
+    except FileNotFoundError:
+        return EditResult(
+            status="error",
+            file=file_path,
+            error=f"File not found: {file_path}",
+        )
+    except OSError as e:
+        return EditResult(
+            status="error",
+            file=file_path,
+            error=str(e),
+        )
+    try:
+        match = find_best_match(content, old_text, threshold)
+    except AmbiguousMatchError as e:
+        return EditResult(
+            status="ambiguous",
+            file=file_path,
+            match_type=e.matches[0].match_type,
+            confidence=e.matches[0].confidence,
+            error=f"Found {len(e.matches)} ambiguous matches",
+        )
+    if match is None:
+        return EditResult(
+            status="no_match",
+            file=file_path,
+            error="No match found above threshold",
+        )
+    new_content = content[:match.start] + new_text + content[match.end:]
+    if not dry_run:
+        with open(file_path, 'w') as f:
+            f.write(new_content)
+    return EditResult(
+        status="applied",
+        file=file_path,
+        match_type=match.match_type,
+        confidence=match.confidence,
+        matched_text=match.matched_text,
+    )
+def result_to_dict(result: EditResult) -> dict:
+    """Convert EditResult to JSON-serializable dict."""
+    d = {"status": result.status, "file": result.file}
+    if result.match_type is not None:
+        d["match_type"] = result.match_type
+    if result.confidence is not None:
+        d["confidence"] = result.confidence
+    if result.matched_text is not None:
+        d["matched_text"] = result.matched_text
+    if result.error is not None:
+        d["error"] = result.error
+    return d
+def parse_edit_input(args) -> List[dict]:
+    """Parse edit instructions from CLI args or stdin."""
+    if args.stdin:
+        data = json.load(sys.stdin)
+        if "edits" in data:
+            return data["edits"]
+        return [data]
+    if args.edit:
+        with open(args.edit, 'r') as f:
+            data = json.load(f)
+        if "edits" in data:
+            return data["edits"]
+        return [data]
+    if args.file and args.old is not None and args.new is not None:
+        return [{"file": args.file, "old_text": args.old, "new_text": args.new}]
+    raise ValueError(
+        "Must provide --file/--old/--new, --edit <file>, or --stdin"
+    )
+def main(argv: Optional[List[str]] = None) -> int:
+    parser = argparse.ArgumentParser(
+        prog="hk",
+        description="HarnessKit — Fuzzy edit tool for LLM coding agents",
+    )
+    sub = parser.add_subparsers(dest="command")
+    apply_parser = sub.add_parser("apply", help="Apply edit(s) to file(s)")
+    apply_parser.add_argument("--file", help="Target file path")
+    apply_parser.add_argument("--old", help="Text to find")
+    apply_parser.add_argument("--new", help="Replacement text")
+    apply_parser.add_argument("--edit", help="JSON edit instruction file")
+    apply_parser.add_argument(
+        "--stdin", action="store_true", help="Read JSON from stdin"
+    )
+    apply_parser.add_argument(
+        "--threshold",
+        type=float,
+        default=0.8,
+        help="Fuzzy match threshold (default: 0.8)",
+    )
+    apply_parser.add_argument(
+        "--dry-run",
+        action="store_true",
+        help="Show what would change without applying",
+    )
+    args = parser.parse_args(argv)
+    if args.command != "apply":
+        parser.print_help()
+        return 1
+    try:
+        edits = parse_edit_input(args)
+    except (ValueError, FileNotFoundError, json.JSONDecodeError) as e:
+        print(json.dumps({"status": "error", "error": str(e)}))
+        return 1
+    results = []
+    exit_code = 0
+    for edit in edits:
+        file_path = edit.get("file", "")
+        old_text = edit.get("old_text", "")
+        new_text = edit.get("new_text", "")
+        result = apply_edit(
+            file_path, old_text, new_text,
+            threshold=args.threshold,
+            dry_run=args.dry_run,
+        )
+        results.append(result_to_dict(result))
+        if result.status == "no_match" or result.status == "error":
+            exit_code = max(exit_code, 1)
+        elif result.status == "ambiguous":
+            exit_code = max(exit_code, 2)
+    if len(results) == 1:
+        print(json.dumps(results[0], indent=2))
+    else:
+        print(json.dumps(results, indent=2))
+    return exit_code
+if __name__ == "__main__":
+    sys.exit(main())

harnesskit-0.1.0/pyproject.toml ADDED Viewed

@@ -0,0 +1,30 @@
+[build-system]
+requires = ["setuptools>=64"]
+build-backend = "setuptools.build_meta"
+[project]
+name = "harnesskit"
+version = "0.1.0"
+description = "Fuzzy edit tool for LLM coding agents — never fail a str_replace again"
+readme = "README.md"
+license = "MIT"
+requires-python = ">=3.8"
+authors = [
+    {name = "Alex Melges", email = "alex@melges.dev"},
+]
+classifiers = [
+    "Development Status :: 3 - Alpha",
+    "Intended Audience :: Developers",
+    "Programming Language :: Python :: 3",
+    "Topic :: Software Development :: Libraries",
+]
+[project.urls]
+Homepage = "https://github.com/alexmelges/harnesskit"
+Repository = "https://github.com/alexmelges/harnesskit"
+[project.scripts]
+hk = "hk:main"
+[tool.setuptools]
+py-modules = ["hk"]

harnesskit-0.1.0/setup.cfg ADDED Viewed

@@ -0,0 +1,4 @@
+[egg_info]
+tag_build =
+tag_date = 0