PyPI - sourcepack - Versions diffs - 1.10.0a0__py3-none-any.whl - Mend

sourcepack 1.10.0a0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

sourcepack/__init__.py +19 -0
sourcepack/assets/__init__.py +1 -0
sourcepack/assets/audit_template.md +3 -0
sourcepack/assets/packet_instructions.md +3 -0
sourcepack/baseline.py +285 -0
sourcepack/cli.py +2991 -0
sourcepack/commands.py +149 -0
sourcepack/dependencies.py +98 -0
sourcepack/diff_parser.py +122 -0
sourcepack/ecosystems/__init__.py +3 -0
sourcepack/ecosystems/generic.py +13 -0
sourcepack/ecosystems/node.py +3 -0
sourcepack/ecosystems/python.py +12 -0
sourcepack/errors.py +19 -0
sourcepack/evidence.py +109 -0
sourcepack/execution_ledger.py +252 -0
sourcepack/git.py +50 -0
sourcepack/judgment.py +1922 -0
sourcepack/packet.py +837 -0
sourcepack/paths.py +68 -0
sourcepack/policy.py +38 -0
sourcepack/reason_codes.py +72 -0
sourcepack/reports/__init__.py +5 -0
sourcepack/reports/html.py +88 -0
sourcepack/reports/json.py +123 -0
sourcepack/reports/markdown.py +61 -0
sourcepack/schemas.py +63 -0
sourcepack-1.10.0a0.dist-info/METADATA +311 -0
sourcepack-1.10.0a0.dist-info/RECORD +33 -0
sourcepack-1.10.0a0.dist-info/WHEEL +5 -0
sourcepack-1.10.0a0.dist-info/entry_points.txt +2 -0
sourcepack-1.10.0a0.dist-info/licenses/LICENSE +21 -0
sourcepack-1.10.0a0.dist-info/top_level.txt +1 -0

sourcepack/execution_ledger.py ADDED Viewed

@@ -0,0 +1,252 @@
+from __future__ import annotations
+import hashlib
+import json
+import os
+import platform
+import re
+import shutil
+import subprocess
+import time
+import uuid
+from dataclasses import asdict, dataclass
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Iterable
+from sourcepack import __version__
+# Schema identifier stamped into every ledger entry's ``schema_version`` field.
+SCHEMA_VERSION = "sourcepack.execution_ledger.v1"
+# File name of the JSON-lines ledger stored inside the evidence directory.
+LEDGER_FILENAME = "ledger.jsonl"
+# Default character cap used by ``excerpt_bytes`` before it truncates output.
+MAX_EXCERPT_CHARS = 2048
+@dataclass(frozen=True)
+class ExecutionClaim:
+    """An explicit "this command was run / passed" statement found in free text."""
+    # Command the claim refers to (e.g. "pytest", "npm test").
+    command: str
+    # The matched span of text that triggered the claim.
+    phrase: str
+    # Start offset of the match within the scanned text.
+    start: int
+    # End offset (exclusive) of the match within the scanned text.
+    end: int
+@dataclass(frozen=True)
+class ExecutionLedgerEntry:
+    """One recorded command execution, as populated by ``run_and_record``."""
+    # Ledger schema identifier (``SCHEMA_VERSION``).
+    schema_version: str
+    # Random hex identifier (uuid4) for this entry.
+    entry_id: str
+    # Timezone-aware UTC timestamp in ISO 8601 form (see ``utc_now``).
+    generated_at: str
+    # Repository root the entry was recorded under, as a string path.
+    repo_root: str
+    # Output of ``git rev-parse HEAD``, or None when it could not be read.
+    git_head: str | None
+    # Whether ``git status --porcelain`` printed anything before the command
+    # ran; None when git status itself failed.
+    worktree_dirty_before: bool | None
+    # Same check, repeated after the command finished.
+    worktree_dirty_after: bool | None
+    # The argv list that was executed.
+    command: list[str]
+    # Resolved working directory of the command.
+    cwd: str
+    # Exit status of the command.
+    exit_code: int
+    # SHA-256 hex digests of the complete captured stdout / stderr bytes.
+    stdout_sha256: str
+    stderr_sha256: str
+    # Decoded, possibly truncated excerpts of stdout / stderr (see ``excerpt_bytes``).
+    stdout_excerpt: str
+    stderr_excerpt: str
+    # Elapsed time of the command in milliseconds (monotonic clock).
+    duration_ms: int
+    # Coarse description of the host environment (see ``environment_summary``).
+    environment_summary: dict
+    # Version of the sourcepack package that wrote the entry.
+    sourcepack_version: str
+def utc_now() -> str:
+    return datetime.now(timezone.utc).isoformat()
+def sha256_bytes(data: bytes) -> str:
+    return hashlib.sha256(data).hexdigest()
+def excerpt_bytes(data: bytes, limit: int = MAX_EXCERPT_CHARS) -> str:
+    text = data.decode("utf-8", "replace")
+    if len(text) <= limit:
+        return text
+    return text[:limit] + "…[truncated]"
+def find_repo_root(start: str | Path = ".") -> Path:
+    start_path = Path(start).resolve()
+    cp = subprocess.run(["git", "rev-parse", "--show-toplevel"], cwd=start_path, text=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
+    if cp.returncode == 0 and cp.stdout.strip():
+        return Path(cp.stdout.strip()).resolve()
+    return start_path
+def _git_head(repo_root: Path) -> str | None:
+    cp = subprocess.run(["git", "rev-parse", "HEAD"], cwd=repo_root, text=True, stdout=subprocess.PIPE, stderr=subprocess.DEVNULL)
+    return cp.stdout.strip() if cp.returncode == 0 and cp.stdout.strip() else None
+def _worktree_dirty(repo_root: Path) -> bool | None:
+    cp = subprocess.run(["git", "status", "--porcelain"], cwd=repo_root, text=True, stdout=subprocess.PIPE, stderr=subprocess.DEVNULL)
+    if cp.returncode != 0:
+        return None
+    return bool(cp.stdout.strip())
+def ledger_dir(repo_root: str | Path) -> Path:
+    return Path(repo_root) / ".sourcepack" / "evidence"
+def ledger_path(repo_root: str | Path) -> Path:
+    return ledger_dir(repo_root) / LEDGER_FILENAME
+def entry_to_json(entry: ExecutionLedgerEntry) -> str:
+    return json.dumps(asdict(entry), sort_keys=True, separators=(",", ":"))
+def append_entry(repo_root: str | Path, entry: ExecutionLedgerEntry) -> None:
+    path = ledger_path(repo_root)
+    path.parent.mkdir(parents=True, exist_ok=True)
+    with path.open("a", encoding="utf-8") as fh:
+        fh.write(entry_to_json(entry) + "\n")
+def iter_entries(repo_root: str | Path) -> Iterable[dict]:
+    path = ledger_path(repo_root)
+    if not path.exists():
+        return
+    with path.open("r", encoding="utf-8") as fh:
+        for line in fh:
+            line = line.strip()
+            if line:
+                yield json.loads(line)
+def clear_ledger(repo_root: str | Path) -> None:
+    path = ledger_path(repo_root)
+    if path.exists():
+        path.unlink()
+def environment_summary() -> dict:
+    return {
+        "platform": platform.platform(),
+        "python": platform.python_version(),
+        "shell": os.environ.get("SHELL"),
+        "path_entries": len(os.environ.get("PATH", "").split(os.pathsep)) if os.environ.get("PATH") else 0,
+    }
+def run_and_record(command: list[str], cwd: str | Path = ".") -> ExecutionLedgerEntry:
+    if not command:
+        raise ValueError("sourcepack exec requires a command after --")
+    repo_root = find_repo_root(cwd)
+    dirty_before = _worktree_dirty(repo_root)
+    head = _git_head(repo_root)
+    start = time.monotonic()
+    cp = subprocess.run(command, cwd=Path(cwd).resolve(), stdout=subprocess.PIPE, stderr=subprocess.PIPE)
+    duration_ms = int((time.monotonic() - start) * 1000)
+    dirty_after = _worktree_dirty(repo_root)
+    entry = ExecutionLedgerEntry(
+        schema_version=SCHEMA_VERSION,
+        entry_id=uuid.uuid4().hex,
+        generated_at=utc_now(),
+        repo_root=str(repo_root),
+        git_head=head,
+        worktree_dirty_before=dirty_before,
+        worktree_dirty_after=dirty_after,
+        command=list(command),
+        cwd=str(Path(cwd).resolve()),
+        exit_code=int(cp.returncode),
+        stdout_sha256=sha256_bytes(cp.stdout),
+        stderr_sha256=sha256_bytes(cp.stderr),
+        stdout_excerpt=excerpt_bytes(cp.stdout),
+        stderr_excerpt=excerpt_bytes(cp.stderr),
+        duration_ms=duration_ms,
+        environment_summary=environment_summary(),
+        sourcepack_version=__version__,
+    )
+    append_entry(repo_root, entry)
+    return entry
+# Lower-case phrases treated as explicit "it passed" claims; the claimed
+# command is the phrase with its trailing " passed" removed.
+_CLEAR_PHRASES = [
+    "tests passed", "test passed", "build passed", "lint passed", "typecheck passed",
+    "pytest passed", "npm test passed", "npm run build passed",
+]
+# Command prefixes recognised when directly followed by "passed", "works" or "succeeds".
+_SUPPORTED_COMMAND_PREFIXES = ["pytest", "npm test", "npm run build", "npm run test", "python -m pytest", "make test", "ruff check", "mypy"]
+# Matches "I ran <something>" / "I tested <something>" (case-insensitive); the
+# captured text stops at the first newline, period or semicolon.
+_RAN_RE = re.compile(r"\bI\s+(?:ran|tested)\s+([^\n.;]+)", re.IGNORECASE)
+def detect_execution_claims(text: str) -> list[ExecutionClaim]:
+    """Return bounded, explicit command-execution claims without semantic guessing."""
+    claims: list[ExecutionClaim] = []
+    lower = text.lower()
+    for phrase in _CLEAR_PHRASES:
+        start = lower.find(phrase)
+        while start != -1:
+            if not re.search(r"\b(should|probably|expected to)\s+" + re.escape(phrase.split()[0]), lower[max(0, start-20):start+len(phrase)]):
+                cmd = phrase.removesuffix(" passed")
+                claims.append(ExecutionClaim(command=cmd, phrase=text[start:start + len(phrase)], start=start, end=start + len(phrase)))
+            start = lower.find(phrase, start + 1)
+    for prefix in _SUPPORTED_COMMAND_PREFIXES:
+        pattern = re.compile(r"\b" + re.escape(prefix) + r"\s+(passed|works|succeeds)\b", re.IGNORECASE)
+        for m in pattern.finditer(text):
+            claims.append(ExecutionClaim(command=prefix, phrase=m.group(0), start=m.start(), end=m.end()))
+    for m in _RAN_RE.finditer(text):
+        cmd = m.group(1).strip().strip('`"\'')
+        if cmd and len(cmd.split()) <= 8 and not cmd.lower().startswith(("tests", "the test file")):
+            claims.append(ExecutionClaim(command=cmd, phrase=m.group(0), start=m.start(), end=m.end()))
+    claims.sort(key=lambda c: (c.start, c.end, c.command))
+    deduped: list[ExecutionClaim] = []
+    seen = set()
+    for claim in claims:
+        key = (claim.command.lower(), claim.start, claim.end)
+        if key not in seen:
+            seen.add(key)
+            deduped.append(claim)
+    return deduped
+def _command_matches(claim: str, entry_command: list[str]) -> bool:
+    normalized_entry = " ".join(entry_command).strip().lower()
+    normalized_claim = claim.strip().lower()
+    return normalized_entry == normalized_claim or normalized_entry.startswith(normalized_claim + " ")
+def evidence_for_claim(repo_root: str | Path, claim: ExecutionClaim) -> tuple[str, dict | None]:
+    matches = [entry for entry in iter_entries(repo_root) if _command_matches(claim.command, list(entry.get("command") or []))]
+    if not matches:
+        return "execution_evidence_missing", None
+    latest = sorted(matches, key=lambda e: str(e.get("generated_at") or ""))[-1]
+    if len({int(m.get("exit_code", -999)) for m in matches}) > 1:
+        return "execution_inconclusive", latest
+    if int(latest.get("exit_code", -1)) == 0:
+        return "execution_evidence_present", latest
+    return "execution_failed", latest
+def execution_findings(repo_root: str | Path, text: str) -> list[dict]:
+    findings: list[dict] = []
+    for claim in detect_execution_claims(text):
+        status, entry = evidence_for_claim(repo_root, claim)
+        if status == "execution_evidence_present":
+            severity = "info"
+            message = f"Execution ledger contains a successful local run for: {claim.command}."
+        elif status == "execution_failed":
+            severity = "warn"
+            message = f"Execution ledger contains a failed local run for: {claim.command}."
+        elif status == "execution_inconclusive":
+            severity = "warn"
+            message = f"Execution ledger has mixed or ambiguous local runs for: {claim.command}."
+        else:
+            severity = "warn"
+            message = f"No SourcePack execution-ledger entry supports claimed run: {claim.command}."
+        findings.append({
+            "id": status,
+            "severity": severity,
+            "category": "execution",
+            "path": None,
+            "message": message,
+            "evidence": claim.command,
+            "suggestion": "Run the command through `sourcepack exec -- ...` if local execution evidence is intended." if severity == "warn" else None,
+            "ledger_entry_id": entry.get("entry_id") if entry else None,
+        })
+    return findings
+def command_available(command: str) -> bool:
+    return shutil.which(command) is not None

sourcepack/git.py ADDED Viewed

@@ -0,0 +1,50 @@
+from __future__ import annotations
+import subprocess
+from pathlib import Path
+def run_git(repo: str | Path, args: list[str]) -> subprocess.CompletedProcess:
+    try:
+        return subprocess.run(["git", *args], cwd=Path(repo), text=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
+    except FileNotFoundError:
+        return subprocess.CompletedProcess(["git", *args], 127, "", "git executable not found")
+def repo_root(path: str | Path) -> Path | None:
+    cp = run_git(path, ["rev-parse", "--show-toplevel"])
+    return Path(cp.stdout.strip()).resolve() if cp.returncode == 0 else None
+def diff(repo: str | Path, *, staged: bool = False, relative: bool = False) -> str:
+    args = ["diff", "--staged"] if staged else ["diff"]
+    if relative:
+        args.append("--relative")
+    return run_git(repo, args).stdout
+def untracked_files(repo: str | Path) -> list[str]:
+    cp = run_git(repo, ["ls-files", "--others", "--exclude-standard"])
+    return [line.strip() for line in cp.stdout.splitlines() if line.strip()] if cp.returncode == 0 else []
+def dirty_worktree(repo: str | Path) -> tuple[bool, str | None]:
+    root = repo_root(repo)
+    if root is None:
+        cp = run_git(repo, ["rev-parse", "--show-toplevel"])
+        return False, "git_unavailable" if cp.returncode == 127 else "not_git"
+    for args in (["diff", "--quiet"], ["diff", "--staged", "--quiet"]):
+        cp = run_git(root, list(args))
+        if cp.returncode == 1:
+            return True, None
+        if cp.returncode == 127:
+            return False, "git_unavailable"
+    return (bool(untracked_files(root)), None)
+def metadata(repo: str | Path) -> dict:
+    root = Path(repo)
+    head = run_git(root, ["rev-parse", "HEAD"])
+    branch = run_git(root, ["rev-parse", "--abbrev-ref", "HEAD"])
+    dirty, state = dirty_worktree(root)
+    return {"branch": branch.stdout.strip() if branch.returncode == 0 else None, "head_commit": head.stdout.strip() if head.returncode == 0 else None, "dirty": dirty if state is None else None, "dirty_state": state}