PyPI - sin-code-bundle - Versions diffs - 0.9.2__py3-none-any.whl - Mend

sin-code-bundle 0.9.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

sin_code_bundle/__init__.py +6 -0
sin_code_bundle/agents_md.py +245 -0
sin_code_bundle/ast_edit.py +323 -0
sin_code_bundle/bench.py +506 -0
sin_code_bundle/budget.py +51 -0
sin_code_bundle/cache.py +131 -0
sin_code_bundle/checkpoint.py +230 -0
sin_code_bundle/cli.py +1943 -0
sin_code_bundle/codocs.py +328 -0
sin_code_bundle/dap_bridge.py +135 -0
sin_code_bundle/data/codocs/SKILL.md +280 -0
sin_code_bundle/gitnexus.py +368 -0
sin_code_bundle/hashline.py +216 -0
sin_code_bundle/hooks.py +249 -0
sin_code_bundle/immortal_commit.py +288 -0
sin_code_bundle/interceptor.py +119 -0
sin_code_bundle/lsp_backend.py +303 -0
sin_code_bundle/lsp_bootstrap.py +85 -0
sin_code_bundle/markitdown.py +254 -0
sin_code_bundle/mcp_config.py +455 -0
sin_code_bundle/mcp_server.py +963 -0
sin_code_bundle/memory.py +208 -0
sin_code_bundle/merge_safety.py +313 -0
sin_code_bundle/orchestration_worktrees.py +102 -0
sin_code_bundle/policy.py +224 -0
sin_code_bundle/preflight.py +152 -0
sin_code_bundle/programming_workflow.py +541 -0
sin_code_bundle/rtk.py +154 -0
sin_code_bundle/safety.py +52 -0
sin_code_bundle/session_warmup.py +247 -0
sin_code_bundle/skills.py +188 -0
sin_code_bundle/symbol_resolve.py +166 -0
sin_code_bundle/tools/__init__.py +4 -0
sin_code_bundle/tools/pypi_setup.py +289 -0
sin_code_bundle/vfs.py +264 -0
sin_code_bundle-0.9.2.dist-info/METADATA +470 -0
sin_code_bundle-0.9.2.dist-info/RECORD +41 -0
sin_code_bundle-0.9.2.dist-info/WHEEL +5 -0
sin_code_bundle-0.9.2.dist-info/entry_points.txt +4 -0
sin_code_bundle-0.9.2.dist-info/licenses/LICENSE +21 -0
sin_code_bundle-0.9.2.dist-info/top_level.txt +1 -0

sin_code_bundle/policy.py ADDED Viewed

@@ -0,0 +1,224 @@
+# SPDX-License-Identifier: MIT
+"""Risk-gating, approval, and tamper-evident audit logging for SIN tools.
+MCP has no native access control. This module wraps every tool execution with:
+  - a per-tool risk classification (read | write | exec | network)
+  - a configurable policy (allow | ask | deny) per risk class
+  - an append-only, hash-chained audit log under .sin/audit/log.jsonl
+  - path sandboxing helpers so tools cannot read/write outside the project root
+Policy is loaded from .sin/policy.yaml (falls back to safe defaults).
+Docs: policy.doc.md
+"""
+from __future__ import annotations
+import hashlib
+import json
+import os
+import time
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Callable, Literal, Optional
+try:
+    import yaml
+except ImportError:  # pragma: no cover
+    yaml = None  # type: ignore
+# Closed vocabularies used throughout this module: the risk class assigned to
+# a tool, and the decision the policy yields for a risk class.
+RiskClass = Literal["read", "write", "exec", "network"]
+Decision = Literal["allow", "ask", "deny"]
+# ── Tool risk classification ─────────────────────────────────────────
+# New MCP tools must be added here so the policy engine can rate them.
+# A tool that is missing from this table is rated "exec" by Policy.decide()
+# and AuditLog.record(), so a forgotten entry prompts under the default
+# policy instead of running silently.
+TOOL_RISK: dict[str, RiskClass] = {
+    "impact": "read",
+    "semantic_diff": "read",
+    "semantic_review": "read",
+    "architectural_debt": "read",
+    "prove": "read",
+    "verify_tests": "exec",
+    "mock_env": "network",
+}
+# Safe defaults: reads are silent, everything else prompts.
+# Never set "exec" or "network" to "allow" without explicit user opt-in.
+# Policy.load() layers the user's `rules` mapping on top of this table, key
+# by key, so a policy file only needs to list the classes it overrides.
+DEFAULT_POLICY: dict[RiskClass, Decision] = {
+    "read": "allow",
+    "write": "ask",
+    "exec": "ask",
+    "network": "ask",
+}
+class PolicyError(RuntimeError):
+    """Raised when policy refuses a tool call or a path leaves the project root.
+    `guarded()` raises it for "deny" decisions and for "ask" decisions that
+    were not approved; `ensure_within_root()` raises it for paths that
+    resolve outside the root.
+    """
+# ── Policy: Rule Container ────────────────────────────────────────────
+@dataclass
+class Policy:
+    """Loaded policy rules + auto-approval flag.
+    `auto_approve` is a kill switch for the approval prompt: if True
+    (or `SIN_AUTO_APPROVE=1` in the env), all "ask" decisions pass
+    without user interaction. Use only in trusted CI.
+    """
+    rules: dict[RiskClass, Decision] = field(default_factory=lambda: dict(DEFAULT_POLICY))
+    auto_approve: bool = field(default_factory=lambda: os.environ.get("SIN_AUTO_APPROVE") == "1")
+    @classmethod
+    def load(cls, root: Path = Path(".")) -> "Policy":
+        """Load policy from `<root>/.sin/policy.yaml`, falling back to defaults.
+        Missing file or missing PyYAML → returns a `Policy` populated with
+        `DEFAULT_POLICY` and `auto_approve` derived from `SIN_AUTO_APPROVE`.
+        User-supplied `rules` are merged on top of defaults (per-key override).
+        """
+        path = root / ".sin" / "policy.yaml"
+        if path.exists() and yaml is not None:
+            data = yaml.safe_load(path.read_text(encoding="utf-8")) or {}
+            rules = {**DEFAULT_POLICY, **(data.get("rules") or {})}
+            return cls(rules=rules, auto_approve=bool(data.get("auto_approve", False)))
+        return cls()
+    def decide(self, tool: str) -> Decision:
+        """Map a tool name to its policy decision.
+        Unknown tools default to risk class `"exec"` (fail-closed — the
+        default decision for `exec` is `"ask"`, so they prompt unless
+        `auto_approve` is on).
+        """
+        risk = TOOL_RISK.get(tool, "exec")
+        return self.rules.get(risk, "ask")
+# ── Tamper-evident Audit Log (hash chain) ────────────────────────────────
+class AuditLog:
+    """Append-only JSONL log under `<root>/.sin/audit/log.jsonl`.
+    Each entry's `hash` is `sha256(prev_hash || canonical_json(entry))`,
+    forming a hash chain. `verify_chain()` re-walks the file to confirm
+    no entry has been edited or removed. Argument *values* are never
+    logged — only the *keys* (to avoid leaking secrets via the audit log).
+    """
+    def __init__(self, root: Path = Path(".")) -> None:
+        self.path = root / ".sin" / "audit" / "log.jsonl"
+        # parents=True — creates .sin/ and .sin/audit/ in one shot
+        self.path.parent.mkdir(parents=True, exist_ok=True)
+    def _last_hash(self) -> str:
+        if not self.path.exists():
+            return "0" * 64
+        last = ""
+        for line in self.path.read_text(encoding="utf-8").splitlines():
+            if line.strip():
+                last = line
+        if not last:
+            return "0" * 64
+        return json.loads(last).get("hash", "0" * 64)
+    def record(self, tool: str, args: dict, decision: Decision, outcome: str) -> str:
+        """Append one entry to the log and return its hash.
+        `args` is inspected by *key* only (sorted) — values are not stored,
+        so secrets in tool args never reach disk.
+        """
+        prev = self._last_hash()
+        entry = {
+            "ts": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
+            "tool": tool,
+            "risk": TOOL_RISK.get(tool, "exec"),
+            "decision": decision,
+            "outcome": outcome,
+            "args_keys": sorted(args.keys()),
+            "prev": prev,
+        }
+        # sort_keys=True — canonical form so verify_chain() can reproduce
+        # the exact same digest bit-for-bit regardless of dict insertion order
+        digest = hashlib.sha256(
+            (prev + json.dumps(entry, sort_keys=True)).encode("utf-8")
+        ).hexdigest()
+        entry["hash"] = digest
+        with self.path.open("a", encoding="utf-8") as fh:
+            fh.write(json.dumps(entry) + "\n")
+        return digest
+    def verify_chain(self) -> bool:
+        """Return True if the hash chain is intact (no tampering)."""
+        if not self.path.exists():
+            return True
+        prev = "0" * 64
+        for line in self.path.read_text(encoding="utf-8").splitlines():
+            if not line.strip():
+                continue
+            entry = json.loads(line)
+            stored = entry.pop("hash", "")
+            if entry.get("prev") != prev:
+                return False
+            # MUST use sort_keys=True here to match the digest computed in
+            # record(); otherwise any field-order change in json.dumps would
+            # fail verification even on a benign log.
+            recomputed = hashlib.sha256(
+                (prev + json.dumps(entry, sort_keys=True)).encode("utf-8")
+            ).hexdigest()
+            if recomputed != stored:
+                return False
+            prev = stored
+        return True
+# ── Path Sandboxing ───────────────────────────────────────────────────────
+def ensure_within_root(target: str | Path, root: Optional[str | Path] = None) -> Path:
+    """Resolve `target` and guarantee it stays inside the project root."""
+    root_path = Path(root or os.environ.get("SIN_PROJECT_ROOT", ".")).resolve()
+    resolved = (
+        (root_path / target).resolve()
+        if not Path(target).is_absolute()  # type: ignore[arg-type]
+        else Path(target).resolve()  # type: ignore[arg-type]
+    )
+    if root_path not in resolved.parents and resolved != root_path:
+        raise PolicyError(f"path '{resolved}' is outside project root '{root_path}'")
+    return resolved
+# ── Guarded Tool Wrapper (MCP gate) ────────────────────────────────────────
+def guarded(
+    tool: str,
+    args: dict,
+    run: Callable[[], dict],
+    root: Path = Path("."),
+    approver: Optional[Callable[[str, dict], bool]] = None,
+) -> dict:
+    """Apply policy + audit around a tool execution.
+    `approver` is called for 'ask' decisions; defaults to auto-deny unless
+    SIN_AUTO_APPROVE=1 (so non-interactive runs are safe by default).
+    """
+    policy = Policy.load(root)
+    audit = AuditLog(root)
+    decision = policy.decide(tool)
+    if decision == "deny":
+        audit.record(tool, args, decision, "denied")
+        raise PolicyError(f"tool '{tool}' denied by policy (risk={TOOL_RISK.get(tool)})")
+    if decision == "ask":
+        approved = policy.auto_approve or (approver(tool, args) if approver else False)
+        if not approved:
+            audit.record(tool, args, decision, "rejected")
+            raise PolicyError(
+                f"tool '{tool}' requires approval (risk={TOOL_RISK.get(tool)}). "
+                "Set SIN_AUTO_APPROVE=1 or adjust .sin/policy.yaml."
+            )
+    try:
+        result = run()
+        audit.record(tool, args, decision, "ok")
+        return result
+    except Exception as exc:  # noqa: BLE001
+        audit.record(tool, args, decision, f"error:{type(exc).__name__}")
+        raise

sin_code_bundle/preflight.py ADDED Viewed

@@ -0,0 +1,152 @@
+# Purpose: Pre-flight safety gate — checks before state-changing tool calls.
+# Docs: preflight.doc.md
+"""Consolidates policy (sin_check_architecture) + docs (codocs) + git + tests
+into 1 call. Run BEFORE sin_write, sin_edit, sin_bash, sin_ast_edit.
+Docs: preflight.doc.md
+"""
+from __future__ import annotations
+import subprocess
+from pathlib import Path
+from typing import Any, Dict, Optional
+class PreflightChecker:
+    """Run all pre-flight checks in one go.
+    Each check is independent — failure of one does not block the others.
+    Returns a structured dict with per-check results and a derived risk score.
+    """
+    def __init__(self, repo_root: Optional[Path] = None) -> None:
+        self.repo_root = Path(repo_root) if repo_root else Path.cwd()
+    def check(self, tool_name: str, tool_input: Dict[str, Any]) -> Dict[str, Any]:
+        """Run policy + docs + git + tests checks.
+        Args:
+            tool_name: tool about to be called (e.g. ``sin_write``).
+            tool_input: arguments to that tool.
+        Returns:
+            Dict with ``allowed``, ``policy_ok``, ``docs_ok``, ``git_clean``,
+            ``tests_status``, ``estimated_risk``, ``violations`` and ``details``.
+        """
+        result: Dict[str, Any] = {
+            "tool_name": tool_name,
+            "allowed": True,
+            "policy_ok": True,
+            "docs_ok": True,
+            "git_clean": True,
+            "tests_status": "unknown",
+            "estimated_risk": "low",
+            "violations": [],
+            "details": {},
+        }
+        # ── 1. Policy check (existing SINInterceptor) ────────────────────
+        # Reuses the same rule engine as sin_check_architecture, so behaviour
+        # stays consistent with the single-call variant.
+        try:
+            from .interceptor import SINInterceptor
+            policy = SINInterceptor(repo_root=self.repo_root).preflight(tool_name, tool_input)
+            result["policy_ok"] = policy.get("allowed", True)
+            result["violations"] = policy.get("violations", [])
+            if not result["policy_ok"]:
+                result["allowed"] = False
+                result["estimated_risk"] = "high"
+        except Exception as exc:
+            result["details"]["policy_error"] = str(exc)
+        # ── 2. Docs check (codocs) ───────────────────────────────────────
+        # Surfaces broken .doc.md references; non-fatal but raises risk.
+        try:
+            from . import codocs
+            broken = codocs.find_broken(str(self.repo_root))
+            result["docs_ok"] = not bool(broken)
+            if not result["docs_ok"]:
+                result["details"]["broken_docs"] = [b.to_dict() for b in broken]
+        except Exception as exc:
+            result["details"]["docs_error"] = str(exc)
+        # ── 3. Git status ────────────────────────────────────────────────
+        # Skipped silently if the directory is not a git repository.
+        try:
+            if (self.repo_root / ".git").exists():
+                proc = subprocess.run(
+                    ["git", "status", "--porcelain"],
+                    cwd=self.repo_root,
+                    capture_output=True,
+                    text=True,
+                    timeout=5,
+                )
+                if proc.returncode == 0:
+                    changes = proc.stdout.strip()
+                    result["git_clean"] = not bool(changes)
+                    if changes:
+                        result["details"]["git_changes_count"] = len(changes.split("\n"))
+                else:
+                    result["git_clean"] = False
+                    result["details"]["git_error"] = proc.stderr[-500:]
+        except subprocess.TimeoutExpired:
+            result["details"]["git_error"] = "git status timeout"
+        except FileNotFoundError:
+            result["details"]["git_error"] = "git not installed"
+        except Exception as exc:
+            result["details"]["git_error"] = str(exc)
+        # ── 4. Test collection (pytest --collect-only) ───────────────────
+        # Only runs when a tests/ or test/ directory exists AND pytest is
+        # importable. Collection (not execution) keeps the pre-flight cheap.
+        try:
+            has_tests = (self.repo_root / "tests").exists() or (self.repo_root / "test").exists()
+            if has_tests:
+                proc = subprocess.run(
+                    ["python3", "-m", "pytest", "--collect-only", "-q"],
+                    cwd=self.repo_root,
+                    capture_output=True,
+                    text=True,
+                    timeout=15,
+                )
+                if proc.returncode == 0:
+                    result["tests_status"] = "pass"
+                    # Capture the "N tests collected" summary line for context.
+                    for line in proc.stdout.split("\n"):
+                        if "tests collected" in line.lower():
+                            result["details"]["tests_collected"] = line.strip()
+                            break
+                else:
+                    result["tests_status"] = "fail"
+                    result["details"]["test_errors"] = proc.stderr[-500:]
+        except subprocess.TimeoutExpired:
+            result["tests_status"] = "timeout"
+        except FileNotFoundError:
+            # pytest not installed — non-fatal, leave status as "unknown".
+            result["tests_status"] = "skipped"
+        except Exception as exc:
+            result["details"]["tests_error"] = str(exc)
+        # ── 5. Risk estimation ───────────────────────────────────────────
+        # 5 independent signals; 0 → low, 1-2 → medium, 3+ → high + block.
+        risk_signals = sum(
+            [
+                not result["policy_ok"],
+                not result["docs_ok"],
+                not result["git_clean"],
+                result["tests_status"] == "fail",
+                len(result["violations"]) > 0,
+            ]
+        )
+        if risk_signals == 0:
+            result["estimated_risk"] = "low"
+        elif risk_signals <= 2:
+            result["estimated_risk"] = "medium"
+        else:
+            result["estimated_risk"] = "high"
+            result["allowed"] = False
+        return result