PyPI - buildlog - Versions diffs - 0.6.1__py3-none-any.whl → 0.8.0__py3-none-any.whl - Mend

buildlog 0.6.1__py3-none-any.whl → 0.8.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (40) hide show

buildlog/__init__.py +1 -1
buildlog/cli.py +589 -44
buildlog/confidence.py +27 -0
buildlog/core/__init__.py +12 -0
buildlog/core/bandit.py +699 -0
buildlog/core/operations.py +499 -11
buildlog/distill.py +80 -1
buildlog/engine/__init__.py +61 -0
buildlog/engine/bandit.py +23 -0
buildlog/engine/confidence.py +28 -0
buildlog/engine/embeddings.py +28 -0
buildlog/engine/experiments.py +619 -0
buildlog/engine/types.py +31 -0
buildlog/llm.py +461 -0
buildlog/mcp/server.py +12 -6
buildlog/mcp/tools.py +166 -13
buildlog/render/__init__.py +19 -2
buildlog/render/claude_md.py +74 -26
buildlog/render/continue_dev.py +102 -0
buildlog/render/copilot.py +100 -0
buildlog/render/cursor.py +105 -0
buildlog/render/tracking.py +20 -1
buildlog/render/windsurf.py +95 -0
buildlog/seeds.py +41 -0
buildlog/skills.py +69 -6
{buildlog-0.6.1.data → buildlog-0.8.0.data}/data/share/buildlog/copier.yml +0 -4
buildlog-0.8.0.data/data/share/buildlog/template/buildlog/_TEMPLATE_QUICK.md +21 -0
buildlog-0.8.0.dist-info/METADATA +151 -0
buildlog-0.8.0.dist-info/RECORD +54 -0
buildlog-0.6.1.dist-info/METADATA +0 -490
buildlog-0.6.1.dist-info/RECORD +0 -41
{buildlog-0.6.1.data → buildlog-0.8.0.data}/data/share/buildlog/post_gen.py +0 -0
{buildlog-0.6.1.data → buildlog-0.8.0.data}/data/share/buildlog/template/buildlog/.gitkeep +0 -0
{buildlog-0.6.1.data → buildlog-0.8.0.data}/data/share/buildlog/template/buildlog/2026-01-01-example.md +0 -0
{buildlog-0.6.1.data → buildlog-0.8.0.data}/data/share/buildlog/template/buildlog/BUILDLOG_SYSTEM.md +0 -0
{buildlog-0.6.1.data → buildlog-0.8.0.data}/data/share/buildlog/template/buildlog/_TEMPLATE.md +0 -0
{buildlog-0.6.1.data → buildlog-0.8.0.data}/data/share/buildlog/template/buildlog/assets/.gitkeep +0 -0
{buildlog-0.6.1.dist-info → buildlog-0.8.0.dist-info}/WHEEL +0 -0
{buildlog-0.6.1.dist-info → buildlog-0.8.0.dist-info}/entry_points.txt +0 -0
{buildlog-0.6.1.dist-info → buildlog-0.8.0.dist-info}/licenses/LICENSE +0 -0

buildlog/core/operations.py CHANGED Viewed

@@ -14,6 +14,7 @@ from pathlib import Path
 from typing import Literal, TypedDict
 from buildlog.confidence import ConfidenceMetrics, merge_confidence_metrics
+from buildlog.core.bandit import ThompsonSamplingBandit
 from buildlog.render import get_renderer
 from buildlog.skills import Skill, SkillSet, generate_skills
@@ -35,6 +36,9 @@ __all__ = [
     "StartSessionResult",
     "EndSessionResult",
     "LogMistakeResult",
+    # Gauntlet loop
+    "GauntletLoopResult",
+    "GauntletAcceptRiskResult",
     "status",
     "promote",
     "reject",
@@ -49,6 +53,10 @@ __all__ = [
     "log_mistake",
     "get_session_metrics",
     "get_experiment_report",
+    "get_bandit_status",
+    # Gauntlet loop operations
+    "gauntlet_process_issues",
+    "gauntlet_accept_risk",
 ]
@@ -552,7 +560,7 @@ def status(
 def promote(
     buildlog_dir: Path,
     skill_ids: list[str],
-    target: Literal["claude_md", "settings_json", "skill"] = "claude_md",
+    target: str = "claude_md",
     target_path: Path | None = None,
 ) -> PromoteResult:
     """Promote skills to agent rules.
@@ -560,7 +568,8 @@ def promote(
     Args:
         buildlog_dir: Path to buildlog directory.
         skill_ids: List of skill IDs to promote.
-        target: Where to write rules ("claude_md", "settings_json", or "skill").
+        target: Where to write rules. One of: claude_md, settings_json,
+            skill, cursor, copilot, windsurf, continue_dev.
         target_path: Optional custom path for the target file.
     Returns:
@@ -932,14 +941,27 @@ def log_reward(
 ) -> LogRewardResult:
     """Log a reward event for bandit learning.
-    Appends to reward_events.jsonl for later analysis.
+    This is where the bandit learns from EXPLICIT feedback:
+    The reward signal comes from the outcome:
+        - accepted (reward=1.0): Rules helped produce good output
+        - rejected (reward=0.0): Rules failed to prevent bad output
+        - revision (reward=1-distance): Partial credit based on correction needed
+    Unlike log_mistake() which gives implicit negative feedback, this allows
+    direct positive feedback when rules DO help. This is crucial for learning
+    which rules are genuinely effective, not just which ones don't fail.
+    Appends to reward_events.jsonl for analysis AND updates the bandit.
     Args:
         buildlog_dir: Path to buildlog directory.
         outcome: Type of feedback (accepted/revision/rejected).
         rules_active: List of rule IDs that were in context.
+                     If None, tries to use session's selected_rules.
         revision_distance: How much correction was needed (0-1, for revisions).
         error_class: Category of error if applicable.
+                    If None, tries to use session's error_class.
         notes: Optional notes about the feedback.
         source: Where this feedback came from.
@@ -950,6 +972,15 @@ def log_reward(
     reward_id = _generate_reward_id(outcome, now)
     reward_value = _compute_reward_value(outcome, revision_distance)
+    # Try to get rules and context from active session if not provided
+    active_path = _get_active_session_path(buildlog_dir)
+    if active_path.exists():
+        session_data = json.loads(active_path.read_text())
+        if rules_active is None:
+            rules_active = session_data.get("selected_rules", [])
+        if error_class is None:
+            error_class = session_data.get("error_class")
     event = RewardEvent(
         id=reward_id,
         timestamp=now,
@@ -969,6 +1000,32 @@ def log_reward(
     with open(rewards_path, "a") as f:
         f.write(json.dumps(event.to_dict()) + "\n")
+    # =========================================================================
+    # BANDIT LEARNING: Update with explicit reward
+    # =========================================================================
+    #
+    # For accepted (reward=1): Beta(α, β) → Beta(α + 1, β)
+    #   → Distribution shifts RIGHT, increasing expected value
+    #   → Rule becomes MORE likely to be selected
+    #
+    # For rejected (reward=0): Beta(α, β) → Beta(α, β + 1)
+    #   → Distribution shifts LEFT, decreasing expected value
+    #   → Rule becomes LESS likely to be selected
+    #
+    # For revision (0 < reward < 1): Both α and β increase proportionally
+    #   → Distribution narrows (more confident) with moderate expected value
+    # =========================================================================
+    if rules_active:
+        bandit_path = buildlog_dir / "bandit_state.jsonl"
+        bandit = ThompsonSamplingBandit(bandit_path)
+        bandit.batch_update(
+            rule_ids=rules_active,
+            reward=reward_value,
+            context=error_class or "general",
+        )
     # Count total events
     total_events = 0
     if rewards_path.exists():
@@ -976,11 +1033,16 @@ def log_reward(
             1 for line in rewards_path.read_text().strip().split("\n") if line
         )
+    rules_count = len(rules_active) if rules_active else 0
+    message = f"Logged {outcome} (reward={reward_value:.2f})"
+    if rules_count > 0:
+        message += f" | Updated bandit: {rules_count} rules"
     return LogRewardResult(
         reward_id=reward_id,
         reward_value=reward_value,
         total_events=total_events,
-        message=f"Logged {outcome} (reward={reward_value:.2f})",
+        message=message,
     )
@@ -1055,6 +1117,7 @@ class SessionDict(TypedDict, total=False):
     entry_file: str | None
     rules_at_start: list[str]
     rules_at_end: list[str]
+    selected_rules: list[str]  # Bandit-selected subset for this session
     error_class: str | None
     notes: str | None
@@ -1064,15 +1127,17 @@ class Session:
     """A coding session for experiment tracking.
     Tracks the state of rules before and after a session to measure
-    learning effectiveness.
+    learning effectiveness. The bandit selects a subset of rules
+    (selected_rules) to be "active" for this session based on context.
     Attributes:
         id: Unique identifier for this session.
         started_at: When the session started.
         ended_at: When the session ended (None if still active).
         entry_file: Corresponding buildlog entry file, if any.
-        rules_at_start: Rule IDs active at session start.
-        rules_at_end: Rule IDs active at session end.
+        rules_at_start: All rule IDs available at session start.
+        rules_at_end: All rule IDs available at session end.
+        selected_rules: Bandit-selected subset active for this session.
         error_class: Error class being targeted (e.g., "missing_test").
         notes: Optional notes about the session.
     """
@@ -1083,6 +1148,7 @@ class Session:
     entry_file: str | None = None
     rules_at_start: list[str] = field(default_factory=list)
     rules_at_end: list[str] = field(default_factory=list)
+    selected_rules: list[str] = field(default_factory=list)
     error_class: str | None = None
     notes: str | None = None
@@ -1095,6 +1161,8 @@ class Session:
             "rules_at_start": self.rules_at_start,
             "rules_at_end": self.rules_at_end,
         }
+        if self.selected_rules:
+            result["selected_rules"] = self.selected_rules
         if self.entry_file is not None:
             result["entry_file"] = self.entry_file
         if self.error_class is not None:
@@ -1124,6 +1192,7 @@ class Session:
             entry_file=data.get("entry_file"),
             rules_at_start=data.get("rules_at_start", []),
             rules_at_end=data.get("rules_at_end", []),
+            selected_rules=data.get("selected_rules", []),
             error_class=data.get("error_class"),
             notes=data.get("notes"),
         )
@@ -1227,11 +1296,15 @@ class SessionMetrics:
 @dataclass
 class StartSessionResult:
-    """Result of starting a new session."""
+    """Result of starting a new session.
+    Includes both the full rule set and the bandit-selected subset.
+    """
     session_id: str
     error_class: str | None
     rules_count: int
+    selected_rules: list[str]  # Bandit-selected rules for this session
     message: str
@@ -1310,6 +1383,31 @@ def _get_current_rules(buildlog_dir: Path) -> list[str]:
     return list(_load_json_set(promoted_path, "skill_ids"))
+def _get_seed_rule_ids(buildlog_dir: Path) -> set[str]:
+    """Collect the IDs of skills that carry persona tags.
+
+    A skill whose ``persona_tags`` is non-empty is treated as a seed rule
+    (one that comes from a gauntlet persona such as Test Terrorist or
+    Security Karen). These rules get boosted priors in the bandit because
+    they represent curated, expert knowledge.
+
+    Args:
+        buildlog_dir: Path to buildlog directory.
+
+    Returns:
+        Set of rule IDs that have persona_tags. An empty set is returned
+        when generating or walking the skill set raises.
+    """
+    try:
+        skill_groups = generate_skills(buildlog_dir).skills.values()
+        return {
+            candidate.id
+            for group in skill_groups
+            for candidate in group
+            if candidate.persona_tags  # non-empty means it came from a seed
+        }
+    except Exception:
+        # Best-effort lookup: if skill generation fails, treat no rules as seeds
+        return set()
 def _load_sessions(buildlog_dir: Path) -> list[Session]:
     """Load all sessions from JSONL file."""
     sessions_path = _get_sessions_path(buildlog_dir)
@@ -1383,25 +1481,78 @@ def start_session(
     buildlog_dir: Path,
     error_class: str | None = None,
     notes: str | None = None,
+    select_k: int = 3,
 ) -> StartSessionResult:
-    """Start a new experiment session.
+    """Start a new experiment session with bandit-selected rules.
+    This is where Thompson Sampling kicks in:
+    1. Load all available rules (candidates)
+    2. Identify which rules are from seeds (get boosted priors)
+    3. Use bandit to select top-k rules for this error_class context
+    4. Store selected rules in session for later attribution
+    The selected rules are the ones "active" for this session. When a
+    mistake occurs, we'll give negative feedback to these rules (they
+    didn't prevent the mistake). This teaches the bandit which rules
+    are effective for which error classes.
     Args:
         buildlog_dir: Path to buildlog directory.
         error_class: Error class being targeted (e.g., "missing_test").
+                    This is the CONTEXT for contextual bandits - rules
+                    are evaluated per-context.
         notes: Optional notes about the session.
+        select_k: Number of rules to select via Thompson Sampling.
+                 Default 3 balances coverage with attribution clarity.
     Returns:
-        StartSessionResult with session ID and current rules count.
+        StartSessionResult with session ID, rules count, and selected rules.
     """
     now = datetime.now(timezone.utc)
     session_id = _generate_session_id(now)
     current_rules = _get_current_rules(buildlog_dir)
+    # =========================================================================
+    # THOMPSON SAMPLING: Select rules for this session
+    # =========================================================================
+    #
+    # The bandit maintains a Beta distribution for each (context, rule) pair.
+    # At session start, we SAMPLE from each distribution and pick the top-k.
+    #
+    # Why sample instead of using the mean?
+    #   - Arms we're uncertain about have high variance
+    #   - High variance means occasional high samples
+    #   - This causes us to explore uncertain arms
+    #   - As we gather data, variance shrinks, and we exploit
+    #
+    # This is the elegant explore-exploit balance of Thompson Sampling.
+    # =========================================================================
+    selected_rules: list[str] = []
+    if current_rules:
+        # Initialize bandit
+        bandit_path = buildlog_dir / "bandit_state.jsonl"
+        bandit = ThompsonSamplingBandit(bandit_path)
+        # Identify seed rules (those with persona_tags from gauntlet)
+        # Seeds get boosted priors - we believe curated rules are good
+        seed_rule_ids = _get_seed_rule_ids(buildlog_dir)
+        # SELECT: Sample from Beta distributions, pick top-k
+        selected_rules = bandit.select(
+            candidates=current_rules,
+            context=error_class or "general",
+            k=min(select_k, len(current_rules)),
+            seed_rule_ids=seed_rule_ids,
+        )
     session = Session(
         id=session_id,
         started_at=now,
         rules_at_start=current_rules,
+        selected_rules=selected_rules,
         error_class=error_class,
         notes=notes,
     )
@@ -1415,7 +1566,11 @@ def start_session(
         session_id=session_id,
         error_class=error_class,
         rules_count=len(current_rules),
-        message=f"Started session {session_id} with {len(current_rules)} active rules",
+        selected_rules=selected_rules,
+        message=(
+            f"Started session {session_id}: selected {len(selected_rules)}/"
+            f"{len(current_rules)} rules via Thompson Sampling"
+        ),
     )
@@ -1487,6 +1642,16 @@ def log_mistake(
 ) -> LogMistakeResult:
     """Log a mistake during an experiment session.
+    This is where the bandit learns from NEGATIVE feedback:
+    When a mistake occurs, the selected rules for this session FAILED
+    to prevent it. We update the bandit with reward=0 for each selected
+    rule, teaching it that these rules aren't effective for this context.
+    Over time, rules that consistently fail to prevent mistakes will
+    have their Beta distributions shift left (lower expected value),
+    and the bandit will stop selecting them.
     Args:
         buildlog_dir: Path to buildlog directory.
         error_class: Category of error (e.g., "missing_test").
@@ -1533,9 +1698,39 @@ def log_mistake(
     with open(mistakes_path, "a") as f:
         f.write(json.dumps(mistake.to_dict()) + "\n")
+    # =========================================================================
+    # BANDIT LEARNING: Negative feedback for selected rules
+    # =========================================================================
+    #
+    # The selected rules were supposed to help prevent mistakes. A mistake
+    # occurred anyway, so we give them reward=0 (failure).
+    #
+    # Bayesian update: Beta(α, β) → Beta(α + 0, β + 1) = Beta(α, β + 1)
+    #
+    # This shifts the distribution LEFT, decreasing the expected value.
+    # Rules that repeatedly fail will become less likely to be selected.
+    # =========================================================================
+    selected_rules = session_data.get("selected_rules", [])
+    if selected_rules:
+        bandit_path = buildlog_dir / "bandit_state.jsonl"
+        bandit = ThompsonSamplingBandit(bandit_path)
+        # Use session's error_class as context, not the mistake's
+        # (they should match, but session context is authoritative)
+        context = session_data.get("error_class") or "general"
+        bandit.batch_update(
+            rule_ids=selected_rules,
+            reward=0.0,  # Failure: rules didn't prevent mistake
+            context=context,
+        )
     message = f"Logged mistake: {error_class}"
     if similar:
         message += f" (REPEAT of {similar.id})"
+    if selected_rules:
+        message += f" | Updated bandit: {len(selected_rules)} rules got reward=0"
     return LogMistakeResult(
         mistake_id=mistake_id,
@@ -1652,3 +1847,296 @@ def get_experiment_report(buildlog_dir: Path) -> dict:
         "sessions": session_metrics,
         "error_classes": error_classes,
     }
+def get_bandit_status(
+    buildlog_dir: Path,
+    context: str | None = None,
+    top_k: int = 10,
+) -> dict:
+    """Get current bandit state and statistics.
+
+    Provides insight into the Thompson Sampling bandit's learned beliefs.
+    Useful for debugging and understanding which rules are being favored.
+
+    Args:
+        buildlog_dir: Path to buildlog directory.
+        context: Specific error class to show. Passed straight to
+            ``bandit.get_stats``; if None, stats are requested without a
+            context filter.
+        top_k: Number of top rules to show per context. Values below zero
+            are treated as zero instead of slicing from the end.
+
+    Returns:
+        Dictionary with:
+            - summary: total_contexts, total_arms, total_observations and
+              the state_file path
+            - top_rules: Per context, up to ``top_k`` rules ordered by
+              "mean" (descending)
+            - all_rules: Every rule grouped by context when ``context`` is
+              given, otherwise None
+    """
+    bandit_path = buildlog_dir / "bandit_state.jsonl"
+    bandit = ThompsonSamplingBandit(bandit_path)
+    stats = bandit.get_stats(context)
+
+    # Group stats by context
+    contexts: dict[str, list[dict]] = {}
+    for key, rule_stats in stats.items():
+        ctx = rule_stats["context"]
+        # NOTE(review): keys look like "<context>:<rule_id>" - confirm against
+        # ThompsonSamplingBandit.get_stats. Stripping the known context prefix
+        # keeps rule IDs that themselves contain ":" intact; otherwise fall
+        # back to the last ":"-separated segment.
+        prefix = f"{ctx}:"
+        if key.startswith(prefix):
+            rule_id = key[len(prefix) :]
+        elif ":" in key:
+            rule_id = key.split(":")[-1]
+        else:
+            rule_id = key
+        entry: dict = {"rule_id": rule_id}
+        # Stats fields are applied after rule_id, so a "rule_id" field in the
+        # stats still takes precedence.
+        entry.update((k, v) for k, v in rule_stats.items() if k != "context")
+        contexts.setdefault(ctx, []).append(entry)
+
+    # Sort by mean (descending) and take top_k
+    limit = max(top_k, 0)
+    top_rules: dict[str, list[dict]] = {
+        ctx: sorted(rules, key=lambda x: x["mean"], reverse=True)[:limit]
+        for ctx, rules in contexts.items()
+    }
+
+    # Summary stats
+    total_arms = sum(len(rules) for rules in contexts.values())
+    total_observations = sum(
+        rule.get("total_observations", 0)
+        for rules in contexts.values()
+        for rule in rules
+    )
+
+    return {
+        "summary": {
+            "total_contexts": len(contexts),
+            "total_arms": total_arms,
+            "total_observations": total_observations,
+            "state_file": str(bandit_path),
+        },
+        "top_rules": top_rules,
+        "all_rules": contexts if context else None,  # Only include all if filtering
+    }
+# =============================================================================
+# Gauntlet Loop Operations
+# =============================================================================
+@dataclass
+class GauntletLoopResult:
+    """Result of processing gauntlet issues.
+
+    Attributes:
+        action: What to do next:
+            - "fix_criticals": Criticals remain, auto-fix and loop
+            - "checkpoint_majors": No criticals, but majors remain (HITL)
+            - "checkpoint_minors": Only minors remain (HITL)
+            - "clean": No issues remain
+        criticals: List of critical severity issues
+        majors: List of major severity issues
+        minors: List of minor/nitpick severity issues
+        iteration: Current iteration number
+        learnings_persisted: Number of learnings persisted this iteration
+        message: Human-readable summary
+    """
+
+    # Next step for the loop; restricted to the four values listed above.
+    action: Literal["fix_criticals", "checkpoint_majors", "checkpoint_minors", "clean"]
+    # Issue dicts bucketed by their "severity" value.
+    criticals: list[dict]
+    majors: list[dict]
+    minors: list[dict]
+    iteration: int
+    # Count of new plus reinforced learnings reported for this iteration.
+    learnings_persisted: int
+    message: str
+@dataclass
+class GauntletAcceptRiskResult:
+    """Result of accepting risk with remaining issues.
+
+    Attributes:
+        accepted_issues: Number of issues accepted as risk
+        github_issues_created: Number of GitHub issues created (if enabled)
+        github_issue_urls: URLs of created GitHub issues
+        message: Human-readable summary
+        error: Error message if operation failed
+    """
+
+    accepted_issues: int
+    github_issues_created: int
+    github_issue_urls: list[str]
+    message: str
+    # Only field with a default, so it must stay last; None means no failure
+    # was recorded.
+    error: str | None = None
+def gauntlet_process_issues(
+    buildlog_dir: Path,
+    issues: list[dict],
+    iteration: int = 1,
+    source: str | None = None,
+) -> GauntletLoopResult:
+    """Process gauntlet issues and determine next action.
+
+    Categorizes issues by severity, persists learnings, and returns
+    the appropriate next action for the gauntlet loop.
+
+    Severity matching ignores case and surrounding whitespace. Every issue
+    lands in exactly one bucket: "critical", "major", or - for "minor",
+    "nitpick", a missing severity, or any unrecognised value - the minors
+    bucket. This guarantees the loop never reports "clean" while issues
+    with an unexpected severity label are still outstanding.
+
+    Args:
+        buildlog_dir: Path to buildlog directory.
+        issues: List of issues from the gauntlet review.
+        iteration: Current iteration number (for tracking).
+        source: Optional source identifier for learnings. Defaults to
+            "gauntlet:iteration-<iteration>".
+
+    Returns:
+        GauntletLoopResult with categorized issues and next action.
+    """
+    # Categorize by severity (single pass, every issue is kept)
+    criticals: list[dict] = []
+    majors: list[dict] = []
+    minors: list[dict] = []
+    for issue in issues:
+        raw_severity = issue.get("severity")
+        severity = (
+            raw_severity.strip().lower()
+            if isinstance(raw_severity, str)
+            else raw_severity
+        )
+        if severity == "critical":
+            criticals.append(issue)
+        elif severity == "major":
+            majors.append(issue)
+        else:
+            # minor, nitpick, missing, or unknown: surface for human review
+            # rather than silently dropping the issue.
+            minors.append(issue)
+
+    # Persist learnings for this iteration
+    learn_source = source or f"gauntlet:iteration-{iteration}"
+    learn_result = learn_from_review(buildlog_dir, issues, learn_source)
+    learnings_persisted = len(learn_result.new_learnings) + len(
+        learn_result.reinforced_learnings
+    )
+
+    # Determine action: the most severe non-empty bucket wins
+    if criticals:
+        action: Literal[
+            "fix_criticals", "checkpoint_majors", "checkpoint_minors", "clean"
+        ] = "fix_criticals"
+        message = (
+            f"Iteration {iteration}: {len(criticals)} critical, "
+            f"{len(majors)} major, {len(minors)} minor. "
+            f"Fix criticals (and majors) then re-run."
+        )
+    elif majors:
+        action = "checkpoint_majors"
+        message = (
+            f"Iteration {iteration}: No criticals! "
+            f"{len(majors)} major, {len(minors)} minor remain. "
+            f"Continue clearing majors?"
+        )
+    elif minors:
+        action = "checkpoint_minors"
+        message = (
+            f"Iteration {iteration}: Only {len(minors)} minor issues remain. "
+            f"Accept risk or continue?"
+        )
+    else:
+        action = "clean"
+        message = f"Iteration {iteration}: All clear! No issues found."
+
+    return GauntletLoopResult(
+        action=action,
+        criticals=criticals,
+        majors=majors,
+        minors=minors,
+        iteration=iteration,
+        learnings_persisted=learnings_persisted,
+        message=message,
+    )
+def gauntlet_accept_risk(
+    remaining_issues: list[dict],
+    create_github_issues: bool = False,
+    repo: str | None = None,
+) -> GauntletAcceptRiskResult:
+    """Accept risk for remaining issues, optionally creating GitHub issues.
+
+    When ``create_github_issues`` is true, one ``gh issue create`` call is
+    made per issue. A failing call does not abort the run: its stderr is
+    collected and reported in ``error``. If the ``gh`` executable is
+    missing, processing stops at the first issue.
+
+    Args:
+        remaining_issues: Issues being accepted as risk.
+        create_github_issues: Whether to create GitHub issues for tracking.
+        repo: Repository for GitHub issues (uses current repo if None).
+
+    Returns:
+        GauntletAcceptRiskResult with created issue info.
+    """
+    import subprocess
+
+    def _sanitize_for_gh(text: str, max_len: int = 256) -> str:
+        """Flatten line breaks and truncate text for GitHub issue fields."""
+        # Note: We use list args (not shell=True), so this is defense-in-depth
+        sanitized = text.replace("\n", " ").replace("\r", " ")
+        if len(sanitized) > max_len:
+            sanitized = sanitized[: max_len - 3] + "..."
+        return sanitized.strip()
+
+    github_urls: list[str] = []
+    failures: list[str] = []
+    error: str | None = None
+
+    if create_github_issues and remaining_issues:
+        for issue in remaining_issues:
+            # "or" fallbacks also cover keys that are present but None/empty,
+            # which would otherwise render as the literal text "None".
+            severity = issue.get("severity") or "minor"
+            rule = issue.get("rule_learned") or issue.get("description") or "Unknown"
+            description = issue.get("description") or ""
+            location = issue.get("location") or ""
+
+            safe_severity = _sanitize_for_gh(str(severity), 20) or "minor"
+            safe_rule = _sanitize_for_gh(str(rule), 200)
+            safe_description = _sanitize_for_gh(str(description), 1000)
+            safe_location = _sanitize_for_gh(str(location), 100)
+
+            # Build issue body
+            body_parts = [
+                f"**Severity:** {safe_severity}",
+                f"**Rule:** {safe_rule}",
+                "",
+                "## Description",
+                safe_description,
+            ]
+            if safe_location:
+                body_parts.extend(["", f"**Location:** `{safe_location}`"])
+            body_parts.extend(
+                [
+                    "",
+                    "---",
+                    "_Created by buildlog gauntlet loop (accepted risk)_",
+                ]
+            )
+            body = "\n".join(body_parts)
+            title = f"[Gauntlet/{safe_severity}] {safe_rule[:60]}"
+
+            # Create GitHub issue. The label uses the sanitized string: the
+            # raw value may be a non-string or contain line breaks.
+            cmd = [
+                "gh",
+                "issue",
+                "create",
+                "--title",
+                title,
+                "--body",
+                body,
+                "--label",
+                safe_severity,
+            ]
+            if repo:
+                cmd.extend(["--repo", repo])
+
+            try:
+                result = subprocess.run(cmd, capture_output=True, text=True, check=True)
+            except subprocess.CalledProcessError as e:
+                # Don't fail entirely; keep every distinct failure reason
+                detail = (e.stderr or "").strip()
+                if detail and detail not in failures:
+                    failures.append(detail)
+                error = "Failed to create some GitHub issues: " + "; ".join(failures)
+                continue
+            except FileNotFoundError:
+                # No point retrying the remaining issues without the CLI
+                error = "gh CLI not found. Install GitHub CLI to create issues."
+                break
+
+            # gh issue create outputs the URL
+            url = result.stdout.strip()
+            if url:
+                github_urls.append(url)
+
+    if create_github_issues:
+        message = (
+            f"Accepted {len(remaining_issues)} issues as risk. "
+            f"Created {len(github_urls)} GitHub issues."
+        )
+    else:
+        message = f"Accepted {len(remaining_issues)} issues as risk."
+
+    return GauntletAcceptRiskResult(
+        accepted_issues=len(remaining_issues),
+        github_issues_created=len(github_urls),
+        github_issue_urls=github_urls,
+        message=message,
+        error=error,
+    )

buildlog 0.6.1__py3-none-any.whl → 0.8.0__py3-none-any.whl

buildlog 0.6.1__py3-none-any.whl → 0.8.0__py3-none-any.whl