npm - shipwright-cli - Versions diffs - 3.0.0 → 3.2.0 - Mend

shipwright-cli 3.0.0 → 3.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (143) hide show

package/README.md +21 -7
package/completions/_shipwright +247 -93
package/completions/shipwright.bash +69 -15
package/completions/shipwright.fish +309 -41
package/config/decision-tiers.json +55 -0
package/config/defaults.json +25 -2
package/config/event-schema.json +142 -5
package/config/policy.json +8 -0
package/dashboard/public/index.html +6 -0
package/dashboard/public/styles.css +76 -0
package/dashboard/server.ts +51 -0
package/dashboard/src/core/api.ts +5 -0
package/dashboard/src/types/api.ts +10 -0
package/dashboard/src/views/metrics.ts +69 -1
package/package.json +3 -3
package/scripts/lib/architecture.sh +2 -1
package/scripts/lib/bootstrap.sh +0 -0
package/scripts/lib/config.sh +0 -0
package/scripts/lib/daemon-adaptive.sh +4 -2
package/scripts/lib/daemon-dispatch.sh +24 -1
package/scripts/lib/daemon-failure.sh +0 -0
package/scripts/lib/daemon-health.sh +0 -0
package/scripts/lib/daemon-patrol.sh +42 -7
package/scripts/lib/daemon-poll.sh +17 -0
package/scripts/lib/daemon-state.sh +17 -0
package/scripts/lib/daemon-triage.sh +1 -1
package/scripts/lib/decide-autonomy.sh +295 -0
package/scripts/lib/decide-scoring.sh +228 -0
package/scripts/lib/decide-signals.sh +462 -0
package/scripts/lib/fleet-failover.sh +0 -0
package/scripts/lib/helpers.sh +19 -18
package/scripts/lib/pipeline-detection.sh +1 -1
package/scripts/lib/pipeline-github.sh +0 -0
package/scripts/lib/pipeline-intelligence.sh +23 -4
package/scripts/lib/pipeline-quality-checks.sh +11 -6
package/scripts/lib/pipeline-quality.sh +0 -0
package/scripts/lib/pipeline-stages.sh +330 -33
package/scripts/lib/pipeline-state.sh +14 -0
package/scripts/lib/policy.sh +0 -0
package/scripts/lib/test-helpers.sh +0 -0
package/scripts/postinstall.mjs +75 -1
package/scripts/signals/example-collector.sh +36 -0
package/scripts/sw +8 -4
package/scripts/sw-activity.sh +1 -7
package/scripts/sw-adaptive.sh +7 -7
package/scripts/sw-adversarial.sh +1 -1
package/scripts/sw-architecture-enforcer.sh +1 -1
package/scripts/sw-auth.sh +1 -1
package/scripts/sw-autonomous.sh +1 -1
package/scripts/sw-changelog.sh +1 -1
package/scripts/sw-checkpoint.sh +1 -1
package/scripts/sw-ci.sh +11 -6
package/scripts/sw-cleanup.sh +1 -1
package/scripts/sw-code-review.sh +36 -17
package/scripts/sw-connect.sh +1 -1
package/scripts/sw-context.sh +1 -1
package/scripts/sw-cost.sh +71 -5
package/scripts/sw-daemon.sh +6 -3
package/scripts/sw-dashboard.sh +1 -1
package/scripts/sw-db.sh +53 -38
package/scripts/sw-decide.sh +685 -0
package/scripts/sw-decompose.sh +1 -1
package/scripts/sw-deps.sh +1 -1
package/scripts/sw-developer-simulation.sh +1 -1
package/scripts/sw-discovery.sh +80 -4
package/scripts/sw-doc-fleet.sh +1 -1
package/scripts/sw-docs-agent.sh +1 -1
package/scripts/sw-docs.sh +1 -1
package/scripts/sw-doctor.sh +1 -1
package/scripts/sw-dora.sh +1 -1
package/scripts/sw-durable.sh +9 -5
package/scripts/sw-e2e-orchestrator.sh +1 -1
package/scripts/sw-eventbus.sh +7 -4
package/scripts/sw-evidence.sh +1 -1
package/scripts/sw-feedback.sh +1 -1
package/scripts/sw-fix.sh +1 -1
package/scripts/sw-fleet-discover.sh +1 -1
package/scripts/sw-fleet-viz.sh +6 -4
package/scripts/sw-fleet.sh +1 -1
package/scripts/sw-github-app.sh +3 -2
package/scripts/sw-github-checks.sh +1 -1
package/scripts/sw-github-deploy.sh +1 -1
package/scripts/sw-github-graphql.sh +1 -1
package/scripts/sw-guild.sh +1 -1
package/scripts/sw-heartbeat.sh +1 -1
package/scripts/sw-hygiene.sh +5 -3
package/scripts/sw-incident.sh +9 -5
package/scripts/sw-init.sh +1 -1
package/scripts/sw-instrument.sh +1 -1
package/scripts/sw-intelligence.sh +11 -6
package/scripts/sw-jira.sh +1 -1
package/scripts/sw-launchd.sh +1 -1
package/scripts/sw-linear.sh +1 -1
package/scripts/sw-logs.sh +1 -1
package/scripts/sw-loop.sh +338 -32
package/scripts/sw-memory.sh +23 -6
package/scripts/sw-mission-control.sh +1 -1
package/scripts/sw-model-router.sh +3 -2
package/scripts/sw-otel.sh +8 -4
package/scripts/sw-oversight.sh +1 -1
package/scripts/sw-pipeline-composer.sh +3 -1
package/scripts/sw-pipeline-vitals.sh +11 -6
package/scripts/sw-pipeline.sh +92 -8
package/scripts/sw-pm.sh +5 -4
package/scripts/sw-pr-lifecycle.sh +7 -4
package/scripts/sw-predictive.sh +11 -5
package/scripts/sw-prep.sh +1 -1
package/scripts/sw-ps.sh +1 -1
package/scripts/sw-public-dashboard.sh +3 -2
package/scripts/sw-quality.sh +21 -10
package/scripts/sw-reaper.sh +1 -1
package/scripts/sw-recruit.sh +1 -1
package/scripts/sw-regression.sh +1 -1
package/scripts/sw-release-manager.sh +1 -1
package/scripts/sw-release.sh +1 -1
package/scripts/sw-remote.sh +1 -1
package/scripts/sw-replay.sh +1 -1
package/scripts/sw-retro.sh +1 -1
package/scripts/sw-review-rerun.sh +1 -1
package/scripts/sw-scale.sh +69 -11
package/scripts/sw-security-audit.sh +1 -1
package/scripts/sw-self-optimize.sh +168 -4
package/scripts/sw-session.sh +3 -3
package/scripts/sw-setup.sh +1 -1
package/scripts/sw-standup.sh +1 -1
package/scripts/sw-status.sh +1 -1
package/scripts/sw-strategic.sh +11 -6
package/scripts/sw-stream.sh +7 -4
package/scripts/sw-swarm.sh +3 -2
package/scripts/sw-team-stages.sh +1 -1
package/scripts/sw-templates.sh +3 -3
package/scripts/sw-testgen.sh +11 -6
package/scripts/sw-tmux-pipeline.sh +1 -1
package/scripts/sw-tmux.sh +35 -1
package/scripts/sw-trace.sh +1 -1
package/scripts/sw-tracker.sh +1 -1
package/scripts/sw-triage.sh +7 -7
package/scripts/sw-upgrade.sh +1 -1
package/scripts/sw-ux.sh +1 -1
package/scripts/sw-webhook.sh +3 -2
package/scripts/sw-widgets.sh +7 -4
package/scripts/sw-worktree.sh +1 -1
package/scripts/update-homebrew-sha.sh +21 -15

package/scripts/lib/pipeline-stages.sh CHANGED Viewed

@@ -1,8 +1,125 @@
-# pipeline-stages.sh — Stage implementations (intake, plan, build, test, review, pr, merge, deploy, validate, monitor) for sw-pipeline.sh
+# pipeline-stages.sh — Stage implementations (intake, plan, build, test, review, compound_quality, pr, merge, deploy, validate, monitor) for sw-pipeline.sh
 # Source from sw-pipeline.sh. Requires all pipeline globals and state/github/detection/quality modules.
 [[ -n "${_PIPELINE_STAGES_LOADED:-}" ]] && return 0
 _PIPELINE_STAGES_LOADED=1
+# ─── Context pruning helpers ────────────────────────────────────────────────
+# prune_context_section — Intelligently truncate a context section to fit a char budget.
+#   $1: section name (for logging/markers)
+#   $2: content string
+#   $3: max_chars (default 5000)
+# For JSON content (starts with { or [): extracts summary fields via jq.
+# For text content: sandwich approach — keeps the first and last N lines, with N estimated from the average line length, so the output only approximates max_chars.
+# Outputs the (possibly truncated) content to stdout.
+prune_context_section() {
+    local section_name="${1:-section}"
+    local content="${2:-}"
+    local max_chars="${3:-5000}"
+    [[ -z "$content" ]] && return 0
+    local content_len=${#content}
+    if [[ "$content_len" -le "$max_chars" ]]; then
+        printf '%s' "$content"
+        return 0
+    fi
+    # JSON content — try jq summary extraction
+    local first_char="${content:0:1}"
+    if [[ "$first_char" == "{" || "$first_char" == "[" ]]; then
+        local summary=""
+        # Try extracting summary/results fields
+        summary=$(printf '%s' "$content" | jq -r '
+            if type == "object" then
+                to_entries | map(
+                    if (.value | type) == "array" then
+                        "\(.key): \(.value | length) items"
+                    elif (.value | type) == "object" then
+                        "\(.key): \(.value | keys | join(", "))"
+                    else
+                        "\(.key): \(.value)"
+                    end
+                ) | join("\n")
+            elif type == "array" then
+                .[:5] | map(tostring) | join("\n")
+            else . end
+        ' 2>/dev/null) || true
+        if [[ -n "$summary" && ${#summary} -le "$max_chars" ]]; then
+            printf '%s' "$summary"
+            return 0
+        fi
+        # jq failed or still too large — fall through to text truncation
+    fi
+    # Text content — sandwich approach (first N + last N lines)
+    local line_count=0
+    line_count=$(printf '%s\n' "$content" | wc -l | xargs)
+    # Calculate how many lines to keep from each end
+    # Approximate chars-per-line to figure out line budget
+    local avg_chars_per_line=80
+    if [[ "$line_count" -gt 0 ]]; then
+        avg_chars_per_line=$(( content_len / line_count ))
+        [[ "$avg_chars_per_line" -lt 20 ]] && avg_chars_per_line=20
+    fi
+    local total_lines_budget=$(( max_chars / avg_chars_per_line ))
+    [[ "$total_lines_budget" -lt 4 ]] && total_lines_budget=4
+    local half=$(( total_lines_budget / 2 ))
+    local head_part=""
+    local tail_part=""
+    head_part=$(printf '%s\n' "$content" | head -"$half")
+    tail_part=$(printf '%s\n' "$content" | tail -"$half")
+    printf '%s\n[... %s truncated: %d→%d chars ...]\n%s' \
+        "$head_part" "$section_name" "$content_len" "$max_chars" "$tail_part"
+}
+# guard_prompt_size — Warn and hard-truncate if prompt exceeds budget.
+#   $1: stage name (for logging)
+#   $2: prompt content
+#   $3: max_chars (default: $PIPELINE_PROMPT_BUDGET, which is 100000 unless overridden)
+# Outputs the (possibly truncated) prompt to stdout.
+PIPELINE_PROMPT_BUDGET="${PIPELINE_PROMPT_BUDGET:-100000}"
+guard_prompt_size() {
+    local stage_name="${1:-stage}"
+    local prompt="${2:-}"
+    local max_chars="${3:-$PIPELINE_PROMPT_BUDGET}"
+    local prompt_len=${#prompt}
+    if [[ "$prompt_len" -le "$max_chars" ]]; then
+        printf '%s' "$prompt"
+        return 0
+    fi
+    warn "${stage_name} prompt too large (${prompt_len} chars, budget ${max_chars}) — truncating"
+    emit_event "pipeline.prompt_truncated" \
+        "stage=$stage_name" \
+        "original=$prompt_len" \
+        "budget=$max_chars" 2>/dev/null || true
+    printf '%s\n\n... [CONTEXT TRUNCATED: %s prompt exceeded %d char budget. Focus on the goal and requirements.]' \
+        "${prompt:0:$max_chars}" "$stage_name" "$max_chars"
+}
+# ─── Safe git helpers ────────────────────────────────────────────────────────
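+# BASE_BRANCH may not exist locally (e.g. --local mode with no remote).
+# When it cannot be resolved, these helpers degrade gracefully instead of crashing
+# under set -euo pipefail: _safe_base_log emits only a blank line (which `wc -l`
+# still counts as one line), and _safe_base_diff falls back to `git diff HEAD~5`.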
+_safe_base_log() {
+    local branch="${BASE_BRANCH:-main}"
+    git rev-parse --verify "$branch" >/dev/null 2>&1 || { echo ""; return 0; }
+    git log "$@" "${branch}..HEAD" 2>/dev/null || true
+}
+_safe_base_diff() {
+    local branch="${BASE_BRANCH:-main}"
+    git rev-parse --verify "$branch" >/dev/null 2>&1 || { git diff HEAD~5 "$@" 2>/dev/null || true; return 0; }
+    git diff "${branch}...HEAD" "$@" 2>/dev/null || true
+}
 show_stage_preview() {
     local stage_id="$1"
     echo ""
@@ -15,6 +132,7 @@ show_stage_preview() {
         test_first) echo -e "  Generate tests from requirements (TDD mode) before implementation" ;;
         test)     echo -e "  Run test suite and check coverage" ;;
         review)   echo -e "  AI code review on the diff, post findings" ;;
+        compound_quality) echo -e "  Adversarial review, negative tests, e2e, DoD audit" ;;
         pr)       echo -e "  Create GitHub PR with labels, reviewers, milestone" ;;
         merge)    echo -e "  Wait for CI checks, merge PR, optionally delete branch" ;;
         deploy)   echo -e "  Deploy to staging/production with rollback" ;;
@@ -162,6 +280,7 @@ ${ISSUE_BODY}
     # Inject architecture context (import graph, modules, test map)
     if [[ -n "$arch_context" ]]; then
+        arch_context=$(prune_context_section "architecture" "$arch_context" 5000)
         plan_prompt="${plan_prompt}
 ## Architecture Context
 ${arch_context}
@@ -173,6 +292,7 @@ ${arch_context}
     if [[ -f "$_context_bundle" ]]; then
         local _cb_content
         _cb_content=$(cat "$_context_bundle" 2>/dev/null | head -100 || true)
+        _cb_content=$(prune_context_section "context-bundle" "$_cb_content" 8000)
         if [[ -n "$_cb_content" ]]; then
             plan_prompt="${plan_prompt}
 ## Pipeline Context
@@ -188,6 +308,7 @@ ${_cb_content}
         if [[ -n "$plan_memory" && "$plan_memory" != *'"results":[]'* && "$plan_memory" != *'"error"'* ]]; then
             local memory_summary
             memory_summary=$(echo "$plan_memory" | jq -r '.results[]? | "- \(.)"' 2>/dev/null | head -10 || true)
+            memory_summary=$(prune_context_section "memory" "$memory_summary" 10000)
             if [[ -n "$memory_summary" ]]; then
                 plan_prompt="${plan_prompt}
 ## Historical Context (from previous pipelines)
@@ -212,6 +333,7 @@ ${plan_hint}
     if [[ -x "$SCRIPT_DIR/sw-discovery.sh" ]]; then
         local plan_discoveries
         plan_discoveries=$("$SCRIPT_DIR/sw-discovery.sh" inject "*.md,*.json" 2>/dev/null | head -20 || true)
+        plan_discoveries=$(prune_context_section "discoveries" "$plan_discoveries" 3000)
         if [[ -n "$plan_discoveries" ]]; then
             plan_prompt="${plan_prompt}
 ## Discoveries from Other Pipelines
@@ -232,6 +354,7 @@ ${plan_discoveries}
             "Patterns: \((.patterns // []) | join(", "))",
             "Rules: \((.rules // []) | join("; "))"
         ' "$arch_file_plan" 2>/dev/null || true)
+        arch_patterns=$(prune_context_section "intelligence" "$arch_patterns" 5000)
         if [[ -n "$arch_patterns" ]]; then
             plan_prompt="${plan_prompt}
 ## Architecture Patterns
@@ -268,6 +391,12 @@ Focus on: threat modeling, OWASP top 10, input validation, authentication/author
 - Test command: ${TEST_CMD:-not configured}
 - Task type: ${TASK_TYPE:-feature}
+## Context Efficiency
+- Batch independent tool calls in parallel when possible
+- Read specific file sections (offset/limit) instead of entire large files
+- Use targeted grep searches — avoid scanning entire codebases into context
+- Delegate multi-file analysis to subagents when available
 ## Required Output
 Create a Markdown plan with these sections:
@@ -290,6 +419,9 @@ How to verify the implementation works.
 Checklist of completion criteria.
 "
+    # Guard total prompt size
+    plan_prompt=$(guard_prompt_size "plan" "$plan_prompt")
     local plan_model
     plan_model=$(jq -r --arg id "plan" '(.stages[] | select(.id == $id) | .config.model) // .defaults.model // "opus"' "$PIPELINE_CONFIG" 2>/dev/null) || true
     [[ -n "$MODEL" ]] && plan_model="$MODEL"
@@ -300,10 +432,22 @@ Checklist of completion criteria.
     fi
     local _token_log="${ARTIFACTS_DIR}/.claude-tokens-plan.log"
-    claude --print --model "$plan_model" --max-turns 25 \
+    claude --print --model "$plan_model" --max-turns 25 --dangerously-skip-permissions \
         "$plan_prompt" < /dev/null > "$plan_file" 2>"$_token_log" || true
     parse_claude_tokens "$_token_log"
+    # Claude may write to disk via tools instead of stdout — rescue those files
+    local _plan_rescue
+    for _plan_rescue in "${PROJECT_ROOT}/PLAN.md" "${PROJECT_ROOT}/plan.md" \
+                         "${PROJECT_ROOT}/implementation-plan.md"; do
+        if [[ -s "$_plan_rescue" ]] && [[ $(wc -l < "$plan_file" 2>/dev/null | xargs) -lt 10 ]]; then
+            info "Plan written to ${_plan_rescue} via tools — adopting as plan artifact"
+            cat "$_plan_rescue" >> "$plan_file"
+            rm -f "$_plan_rescue"
+            break
+        fi
+    done
     if [[ ! -s "$plan_file" ]]; then
         error "Plan generation failed — empty output"
         return 1
@@ -587,6 +731,7 @@ stage_design() {
     if type gather_architecture_context &>/dev/null; then
         arch_struct_context=$(gather_architecture_context "${PROJECT_ROOT:-.}" 2>/dev/null || true)
     fi
+    arch_struct_context=$(prune_context_section "architecture" "$arch_struct_context" 5000)
     # Memory integration — inject context if memory system available
     local memory_context=""
@@ -597,12 +742,14 @@ stage_design() {
     if [[ -z "$memory_context" ]] && [[ -x "$SCRIPT_DIR/sw-memory.sh" ]]; then
         memory_context=$(bash "$SCRIPT_DIR/sw-memory.sh" inject "design" 2>/dev/null) || true
     fi
+    memory_context=$(prune_context_section "memory" "$memory_context" 10000)
     # Inject cross-pipeline discoveries for design stage
     local design_discoveries=""
     if [[ -x "$SCRIPT_DIR/sw-discovery.sh" ]]; then
         design_discoveries=$("$SCRIPT_DIR/sw-discovery.sh" inject "*.md,*.ts,*.tsx,*.js" 2>/dev/null | head -20 || true)
     fi
+    design_discoveries=$(prune_context_section "discoveries" "$design_discoveries" 3000)
     # Inject architecture model patterns if available
     local arch_context=""
@@ -626,6 +773,7 @@ ${arch_patterns}
 ${arch_layers}}"
         fi
     fi
+    arch_context=$(prune_context_section "intelligence" "$arch_context" 5000)
     # Inject rejected design approaches and anti-patterns from memory
     local design_antipatterns=""
@@ -633,6 +781,7 @@ ${arch_layers}}"
         local rejected_designs
         rejected_designs=$(intelligence_search_memory "rejected design approaches anti-patterns for: ${GOAL:-}" "${HOME}/.shipwright/memory" 3 2>/dev/null) || true
         if [[ -n "$rejected_designs" ]]; then
+            rejected_designs=$(prune_context_section "antipatterns" "$rejected_designs" 5000)
             design_antipatterns="
 ## Rejected Approaches (from past reviews)
 These design approaches were rejected in past reviews. Avoid repeating them:
@@ -698,6 +847,9 @@ Produce this EXACT format:
 Be concrete and specific. Reference actual file paths in the codebase. Consider edge cases and failure modes."
+    # Guard total prompt size
+    design_prompt=$(guard_prompt_size "design" "$design_prompt")
     local design_model
     design_model=$(jq -r --arg id "design" '(.stages[] | select(.id == $id) | .config.model) // .defaults.model // "opus"' "$PIPELINE_CONFIG" 2>/dev/null) || true
     [[ -n "$MODEL" ]] && design_model="$MODEL"
@@ -708,10 +860,22 @@ Be concrete and specific. Reference actual file paths in the codebase. Consider
     fi
     local _token_log="${ARTIFACTS_DIR}/.claude-tokens-design.log"
-    claude --print --model "$design_model" --max-turns 25 \
+    claude --print --model "$design_model" --max-turns 25 --dangerously-skip-permissions \
         "$design_prompt" < /dev/null > "$design_file" 2>"$_token_log" || true
     parse_claude_tokens "$_token_log"
+    # Claude may write to disk via tools instead of stdout — rescue those files
+    local _design_rescue
+    for _design_rescue in "${PROJECT_ROOT}/design-adr.md" "${PROJECT_ROOT}/design.md" \
+                           "${PROJECT_ROOT}/ADR.md" "${PROJECT_ROOT}/DESIGN.md"; do
+        if [[ -s "$_design_rescue" ]] && [[ $(wc -l < "$design_file" 2>/dev/null | xargs) -lt 10 ]]; then
+            info "Design written to ${_design_rescue} via tools — adopting as design artifact"
+            cat "$_design_rescue" >> "$design_file"
+            rm -f "$_design_rescue"
+            break
+        fi
+    done
     if [[ ! -s "$design_file" ]]; then
         error "Design generation failed — empty output"
         return 1
@@ -739,7 +903,7 @@ Be concrete and specific. Reference actual file paths in the codebase. Consider
     files_to_modify=$(sed -n '/Files to modify/,/^-\|^#\|^$/p' "$design_file" 2>/dev/null | grep -E '^\s*-' | head -20 || true)
     if [[ -n "$files_to_create" || -n "$files_to_modify" ]]; then
-        info "Design scope: ${DIM}$(echo "$files_to_create $files_to_modify" | grep -c '^\s*-' || echo 0) file(s)${RESET}"
+        info "Design scope: ${DIM}$(echo "$files_to_create $files_to_modify" | grep -c '^\s*-' || true) file(s)${RESET}"
     fi
     # Post design to GitHub issue
@@ -1077,8 +1241,9 @@ ${prevention_text}"
         loop_args+=(--resume)
     fi
-    # Skip permissions in CI (no interactive terminal)
-    [[ "${CI_MODE:-false}" == "true" ]] && loop_args+=(--skip-permissions)
+    # Skip permissions — pipeline runs headlessly (claude -p) and has no terminal
+    # for interactive permission prompts. Without this flag, agents can't write files.
+    loop_args+=(--skip-permissions)
     info "Starting build loop: ${DIM}shipwright loop${RESET} (max ${max_iter} iterations, ${agents} agent(s))"
@@ -1131,13 +1296,13 @@ ${prevention_text}"
     # Count commits made during build
     local commit_count
-    commit_count=$(git log --oneline "${BASE_BRANCH}..HEAD" 2>/dev/null | wc -l | xargs)
+    commit_count=$(_safe_base_log --oneline | wc -l | xargs)
     info "Build produced ${BOLD}$commit_count${RESET} commit(s)"
     # Commit quality evaluation when intelligence is enabled
     if type intelligence_search_memory >/dev/null 2>&1 && command -v claude >/dev/null 2>&1 && [[ "${commit_count:-0}" -gt 0 ]]; then
         local commit_msgs
-        commit_msgs=$(git log --format="%s" "${BASE_BRANCH}..HEAD" 2>/dev/null | head -20)
+        commit_msgs=$(_safe_base_log --format="%s" | head -20)
         local quality_score
         quality_score=$(claude --print --output-format text -p "Rate the quality of these git commit messages on a scale of 0-100. Consider: focus (one thing per commit), clarity (describes the why), atomicity (small logical units). Reply with ONLY a number 0-100.
@@ -1201,7 +1366,8 @@ stage_test() {
         # Post failure to GitHub with more context
         if [[ -n "$ISSUE_NUMBER" ]]; then
             local log_lines
-            log_lines=$(wc -l < "$test_log" 2>/dev/null || echo "0")
+            log_lines=$(wc -l < "$test_log" 2>/dev/null || true)
+            log_lines="${log_lines:-0}"
             local log_excerpt
             if [[ "$log_lines" -lt 60 ]]; then
                 log_excerpt="$(cat "$test_log" 2>/dev/null || true)"
@@ -1276,8 +1442,7 @@ stage_review() {
     local diff_file="$ARTIFACTS_DIR/review-diff.patch"
     local review_file="$ARTIFACTS_DIR/review.md"
-    git diff "${BASE_BRANCH}...${GIT_BRANCH}" > "$diff_file" 2>/dev/null || \
-        git diff HEAD~5 > "$diff_file" 2>/dev/null || true
+    _safe_base_diff > "$diff_file" 2>/dev/null || true
     if [[ ! -s "$diff_file" ]]; then
         warn "No diff found — skipping review"
@@ -1290,13 +1455,13 @@ stage_review() {
     fi
     local diff_stats
-    diff_stats=$(git diff --stat "${BASE_BRANCH}...${GIT_BRANCH}" 2>/dev/null | tail -1 || echo "")
+    diff_stats=$(_safe_base_diff --stat | tail -1 || echo "")
     info "Running AI code review... ${DIM}($diff_stats)${RESET}"
     # Semantic risk scoring when intelligence is enabled
     if type intelligence_search_memory >/dev/null 2>&1 && command -v claude >/dev/null 2>&1; then
         local diff_files
-        diff_files=$(git diff --name-only "${BASE_BRANCH}...${GIT_BRANCH}" 2>/dev/null || true)
+        diff_files=$(_safe_base_diff --name-only || true)
         local risk_score="low"
         # Fast heuristic: flag high-risk file patterns
         if echo "$diff_files" | grep -qiE 'migration|schema|auth|crypto|security|password|token|secret|\.env'; then
@@ -1343,6 +1508,7 @@ If no issues are found, write: \"Review clean — no issues found.\"
     if type intelligence_search_memory >/dev/null 2>&1; then
         local review_memory
         review_memory=$(intelligence_search_memory "code review findings anti-patterns for: ${GOAL:-}" "${HOME}/.shipwright/memory" 5 2>/dev/null) || true
+        review_memory=$(prune_context_section "memory" "$review_memory" 10000)
         if [[ -n "$review_memory" ]]; then
             review_prompt+="
 ## Known Issues from Previous Reviews
@@ -1390,11 +1556,12 @@ $(cat "$dod_file")
 ## Diff to Review
 $(cat "$diff_file")"
-    # Build claude args — add --dangerously-skip-permissions in CI
-    local review_args=(--print --model "$review_model" --max-turns 25)
-    if [[ "${CI_MODE:-false}" == "true" ]]; then
-        review_args+=(--dangerously-skip-permissions)
-    fi
+    # Guard total prompt size
+    review_prompt=$(guard_prompt_size "review" "$review_prompt")
+    # Skip permissions — pipeline runs headlessly (claude -p) and has no terminal
+    # for interactive permission prompts. Same rationale as the build stage, which
+    # unconditionally passes --skip-permissions to the loop.
+    local review_args=(--print --model "$review_model" --max-turns 25 --dangerously-skip-permissions)
     claude "${review_args[@]}" "$review_prompt" < /dev/null > "$review_file" 2>"${ARTIFACTS_DIR}/.claude-tokens-review.log" || true
     parse_claude_tokens "${ARTIFACTS_DIR}/.claude-tokens-review.log"
@@ -1539,15 +1706,143 @@ ${review_summary}
     log_stage "review" "AI review complete ($total_issues issues: $critical_count critical, $bug_count bugs, $warning_count suggestions)"
 }
+# ─── Compound Quality (fallback) ────────────────────────────────────────────
+# Basic implementation: adversarial review, negative testing, e2e checks, DoD audit.
+# If pipeline-intelligence.sh was sourced first, its enhanced version takes priority.
+if ! type stage_compound_quality >/dev/null 2>&1; then
+stage_compound_quality() {
+    CURRENT_STAGE_ID="compound_quality"
+    # Read stage config from pipeline template
+    local cfg
+    cfg=$(jq -r '.stages[] | select(.id == "compound_quality") | .config // {}' "$PIPELINE_CONFIG" 2>/dev/null) || cfg="{}"
+    local do_adversarial do_negative do_e2e do_dod max_cycles blocking
+    do_adversarial=$(echo "$cfg" | jq -r '.adversarial // false')
+    do_negative=$(echo "$cfg" | jq -r '.negative // false')
+    do_e2e=$(echo "$cfg" | jq -r '.e2e // false')
+    do_dod=$(echo "$cfg" | jq -r '.dod_audit // false')
+    max_cycles=$(echo "$cfg" | jq -r '.max_cycles // 1')
+    blocking=$(echo "$cfg" | jq -r '.compound_quality_blocking // false')
+    local pass_count=0 fail_count=0 total=0
+    local compound_log="$ARTIFACTS_DIR/compound-quality.log"
+    : > "$compound_log"
+    # ── Adversarial review ──
+    if [[ "$do_adversarial" == "true" ]]; then
+        total=$((total + 1))
+        info "Running adversarial review..."
+        if [[ -x "$SCRIPT_DIR/sw-adversarial.sh" ]]; then
+            if bash "$SCRIPT_DIR/sw-adversarial.sh" --repo "${REPO_DIR:-.}" >> "$compound_log" 2>&1; then
+                pass_count=$((pass_count + 1))
+                success "Adversarial review passed"
+            else
+                fail_count=$((fail_count + 1))
+                warn "Adversarial review found issues"
+            fi
+        else
+            warn "sw-adversarial.sh not found, skipping"
+        fi
+    fi
+    # ── Negative / edge-case testing ──
+    if [[ "$do_negative" == "true" ]]; then
+        total=$((total + 1))
+        info "Running negative test pass..."
+        if [[ -n "${TEST_CMD:-}" ]]; then
+            if eval "$TEST_CMD" >> "$compound_log" 2>&1; then
+                pass_count=$((pass_count + 1))
+                success "Negative test pass passed"
+            else
+                fail_count=$((fail_count + 1))
+                warn "Negative test pass found failures"
+            fi
+        else
+            pass_count=$((pass_count + 1))
+            info "No test command configured, skipping negative tests"
+        fi
+    fi
+    # ── E2E checks ──
+    if [[ "$do_e2e" == "true" ]]; then
+        total=$((total + 1))
+        info "Running e2e checks..."
+        if [[ -x "$SCRIPT_DIR/sw-e2e-orchestrator.sh" ]]; then
+            if bash "$SCRIPT_DIR/sw-e2e-orchestrator.sh" run >> "$compound_log" 2>&1; then
+                pass_count=$((pass_count + 1))
+                success "E2E checks passed"
+            else
+                fail_count=$((fail_count + 1))
+                warn "E2E checks found issues"
+            fi
+        else
+            pass_count=$((pass_count + 1))
+            info "sw-e2e-orchestrator.sh not found, skipping e2e"
+        fi
+    fi
+    # ── Definition of Done audit ──
+    if [[ "$do_dod" == "true" ]]; then
+        total=$((total + 1))
+        info "Running definition-of-done audit..."
+        if [[ -x "$SCRIPT_DIR/sw-quality.sh" ]]; then
+            if bash "$SCRIPT_DIR/sw-quality.sh" validate >> "$compound_log" 2>&1; then
+                pass_count=$((pass_count + 1))
+                success "DoD audit passed"
+            else
+                fail_count=$((fail_count + 1))
+                warn "DoD audit found gaps"
+            fi
+        else
+            pass_count=$((pass_count + 1))
+            info "sw-quality.sh not found, skipping DoD audit"
+        fi
+    fi
+    # ── Summary ──
+    log_stage "compound_quality" "Compound quality: $pass_count/$total checks passed, $fail_count failed"
+    if [[ "$fail_count" -gt 0 && "$blocking" == "true" ]]; then
+        error "Compound quality gate failed: $fail_count of $total checks failed"
+        return 1
+    fi
+    return 0
+}
+fi  # end fallback stage_compound_quality
 stage_pr() {
     CURRENT_STAGE_ID="pr"
     local plan_file="$ARTIFACTS_DIR/plan.md"
     local test_log="$ARTIFACTS_DIR/test-results.log"
     local review_file="$ARTIFACTS_DIR/review.md"
+    # ── Skip PR in local/no-github mode ──
+    if [[ "${NO_GITHUB:-false}" == "true" || "${SHIPWRIGHT_LOCAL:-}" == "1" || "${LOCAL_MODE:-false}" == "true" ]]; then
+        info "Skipping PR stage — running in local/no-github mode"
+        # Save a PR draft locally for reference
+        local branch_name
+        branch_name=$(git rev-parse --abbrev-ref HEAD 2>/dev/null || echo "unknown")
+        local commit_count
+        commit_count=$(_safe_base_log --oneline | wc -l | xargs)
+        {
+            echo "# PR Draft (local mode)"
+            echo ""
+            echo "**Branch:** ${branch_name}"
+            echo "**Commits:** ${commit_count:-0}"
+            echo "**Goal:** ${GOAL:-N/A}"
+            echo ""
+            echo "## Changes"
+            _safe_base_diff --stat || true
+        } > ".claude/pr-draft.md" 2>/dev/null || true
+        emit_event "pr.skipped" "issue=${ISSUE_NUMBER:-0}" "reason=local_mode"
+        return 0
+    fi
     # ── PR Hygiene Checks (informational) ──
     local hygiene_commit_count
-    hygiene_commit_count=$(git log --oneline "${BASE_BRANCH}..HEAD" 2>/dev/null | wc -l | xargs)
+    hygiene_commit_count=$(_safe_base_log --oneline | wc -l | xargs)
     hygiene_commit_count="${hygiene_commit_count:-0}"
     if [[ "$hygiene_commit_count" -gt 20 ]]; then
@@ -1556,7 +1851,7 @@ stage_pr() {
     # Check for WIP/fixup/squash commits (expanded patterns)
     local wip_commits
-    wip_commits=$(git log --oneline "${BASE_BRANCH}..HEAD" 2>/dev/null | grep -ciE '^[0-9a-f]+ (WIP|fixup!|squash!|TODO|HACK|TEMP|BROKEN|wip[:-]|temp[:-]|broken[:-]|do not merge)' || true)
+    wip_commits=$(_safe_base_log --oneline | grep -ciE '^[0-9a-f]+ (WIP|fixup!|squash!|TODO|HACK|TEMP|BROKEN|wip[:-]|temp[:-]|broken[:-]|do not merge)' || true)
     wip_commits="${wip_commits:-0}"
     if [[ "$wip_commits" -gt 0 ]]; then
         warn "Branch has ${wip_commits} WIP/fixup/squash/temp commit(s) — consider cleaning up"
@@ -1564,7 +1859,7 @@ stage_pr() {
     # ── PR Quality Gate: reject PRs with no real code changes ──
     local real_files
-    real_files=$(git diff --name-only "${BASE_BRANCH}...HEAD" 2>/dev/null | grep -v '^\.claude/' | grep -v '^\.github/' || true)
+    real_files=$(_safe_base_diff --name-only | grep -v '^\.claude/' | grep -v '^\.github/' || true)
     if [[ -z "$real_files" ]]; then
         error "No real code changes detected — only pipeline artifacts (.claude/ logs)."
         error "The build agent did not produce meaningful changes. Skipping PR creation."
@@ -1614,7 +1909,7 @@ stage_pr() {
         if [[ "$sim_enabled" == "true" ]]; then
             info "Running developer simulation review..."
             local diff_for_sim
-            diff_for_sim=$(git diff "${BASE_BRANCH}...HEAD" 2>/dev/null || true)
+            diff_for_sim=$(_safe_base_diff || true)
             if [[ -n "$diff_for_sim" ]]; then
                 local sim_result
                 sim_result=$(simulation_review "$diff_for_sim" "${GOAL:-}" 2>/dev/null || echo "")
@@ -1644,7 +1939,7 @@ stage_pr() {
         if [[ "$arch_enabled" == "true" ]]; then
             info "Validating architecture..."
             local diff_for_arch
-            diff_for_arch=$(git diff "${BASE_BRANCH}...HEAD" 2>/dev/null || true)
+            diff_for_arch=$(_safe_base_diff || true)
             if [[ -n "$diff_for_arch" ]]; then
                 local arch_result
                 arch_result=$(architecture_validate_changes "$diff_for_arch" "" 2>/dev/null || echo "")
@@ -1668,10 +1963,11 @@ stage_pr() {
     # Pre-PR diff gate — verify meaningful code changes exist (not just bookkeeping)
     local real_changes
-    real_changes=$(git diff --name-only "origin/${BASE_BRANCH:-main}...HEAD" \
+    real_changes=$(_safe_base_diff --name-only \
         -- . ':!.claude/loop-state.md' ':!.claude/pipeline-state.md' \
         ':!.claude/pipeline-artifacts/*' ':!**/progress.md' \
-        ':!**/error-summary.json' 2>/dev/null | wc -l | xargs || echo "0")
+        ':!**/error-summary.json' | wc -l | xargs || true)
+    real_changes="${real_changes:-0}"
     if [[ "${real_changes:-0}" -eq 0 ]]; then
         error "No meaningful code changes detected — only bookkeeping files modified"
         error "Refusing to create PR with zero real changes"
@@ -1726,10 +2022,10 @@ stage_pr() {
     [[ -n "${GITHUB_ISSUE:-}" ]] && closes_line="Closes ${GITHUB_ISSUE}"
     local diff_stats
-    diff_stats=$(git diff --stat "${BASE_BRANCH}...${GIT_BRANCH}" 2>/dev/null | tail -1 || echo "")
+    diff_stats=$(_safe_base_diff --stat | tail -1 || echo "")
     local commit_count
-    commit_count=$(git log --oneline "${BASE_BRANCH}..HEAD" 2>/dev/null | wc -l | xargs)
+    commit_count=$(_safe_base_log --oneline | wc -l | xargs)
     local total_dur=""
     if [[ -n "$PIPELINE_START_EPOCH" ]]; then
@@ -1774,7 +2070,7 @@ EOF
     risk_tier="low"
     if [[ -f "$REPO_DIR/config/policy.json" ]]; then
         local changed_files
-        changed_files=$(git diff --name-only "${BASE_BRANCH}...HEAD" 2>/dev/null || true)
+        changed_files=$(_safe_base_diff --name-only || true)
         if [[ -n "$changed_files" ]]; then
             local policy_file="$REPO_DIR/config/policy.json"
             check_tier_match() {
@@ -1906,7 +2202,7 @@ EOF
             codeowners_json=$(gh_codeowners "$REPO_OWNER" "$REPO_NAME" 2>/dev/null || echo "[]")
             if [[ "$codeowners_json" != "[]" && -n "$codeowners_json" ]]; then
                 local changed_files
-                changed_files=$(git diff --name-only "${BASE_BRANCH}...HEAD" 2>/dev/null || true)
+                changed_files=$(_safe_base_diff --name-only || true)
                 if [[ -n "$changed_files" ]]; then
                     local co_reviewers
                     co_reviewers=$(echo "$codeowners_json" | jq -r '.[].owners[]' 2>/dev/null | sort -u | head -3 || true)
@@ -1980,13 +2276,14 @@ stage_merge() {
         local merge_diff_file="${ARTIFACTS_DIR}/review-diff.patch"
         local merge_review_file="${ARTIFACTS_DIR}/review.md"
         if [[ ! -s "$merge_diff_file" ]]; then
-            git diff "${BASE_BRANCH}...${GIT_BRANCH}" > "$merge_diff_file" 2>/dev/null || \
-                git diff HEAD~5 > "$merge_diff_file" 2>/dev/null || true
+            _safe_base_diff > "$merge_diff_file" 2>/dev/null || true
         fi
         if [[ -s "$merge_diff_file" ]]; then
             local _merge_critical _merge_sec _merge_blocking _merge_reject
-            _merge_critical=$(grep -ciE '\*\*\[?Critical\]?\*\*' "$merge_review_file" 2>/dev/null || echo "0")
-            _merge_sec=$(grep -ciE '\*\*\[?Security\]?\*\*' "$merge_review_file" 2>/dev/null || echo "0")
+            _merge_critical=$(grep -ciE '\*\*\[?Critical\]?\*\*' "$merge_review_file" 2>/dev/null || true)
+            _merge_critical="${_merge_critical:-0}"
+            _merge_sec=$(grep -ciE '\*\*\[?Security\]?\*\*' "$merge_review_file" 2>/dev/null || true)
+            _merge_sec="${_merge_sec:-0}"
             _merge_blocking=$((${_merge_critical:-0} + ${_merge_sec:-0}))
             [[ "$_merge_blocking" -gt 0 ]] && _merge_reject="Review found ${_merge_blocking} critical/security issue(s)"
             if ! bash "$SCRIPT_DIR/sw-oversight.sh" gate --diff "$merge_diff_file" --description "${GOAL:-Pipeline merge}" --reject-if "${_merge_reject:-}" >/dev/null 2>&1; then

package/scripts/lib/pipeline-state.sh CHANGED Viewed

@@ -176,6 +176,13 @@ mark_stage_complete() {
     write_state
     record_stage_effectiveness "$stage_id" "complete"
+    # Record stage completion in SQLite pipeline_stages table
+    if type record_stage >/dev/null 2>&1; then
+        local _stage_secs
+        _stage_secs=$(get_stage_timing_seconds "$stage_id")
+        record_stage "${SHIPWRIGHT_PIPELINE_ID:-}" "$stage_id" "complete" "${_stage_secs:-0}" "" 2>/dev/null || true
+    fi
     # Update memory baselines and predictive baselines for stage durations
     if [[ "$stage_id" == "test" || "$stage_id" == "build" ]]; then
         local secs
@@ -354,6 +361,13 @@ mark_stage_failed() {
     log_stage "$stage_id" "failed (${timing})"
     write_state
+    # Record stage failure in SQLite pipeline_stages table
+    if type record_stage >/dev/null 2>&1; then
+        local _stage_secs
+        _stage_secs=$(get_stage_timing_seconds "$stage_id")
+        record_stage "${SHIPWRIGHT_PIPELINE_ID:-}" "$stage_id" "failed" "${_stage_secs:-0}" "" 2>/dev/null || true
+    fi
     # Update GitHub progress + comment failure
     if [[ -n "$ISSUE_NUMBER" ]]; then
         local body

package/scripts/lib/policy.sh CHANGED Viewed

File without changes

package/scripts/lib/test-helpers.sh CHANGED Viewed

File without changes