npm - shipwright-cli - Versions diffs - 3.0.0 → 3.1.0 - Mend

shipwright-cli 3.0.0 → 3.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (135)

package/README.md +3 -3
package/completions/_shipwright +247 -93
package/completions/shipwright.bash +69 -15
package/completions/shipwright.fish +309 -41
package/config/decision-tiers.json +55 -0
package/config/event-schema.json +142 -5
package/config/policy.json +8 -0
package/package.json +3 -3
package/scripts/lib/architecture.sh +2 -1
package/scripts/lib/bootstrap.sh +0 -0
package/scripts/lib/config.sh +0 -0
package/scripts/lib/daemon-adaptive.sh +0 -0
package/scripts/lib/daemon-dispatch.sh +24 -1
package/scripts/lib/daemon-failure.sh +0 -0
package/scripts/lib/daemon-health.sh +0 -0
package/scripts/lib/daemon-patrol.sh +40 -5
package/scripts/lib/daemon-poll.sh +17 -0
package/scripts/lib/daemon-state.sh +10 -0
package/scripts/lib/daemon-triage.sh +1 -1
package/scripts/lib/decide-autonomy.sh +295 -0
package/scripts/lib/decide-scoring.sh +228 -0
package/scripts/lib/decide-signals.sh +462 -0
package/scripts/lib/fleet-failover.sh +0 -0
package/scripts/lib/helpers.sh +16 -17
package/scripts/lib/pipeline-detection.sh +0 -0
package/scripts/lib/pipeline-github.sh +0 -0
package/scripts/lib/pipeline-intelligence.sh +20 -3
package/scripts/lib/pipeline-quality-checks.sh +3 -2
package/scripts/lib/pipeline-quality.sh +0 -0
package/scripts/lib/pipeline-stages.sh +199 -32
package/scripts/lib/pipeline-state.sh +14 -0
package/scripts/lib/policy.sh +0 -0
package/scripts/lib/test-helpers.sh +0 -0
package/scripts/postinstall.mjs +75 -1
package/scripts/signals/example-collector.sh +36 -0
package/scripts/sw +8 -4
package/scripts/sw-activity.sh +1 -1
package/scripts/sw-adaptive.sh +1 -1
package/scripts/sw-adversarial.sh +1 -1
package/scripts/sw-architecture-enforcer.sh +1 -1
package/scripts/sw-auth.sh +1 -1
package/scripts/sw-autonomous.sh +1 -1
package/scripts/sw-changelog.sh +1 -1
package/scripts/sw-checkpoint.sh +1 -1
package/scripts/sw-ci.sh +1 -1
package/scripts/sw-cleanup.sh +1 -1
package/scripts/sw-code-review.sh +1 -1
package/scripts/sw-connect.sh +1 -1
package/scripts/sw-context.sh +1 -1
package/scripts/sw-cost.sh +12 -3
package/scripts/sw-daemon.sh +2 -2
package/scripts/sw-dashboard.sh +1 -1
package/scripts/sw-db.sh +41 -34
package/scripts/sw-decide.sh +685 -0
package/scripts/sw-decompose.sh +1 -1
package/scripts/sw-deps.sh +1 -1
package/scripts/sw-developer-simulation.sh +1 -1
package/scripts/sw-discovery.sh +27 -1
package/scripts/sw-doc-fleet.sh +1 -1
package/scripts/sw-docs-agent.sh +1 -1
package/scripts/sw-docs.sh +1 -1
package/scripts/sw-doctor.sh +1 -1
package/scripts/sw-dora.sh +1 -1
package/scripts/sw-durable.sh +1 -1
package/scripts/sw-e2e-orchestrator.sh +1 -1
package/scripts/sw-eventbus.sh +1 -1
package/scripts/sw-evidence.sh +1 -1
package/scripts/sw-feedback.sh +1 -1
package/scripts/sw-fix.sh +1 -1
package/scripts/sw-fleet-discover.sh +1 -1
package/scripts/sw-fleet-viz.sh +1 -1
package/scripts/sw-fleet.sh +1 -1
package/scripts/sw-github-app.sh +1 -1
package/scripts/sw-github-checks.sh +1 -1
package/scripts/sw-github-deploy.sh +1 -1
package/scripts/sw-github-graphql.sh +1 -1
package/scripts/sw-guild.sh +1 -1
package/scripts/sw-heartbeat.sh +1 -1
package/scripts/sw-hygiene.sh +1 -1
package/scripts/sw-incident.sh +1 -1
package/scripts/sw-init.sh +1 -1
package/scripts/sw-instrument.sh +1 -1
package/scripts/sw-intelligence.sh +9 -5
package/scripts/sw-jira.sh +1 -1
package/scripts/sw-launchd.sh +1 -1
package/scripts/sw-linear.sh +1 -1
package/scripts/sw-logs.sh +1 -1
package/scripts/sw-loop.sh +267 -17
package/scripts/sw-memory.sh +22 -5
package/scripts/sw-mission-control.sh +1 -1
package/scripts/sw-model-router.sh +1 -1
package/scripts/sw-otel.sh +5 -3
package/scripts/sw-oversight.sh +1 -1
package/scripts/sw-pipeline-composer.sh +1 -1
package/scripts/sw-pipeline-vitals.sh +1 -1
package/scripts/sw-pipeline.sh +73 -1
package/scripts/sw-pm.sh +1 -1
package/scripts/sw-pr-lifecycle.sh +7 -4
package/scripts/sw-predictive.sh +1 -1
package/scripts/sw-prep.sh +1 -1
package/scripts/sw-ps.sh +1 -1
package/scripts/sw-public-dashboard.sh +1 -1
package/scripts/sw-quality.sh +9 -5
package/scripts/sw-reaper.sh +1 -1
package/scripts/sw-regression.sh +1 -1
package/scripts/sw-release-manager.sh +1 -1
package/scripts/sw-release.sh +1 -1
package/scripts/sw-remote.sh +1 -1
package/scripts/sw-replay.sh +1 -1
package/scripts/sw-retro.sh +1 -1
package/scripts/sw-review-rerun.sh +1 -1
package/scripts/sw-scale.sh +66 -10
package/scripts/sw-security-audit.sh +1 -1
package/scripts/sw-self-optimize.sh +1 -1
package/scripts/sw-session.sh +3 -3
package/scripts/sw-setup.sh +1 -1
package/scripts/sw-standup.sh +1 -1
package/scripts/sw-status.sh +1 -1
package/scripts/sw-strategic.sh +1 -1
package/scripts/sw-stream.sh +1 -1
package/scripts/sw-swarm.sh +1 -1
package/scripts/sw-team-stages.sh +1 -1
package/scripts/sw-templates.sh +1 -1
package/scripts/sw-testgen.sh +1 -1
package/scripts/sw-tmux-pipeline.sh +1 -1
package/scripts/sw-tmux.sh +1 -1
package/scripts/sw-trace.sh +1 -1
package/scripts/sw-tracker.sh +1 -1
package/scripts/sw-triage.sh +6 -6
package/scripts/sw-upgrade.sh +1 -1
package/scripts/sw-ux.sh +1 -1
package/scripts/sw-webhook.sh +1 -1
package/scripts/sw-widgets.sh +1 -1
package/scripts/sw-worktree.sh +1 -1
package/scripts/update-homebrew-sha.sh +21 -15

package/scripts/sw-loop.sh CHANGED Viewed

@@ -24,6 +24,12 @@ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 # shellcheck source=lib/helpers.sh
 [[ -f "$SCRIPT_DIR/lib/helpers.sh" ]] && source "$SCRIPT_DIR/lib/helpers.sh"
 [[ -f "$SCRIPT_DIR/lib/config.sh" ]] && source "$SCRIPT_DIR/lib/config.sh"
+# Source DB for dual-write (emit_event → JSONL + SQLite).
+# Note: do NOT call init_schema here — the pipeline (sw-pipeline.sh) owns schema
+# initialization. Calling it here would create an empty DB that shadows JSON cost data.
+if [[ -f "$SCRIPT_DIR/sw-db.sh" ]]; then
+    source "$SCRIPT_DIR/sw-db.sh" 2>/dev/null || true
+fi
 # Fallbacks when helpers not loaded (e.g. test env with overridden SCRIPT_DIR)
 [[ "$(type -t info 2>/dev/null)" == "function" ]]    || info()    { echo -e "\033[38;2;0;212;255m\033[1m▸\033[0m $*"; }
 [[ "$(type -t success 2>/dev/null)" == "function" ]] || success() { echo -e "\033[38;2;74;222;128m\033[1m✓\033[0m $*"; }
@@ -63,7 +69,7 @@ MAX_RESTARTS=$(_config_get_int "loop.max_restarts" 0 2>/dev/null || echo 0)
 SESSION_RESTART=false
 RESTART_COUNT=0
 REPO_OVERRIDE=""
-VERSION="3.0.0"
+VERSION="3.1.0"
 # ─── Token Tracking ─────────────────────────────────────────────────────────
 LOOP_INPUT_TOKENS=0
@@ -655,6 +661,9 @@ initialize_state() {
     STATUS="running"
     LOG_ENTRIES=""
+    # Record starting commit for cumulative diff in quality gates
+    LOOP_START_COMMIT="$(git -C "$PROJECT_ROOT" rev-parse HEAD 2>/dev/null || echo "")"
     write_state
 }
@@ -726,6 +735,11 @@ resume_state() {
     START_EPOCH="$(now_epoch)"
     STATUS="running"
+    # Set starting commit for cumulative diff (approximate: use earliest tracked commit)
+    if [[ -z "${LOOP_START_COMMIT:-}" ]]; then
+        LOOP_START_COMMIT="$(git -C "$PROJECT_ROOT" rev-list --max-parents=0 HEAD 2>/dev/null | tail -1 || echo "")"
+    fi
     # If we hit max iterations before, warn user to extend
     if [[ "$ITERATION" -ge "$MAX_ITERATIONS" ]] && ! $MAX_ITERATIONS_EXPLICIT; then
         warn "Previous run stopped at iteration $ITERATION/$MAX_ITERATIONS."
@@ -872,7 +886,8 @@ validate_claude_output() {
     # Check for obviously corrupt output (API errors dumped as code)
     local total_changed
-    total_changed=$(echo "$changed_files" | grep -c '.' 2>/dev/null || echo "0")
+    total_changed=$(echo "$changed_files" | grep -c '.' 2>/dev/null || true)
+    total_changed="${total_changed:-0}"
     if [[ "$total_changed" -eq 0 ]]; then
         warn "Claude iteration produced no file changes"
         issues=$((issues + 1))
@@ -966,7 +981,8 @@ check_fatal_error() {
     # Non-zero exit + tiny output = likely CLI crash
     if [[ "$cli_exit_code" -ne 0 ]]; then
         local line_count
-        line_count=$(grep -cv '^$' "$log_file" 2>/dev/null || echo 0)
+        line_count=$(grep -cv '^$' "$log_file" 2>/dev/null || true)
+        line_count="${line_count:-0}"
         if [[ "$line_count" -lt 3 ]]; then
             local content
             content=$(head -3 "$log_file" 2>/dev/null | cut -c1-120)
@@ -1140,7 +1156,8 @@ diagnose_failure() {
     local diagnosis_file="${LOG_DIR:-/tmp}/diagnoses.txt"
     local repeat_count=0
     if [[ -f "$diagnosis_file" ]]; then
-        repeat_count=$(grep -c "^${diagnosis}$" "$diagnosis_file" 2>/dev/null || echo "0")
+        repeat_count=$(grep -c "^${diagnosis}$" "$diagnosis_file" 2>/dev/null || true)
+        repeat_count="${repeat_count:-0}"
     fi
     echo "$diagnosis" >> "$diagnosis_file"
@@ -1317,33 +1334,60 @@ run_audit_agent() {
     local log_file="$LOG_DIR/iteration-${ITERATION}.log"
     local audit_log="$LOG_DIR/audit-iter-${ITERATION}.log"
-    # Gather context: tail of implementer output + git diff
+    # Gather context: tail of implementer output + cumulative diff
     local impl_tail
     impl_tail="$(tail -100 "$log_file" 2>/dev/null || echo "(no output)")"
-    local diff_stat
-    diff_stat="$(git -C "$PROJECT_ROOT" diff --stat HEAD~1 2>/dev/null || echo "(no changes)")"
+    # Use cumulative diff from loop start so auditor sees ALL work, not just latest commit
+    local diff_stat cumulative_note=""
+    if [[ -n "${LOOP_START_COMMIT:-}" ]]; then
+        diff_stat="$(git -C "$PROJECT_ROOT" diff --stat "${LOOP_START_COMMIT}..HEAD" 2>/dev/null || echo "(no changes)")"
+        cumulative_note="Note: This diff shows ALL changes since the loop started (iteration 1 through ${ITERATION}), not just the latest commit."
+    else
+        diff_stat="$(git -C "$PROJECT_ROOT" diff --stat HEAD~1 2>/dev/null || echo "(no changes)")"
+    fi
+    # Include verified test status so auditor doesn't have to guess
+    local test_context=""
+    if [[ -n "$TEST_CMD" ]]; then
+        if [[ "${TEST_PASSED:-}" == "true" ]]; then
+            test_context="## Verified Test Status (from harness, not from agent)
+Tests: ALL PASSING (command: ${TEST_CMD})"
+        else
+            test_context="## Verified Test Status (from harness)
+Tests: FAILING (command: ${TEST_CMD})
+$(echo "${TEST_OUTPUT:-}" | tail -10)"
+        fi
+    fi
     local audit_prompt
     read -r -d '' audit_prompt <<AUDIT_PROMPT || true
-You are an independent code auditor reviewing an autonomous coding agent.
+You are an independent code auditor reviewing an autonomous coding agent's CUMULATIVE work.
+This is iteration ${ITERATION}. The agent may have done most of the work in earlier iterations.
 ## Goal the agent was working toward
 ${GOAL}
-## Agent Output (last 100 lines)
+## Agent Output This Iteration (last 100 lines)
 ${impl_tail}
-## Changes Made (git diff --stat)
+## Cumulative Changes Made (git diff --stat)
+${cumulative_note}
 ${diff_stat}
+${test_context}
 ## Your Task
-Critically review the work:
-1. Did the agent make meaningful progress toward the goal?
-2. Are there obvious bugs, logic errors, or security issues?
+Critically review the CUMULATIVE work (not just the latest iteration):
+1. Has the agent made meaningful progress toward the goal across all iterations?
+2. Are there obvious bugs, logic errors, or security issues in the current codebase?
 3. Did the agent leave incomplete work (TODOs, placeholder code)?
 4. Are there any regressions or broken patterns?
 5. Is the code quality acceptable?
+IMPORTANT: If the current iteration made small or no code changes, that may be acceptable
+if earlier iterations already completed the substantive work. Judge the whole body of work.
 If the work is acceptable and moves toward the goal, output exactly: AUDIT_PASS
 Otherwise, list the specific issues that need fixing.
 AUDIT_PROMPT
@@ -1429,21 +1473,52 @@ check_definition_of_done() {
     local dod_content
     dod_content="$(cat "$DOD_FILE")"
+    # Use cumulative diff from loop start (not just HEAD~1) so the evaluator
+    # can see ALL work done across every iteration, not just the latest commit.
     local diff_content
-    diff_content="$(git -C "$PROJECT_ROOT" diff HEAD~1 2>/dev/null || echo "(no diff)")"
+    if [[ -n "${LOOP_START_COMMIT:-}" ]]; then
+        diff_content="$(git -C "$PROJECT_ROOT" diff --stat "${LOOP_START_COMMIT}..HEAD" 2>/dev/null || echo "(no diff)")"
+        diff_content="${diff_content}
+## Detailed Changes (cumulative diff, truncated to 200 lines)
+$(git -C "$PROJECT_ROOT" diff "${LOOP_START_COMMIT}..HEAD" 2>/dev/null | head -200 || echo "(no diff)")"
+    else
+        diff_content="$(git -C "$PROJECT_ROOT" diff HEAD~1 2>/dev/null || echo "(no diff)")"
+    fi
+    # Inject verified runtime facts so the evaluator doesn't have to guess
+    local runtime_facts=""
+    if [[ -n "$TEST_CMD" ]]; then
+        if [[ "${TEST_PASSED:-}" == "true" ]]; then
+            runtime_facts="## Verified Runtime Facts (from the loop harness, not from the agent)
+- Tests: ALL PASSING (verified by running '${TEST_CMD}' after this iteration)
+- Test output (last 10 lines):
+$(echo "${TEST_OUTPUT:-}" | tail -10)"
+        else
+            runtime_facts="## Verified Runtime Facts
+- Tests: FAILING (verified by running '${TEST_CMD}')
+- Test output (last 10 lines):
+$(echo "${TEST_OUTPUT:-}" | tail -10)"
+        fi
+    fi
     local dod_prompt
     read -r -d '' dod_prompt <<DOD_PROMPT || true
-You are evaluating whether code changes satisfy a Definition of Done checklist.
+You are evaluating whether a project satisfies a Definition of Done checklist.
+You are reviewing the CUMULATIVE work across all iterations, not just the latest commit.
 ## Definition of Done
 ${dod_content}
-## Changes Made (git diff)
+${runtime_facts}
+## Cumulative Changes Made (git diff from start of loop to now)
 ${diff_content}
 ## Your Task
-For each item in the Definition of Done, determine if the changes satisfy it.
+For each item in the Definition of Done, determine if the project satisfies it.
+The runtime facts above are verified by the harness — trust them as ground truth.
 If ALL items are satisfied, output exactly: DOD_PASS
 Otherwise, list which items are NOT satisfied and why.
 DOD_PROMPT
@@ -1497,6 +1572,14 @@ guard_completion() {
         rejection_reasons+=("tests failing")
     fi
+    # Holistic final gate: when all other gates pass, run a project-level assessment
+    # that evaluates the entire codebase against the goal (not just the latest diff)
+    if [[ ${#rejection_reasons[@]} -eq 0 ]]; then
+        if ! run_holistic_gate; then
+            rejection_reasons+=("holistic project assessment found gaps")
+        fi
+    fi
     if [[ ${#rejection_reasons[@]} -gt 0 ]]; then
         local reasons_str
         reasons_str="$(printf ', %s' "${rejection_reasons[@]}")"
@@ -1510,6 +1593,70 @@ guard_completion() {
     return 0
 }
+# Holistic gate: evaluates the full project against the original goal.
+# Only runs when all other gates pass (final checkpoint before acceptance).
+run_holistic_gate() {
+    # Skip if no starting commit (can't compute cumulative diff)
+    [[ -z "${LOOP_START_COMMIT:-}" ]] && return 0
+    local holistic_log="$LOG_DIR/holistic-iter-${ITERATION}.log"
+    # Build a project summary: file tree, test count, cumulative diff stats
+    local file_count
+    file_count=$(git -C "$PROJECT_ROOT" ls-files | wc -l | tr -d ' ')
+    local cumulative_stat
+    cumulative_stat="$(git -C "$PROJECT_ROOT" diff --stat "${LOOP_START_COMMIT}..HEAD" 2>/dev/null | tail -1 || echo "(no changes)")"
+    local test_summary=""
+    if [[ -n "${TEST_OUTPUT:-}" ]]; then
+        test_summary="$(echo "$TEST_OUTPUT" | tail -5)"
+    fi
+    local holistic_prompt
+    read -r -d '' holistic_prompt <<HOLISTIC_PROMPT || true
+You are a final quality gate evaluating whether an autonomous coding agent has FULLY achieved its goal.
+## Original Goal
+${GOAL}
+## Project Stats
+- Files in repo: ${file_count}
+- Iterations completed: ${ITERATION}
+- Cumulative changes: ${cumulative_stat}
+- Tests: ${TEST_PASSED:-unknown} (command: ${TEST_CMD:-none})
+${test_summary:+- Test output: ${test_summary}}
+## Cumulative Git Changes (diff --stat from start)
+$(git -C "$PROJECT_ROOT" diff --stat "${LOOP_START_COMMIT}..HEAD" 2>/dev/null | head -40 || echo "(none)")
+## Your Task
+Based on the goal and the cumulative work done:
+1. Has the goal been FULLY achieved (not partially)?
+2. Is there any critical gap that would make this unacceptable for production?
+If the goal is fully achieved, output exactly: HOLISTIC_PASS
+Otherwise, list the specific gaps remaining.
+HOLISTIC_PROMPT
+    echo -e "  ${PURPLE}▸${RESET} Running holistic project assessment..."
+    local hol_model
+    hol_model="$(select_audit_model)"
+    local hol_flags=("--model" "$hol_model")
+    if $SKIP_PERMISSIONS; then
+        hol_flags+=("--dangerously-skip-permissions")
+    fi
+    claude -p "$holistic_prompt" "${hol_flags[@]}" > "$holistic_log" 2>&1 || true
+    if grep -q "HOLISTIC_PASS" "$holistic_log" 2>/dev/null; then
+        echo -e "  ${GREEN}✓${RESET} Holistic assessment: passed"
+        return 0
+    else
+        echo -e "  ${YELLOW}⚠${RESET} Holistic assessment: gaps found"
+        return 1
+    fi
+}
 # ─── Context Window Management ───────────────────────────────────────────────
 # Prevents prompt from exceeding Claude's context limit (~200K tokens).
 # Trims least-critical sections first when over budget.
@@ -1810,12 +1957,25 @@ ${_test_tail}
         RESUMED_TEST_OUTPUT=""
     fi
+    # Build cumulative progress summary showing all iterations' work
+    local cumulative_section=""
+    if [[ -n "${LOOP_START_COMMIT:-}" ]] && [[ "$ITERATION" -gt 1 ]]; then
+        local cum_stat
+        cum_stat="$(git -C "$PROJECT_ROOT" diff --stat "${LOOP_START_COMMIT}..HEAD" 2>/dev/null | tail -1 || true)"
+        if [[ -n "$cum_stat" ]]; then
+            cumulative_section="## Cumulative Progress (all iterations combined)
+${cum_stat}
+"
+        fi
+    fi
     cat <<PROMPT
 You are an autonomous coding agent on iteration ${ITERATION}/${MAX_ITERATIONS} of a continuous loop.
 ${resume_section}
 ## Your Goal
 ${GOAL}
+${cumulative_section}
 ## Current Progress
 ${recent_log}
@@ -1861,6 +2021,58 @@ ${stuckness_section}
 PROMPT
 }
+# ─── Alternative Strategy Exploration ─────────────────────────────────────────
+# When stuckness is detected, generate a context-aware alternative strategy.
+# Uses pattern matching on error type + iteration count to suggest different approaches.
+explore_alternative_strategy() {
+    local last_error="${1:-unknown}"
+    local iteration="${2:-0}"
+    local diagnosis="${3:-}"
+    # Track attempted strategies to avoid repeating them
+    local strategy_file="${LOG_DIR:-/tmp}/strategy-attempts.txt"
+    local attempted
+    attempted=$(cat "$strategy_file" 2>/dev/null || true)
+    local strategy=""
+    # If quality gates are passing but evaluators disagree, suggest focusing on evaluator alignment
+    if [[ "${TEST_PASSED:-}" == "true" ]] && [[ "${QUALITY_GATE_PASSED:-}" == "true" || "${AUDIT_RESULT:-}" == "pass" ]]; then
+        if ! echo "$attempted" | grep -q "evaluator_alignment"; then
+            echo "evaluator_alignment" >> "$strategy_file"
+            strategy="## Alternative Strategy: Evaluator Alignment
+The code appears functionally complete (tests pass). Focus on satisfying the remaining
+quality gate evaluators. Check the DoD log and audit log for specific complaints, then
+address those exact points rather than adding new features."
+        fi
+    fi
+    # If no code changes in last iteration, suggest verifying existing work
+    if echo "$last_error" | grep -qi "no code changes" || [[ "$diagnosis" == *"no code"* ]]; then
+        if ! echo "$attempted" | grep -q "verify_existing"; then
+            echo "verify_existing" >> "$strategy_file"
+            strategy="## Alternative Strategy: Verify Existing Work
+Recent iterations made no code changes. The work may already be complete.
+Run the full test suite, verify all features work, and if everything passes,
+commit a verification message and declare LOOP_COMPLETE with evidence."
+        fi
+    fi
+    # Generic fallback: break the problem down
+    if [[ -z "$strategy" ]]; then
+        if ! echo "$attempted" | grep -q "decompose"; then
+            echo "decompose" >> "$strategy_file"
+            strategy="## Alternative Strategy: Decompose
+Break the remaining work into smaller, independent steps. Focus on one specific
+file or function at a time. Read error messages literally — the root cause may
+differ from your assumption."
+        fi
+    fi
+    echo "$strategy"
+}
 # ─── Stuckness Detection ─────────────────────────────────────────────────────
 # Multi-signal detection: text overlap, git diff hash, error repetition, exit code pattern, iteration budget.
 # Returns 0 when stuck, 1 when not. Outputs stuckness section and sets STUCKNESS_HINT when stuck.
@@ -1994,6 +2206,17 @@ detect_stuckness() {
         stuckness_reasons+=("used ${progress_pct}% of iteration budget without passing tests")
     fi
+    # Gate-aware dampening: if tests pass and the agent has made progress overall,
+    # reduce stuckness signal count. The "no code changes" and "identical diffs" signals
+    # fire when code is already complete and the agent is fighting evaluator quirks —
+    # that's not genuine stuckness, it's "done but gates disagree."
+    if [[ "${TEST_PASSED:-}" == "true" ]] && [[ "$stuckness_signals" -ge 2 ]]; then
+        # If at least one quality signal is positive, dampen by 1
+        if [[ "${AUDIT_RESULT:-}" == "pass" ]] || $QUALITY_GATE_PASSED 2>/dev/null; then
+            stuckness_signals=$((stuckness_signals - 1))
+        fi
+    fi
     # Decision: 2+ signals = stuck
     if [[ "$stuckness_signals" -ge 2 ]]; then
         STUCKNESS_COUNT=$(( STUCKNESS_COUNT + 1 ))
@@ -2719,6 +2942,11 @@ run_single_agent_loop() {
         initialize_state
     fi
+    # Ensure LOOP_START_COMMIT is set (may not be on resume/restart)
+    if [[ -z "${LOOP_START_COMMIT:-}" ]]; then
+        LOOP_START_COMMIT="$(git -C "$PROJECT_ROOT" rev-parse HEAD 2>/dev/null || echo "")"
+    fi
     # Apply adaptive budget/model before showing banner
     apply_adaptive_budget
     MODEL="$(select_adaptive_model "build" "$MODEL")"
@@ -2746,6 +2974,16 @@ run_single_agent_loop() {
         }
         ITERATION=$(( ITERATION + 1 ))
+        # Emit iteration start event for pipeline visibility
+        if type emit_event >/dev/null 2>&1; then
+            emit_event "loop.iteration_start" \
+                "iteration=$ITERATION" \
+                "max=$MAX_ITERATIONS" \
+                "job_id=${PIPELINE_JOB_ID:-loop-$$}" \
+                "agent=${AGENT_NUM:-1}" \
+                "test_passed=${TEST_PASSED:-unknown}"
+        fi
         # Root-cause diagnosis and memory-based fix on retry after test failure
         if [[ "${TEST_PASSED:-}" == "false" ]]; then
             # Source memory module for diagnosis and fix lookup
@@ -2915,6 +3153,18 @@ $summary
         write_state
         write_progress
+        # Emit iteration complete event for pipeline visibility
+        if type emit_event >/dev/null 2>&1; then
+            emit_event "loop.iteration_complete" \
+                "iteration=$ITERATION" \
+                "max=$MAX_ITERATIONS" \
+                "job_id=${PIPELINE_JOB_ID:-loop-$$}" \
+                "agent=${AGENT_NUM:-1}" \
+                "test_passed=${TEST_PASSED:-unknown}" \
+                "commits=$TOTAL_COMMITS" \
+                "status=${STATUS:-running}"
+        fi
         # Update heartbeat
         "$SCRIPT_DIR/sw-heartbeat.sh" write "${PIPELINE_JOB_ID:-loop-$$}" \
             --pid $$ \

package/scripts/sw-memory.sh CHANGED Viewed

@@ -6,7 +6,7 @@
 set -euo pipefail
 trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
-VERSION="3.0.0"
+VERSION="3.1.0"
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 REPO_DIR="${REPO_DIR:-$(cd "$SCRIPT_DIR/.." && pwd)}"
@@ -88,7 +88,13 @@ memory_ranked_search() {
         memory_dir="$(repo_memory_dir)"
     fi
     memory_dir="${memory_dir:-$HOME/.shipwright/memory}"
-    [[ ! -d "$memory_dir" ]] && echo "[]" && return 0
+    if [[ ! -d "$memory_dir" ]]; then
+        info "Memory dir not found at ${memory_dir} — auto-creating"
+        mkdir -p "$memory_dir"
+        emit_event "memory.not_available" "path=$memory_dir" "action=auto_created"
+        echo "[]"
+        return 0
+    fi
     # Extract and expand query keywords
     local keywords
@@ -372,7 +378,10 @@ memory_capture_failure() {
         pattern=$(echo "$error_output" | head -1 | cut -c1-200)
     fi
-    [[ -z "$pattern" ]] && return 0
+    if [[ -z "$pattern" ]]; then
+        warn "Memory capture: empty error pattern — skipping"
+        return 0
+    fi
     # Check for duplicate — increment seen_count if pattern already exists
     local existing_idx
@@ -987,6 +996,7 @@ memory_inject_context() {
     done
     if [[ "$has_memory" == "false" ]]; then
+        info "No memory available for repo (${mem_dir}) — first pipeline run will seed it"
         echo "# No memory available for this repository yet."
         return 0
     fi
@@ -1642,6 +1652,11 @@ memory_export() {
     local mem_dir
     mem_dir="$(repo_memory_dir)"
+    # Ensure all memory files exist (jq --slurpfile fails on missing files)
+    for f in patterns.json failures.json decisions.json metrics.json; do
+        [[ -f "$mem_dir/$f" ]] || echo '{}' > "$mem_dir/$f"
+    done
     # Merge all memory files into a single JSON export
     local export_json
     export_json=$(jq -n \
@@ -1757,8 +1772,10 @@ memory_stats() {
     # Event-based hit rate
     local inject_count capture_count
     if [[ -f "$EVENTS_FILE" ]]; then
-        inject_count=$(grep -c '"memory.inject"' "$EVENTS_FILE" 2>/dev/null || echo 0)
-        capture_count=$(grep -c '"memory.capture"' "$EVENTS_FILE" 2>/dev/null || echo 0)
+        inject_count=$(grep -c '"memory.inject"' "$EVENTS_FILE" 2>/dev/null || true)
+        inject_count="${inject_count:-0}"
+        capture_count=$(grep -c '"memory.capture"' "$EVENTS_FILE" 2>/dev/null || true)
+        capture_count="${capture_count:-0}"
         echo ""
         echo -e "  ${BOLD}Usage${RESET}"
         printf "    %-18s %s\n" "Context injections:" "$inject_count"

package/scripts/sw-mission-control.sh CHANGED Viewed

@@ -7,7 +7,7 @@
 set -euo pipefail
 trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
-VERSION="3.0.0"
+VERSION="3.1.0"
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 REPO_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"

package/scripts/sw-model-router.sh CHANGED Viewed

@@ -7,7 +7,7 @@
 set -euo pipefail
 trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
-VERSION="3.0.0"
+VERSION="3.1.0"
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 REPO_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"

package/scripts/sw-otel.sh CHANGED Viewed

@@ -6,7 +6,7 @@
 set -euo pipefail
 trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
-VERSION="3.0.0"
+VERSION="3.1.0"
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 REPO_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"
@@ -463,8 +463,10 @@ cmd_report() {
     if [[ -f "$EVENTS_FILE" ]]; then
         event_count=$(wc -l < "$EVENTS_FILE" || echo "0")
-        export_count=$(grep -c '"type":"otel_export"' "$EVENTS_FILE" 2>/dev/null || echo "0")
-        webhook_count=$(grep -c '"type":"webhook_sent"' "$EVENTS_FILE" 2>/dev/null || echo "0")
+        export_count=$(grep -c '"type":"otel_export"' "$EVENTS_FILE" 2>/dev/null || true)
+        export_count="${export_count:-0}"
+        webhook_count=$(grep -c '"type":"webhook_sent"' "$EVENTS_FILE" 2>/dev/null || true)
+        webhook_count="${webhook_count:-0}"
         last_event_ts=$(tail -n1 "$EVENTS_FILE" | jq -r '.ts // "unknown"' 2>/dev/null || echo "unknown")
     fi

package/scripts/sw-oversight.sh CHANGED Viewed

@@ -7,7 +7,7 @@
 set -euo pipefail
 trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
-VERSION="3.0.0"
+VERSION="3.1.0"
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 REPO_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"

package/scripts/sw-pipeline-composer.sh CHANGED Viewed

@@ -6,7 +6,7 @@
 set -euo pipefail
 trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
-VERSION="3.0.0"
+VERSION="3.1.0"
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 REPO_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"

package/scripts/sw-pipeline-vitals.sh CHANGED Viewed

@@ -6,7 +6,7 @@
 set -euo pipefail
 trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
-VERSION="3.0.0"
+VERSION="3.1.0"
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 REPO_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"