npm - shipwright-cli - Versions diffs - 3.2.0 → 3.3.0 - Mend

shipwright-cli 3.2.0 → 3.3.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (279) hide show

package/.claude/agents/code-reviewer.md +2 -0
package/.claude/agents/devops-engineer.md +2 -0
package/.claude/agents/doc-fleet-agent.md +2 -0
package/.claude/agents/pipeline-agent.md +2 -0
package/.claude/agents/shell-script-specialist.md +2 -0
package/.claude/agents/test-specialist.md +2 -0
package/.claude/hooks/agent-crash-capture.sh +32 -0
package/.claude/hooks/post-tool-use.sh +3 -2
package/.claude/hooks/pre-tool-use.sh +35 -3
package/README.md +4 -4
package/claude-code/hooks/config-change.sh +18 -0
package/claude-code/hooks/instructions-reloaded.sh +7 -0
package/claude-code/hooks/worktree-create.sh +25 -0
package/claude-code/hooks/worktree-remove.sh +20 -0
package/config/code-constitution.json +130 -0
package/dashboard/middleware/auth.ts +134 -0
package/dashboard/middleware/constants.ts +21 -0
package/dashboard/public/index.html +2 -6
package/dashboard/public/styles.css +100 -97
package/dashboard/routes/auth.ts +38 -0
package/dashboard/server.ts +66 -25
package/dashboard/services/config.ts +26 -0
package/dashboard/services/db.ts +118 -0
package/dashboard/src/canvas/pixel-agent.ts +298 -0
package/dashboard/src/canvas/pixel-sprites.ts +440 -0
package/dashboard/src/canvas/shipyard-effects.ts +367 -0
package/dashboard/src/canvas/shipyard-scene.ts +616 -0
package/dashboard/src/canvas/submarine-layout.ts +267 -0
package/dashboard/src/components/header.ts +8 -7
package/dashboard/src/core/router.ts +1 -0
package/dashboard/src/design/submarine-theme.ts +253 -0
package/dashboard/src/main.ts +2 -0
package/dashboard/src/types/api.ts +2 -1
package/dashboard/src/views/activity.ts +2 -1
package/dashboard/src/views/shipyard.ts +39 -0
package/dashboard/types/index.ts +166 -0
package/docs/plans/2026-02-28-compound-audit-and-shipyard-design.md +186 -0
package/docs/plans/2026-02-28-skipper-shipwright-implementation-plan.md +1182 -0
package/docs/plans/2026-02-28-skipper-shipwright-integration-design.md +531 -0
package/docs/plans/2026-03-01-ai-powered-skill-injection-design.md +298 -0
package/docs/plans/2026-03-01-ai-powered-skill-injection-plan.md +1109 -0
package/docs/plans/2026-03-01-capabilities-cleanup-plan.md +658 -0
package/docs/plans/2026-03-01-clean-architecture-plan.md +924 -0
package/docs/plans/2026-03-01-compound-audit-cascade-design.md +191 -0
package/docs/plans/2026-03-01-compound-audit-cascade-plan.md +921 -0
package/docs/plans/2026-03-01-deep-integration-plan.md +851 -0
package/docs/plans/2026-03-01-pipeline-audit-trail-design.md +145 -0
package/docs/plans/2026-03-01-pipeline-audit-trail-plan.md +770 -0
package/docs/plans/2026-03-01-refined-depths-brand-design.md +382 -0
package/docs/plans/2026-03-01-refined-depths-implementation.md +599 -0
package/docs/plans/2026-03-01-skipper-kernel-integration-design.md +203 -0
package/docs/plans/2026-03-01-unified-platform-design.md +272 -0
package/docs/plans/2026-03-07-claude-code-feature-integration-design.md +189 -0
package/docs/plans/2026-03-07-claude-code-feature-integration-plan.md +1165 -0
package/docs/research/BACKLOG_QUICK_REFERENCE.md +352 -0
package/docs/research/CUTTING_EDGE_RESEARCH_2026.md +546 -0
package/docs/research/RESEARCH_INDEX.md +439 -0
package/docs/research/RESEARCH_SOURCES.md +440 -0
package/docs/research/RESEARCH_SUMMARY.txt +275 -0
package/docs/superpowers/specs/2026-03-10-pipeline-quality-revolution-design.md +341 -0
package/package.json +2 -2
package/scripts/lib/adaptive-model.sh +427 -0
package/scripts/lib/adaptive-timeout.sh +316 -0
package/scripts/lib/audit-trail.sh +309 -0
package/scripts/lib/auto-recovery.sh +471 -0
package/scripts/lib/bandit-selector.sh +431 -0
package/scripts/lib/bootstrap.sh +104 -2
package/scripts/lib/causal-graph.sh +455 -0
package/scripts/lib/compat.sh +126 -0
package/scripts/lib/compound-audit.sh +337 -0
package/scripts/lib/constitutional.sh +454 -0
package/scripts/lib/context-budget.sh +359 -0
package/scripts/lib/convergence.sh +594 -0
package/scripts/lib/cost-optimizer.sh +634 -0
package/scripts/lib/daemon-adaptive.sh +10 -0
package/scripts/lib/daemon-dispatch.sh +106 -17
package/scripts/lib/daemon-failure.sh +34 -4
package/scripts/lib/daemon-patrol.sh +23 -2
package/scripts/lib/daemon-poll-github.sh +361 -0
package/scripts/lib/daemon-poll-health.sh +299 -0
package/scripts/lib/daemon-poll.sh +27 -611
package/scripts/lib/daemon-state.sh +112 -66
package/scripts/lib/daemon-triage.sh +10 -0
package/scripts/lib/dod-scorecard.sh +442 -0
package/scripts/lib/error-actionability.sh +300 -0
package/scripts/lib/formal-spec.sh +461 -0
package/scripts/lib/helpers.sh +177 -4
package/scripts/lib/intent-analysis.sh +409 -0
package/scripts/lib/loop-convergence.sh +350 -0
package/scripts/lib/loop-iteration.sh +682 -0
package/scripts/lib/loop-progress.sh +48 -0
package/scripts/lib/loop-restart.sh +185 -0
package/scripts/lib/memory-effectiveness.sh +506 -0
package/scripts/lib/mutation-executor.sh +352 -0
package/scripts/lib/outcome-feedback.sh +521 -0
package/scripts/lib/pipeline-cli.sh +336 -0
package/scripts/lib/pipeline-commands.sh +1216 -0
package/scripts/lib/pipeline-detection.sh +100 -2
package/scripts/lib/pipeline-execution.sh +897 -0
package/scripts/lib/pipeline-github.sh +28 -3
package/scripts/lib/pipeline-intelligence-compound.sh +431 -0
package/scripts/lib/pipeline-intelligence-scoring.sh +407 -0
package/scripts/lib/pipeline-intelligence-skip.sh +181 -0
package/scripts/lib/pipeline-intelligence.sh +100 -1136
package/scripts/lib/pipeline-quality-bash-compat.sh +182 -0
package/scripts/lib/pipeline-quality-checks.sh +17 -715
package/scripts/lib/pipeline-quality-gates.sh +563 -0
package/scripts/lib/pipeline-stages-build.sh +730 -0
package/scripts/lib/pipeline-stages-delivery.sh +965 -0
package/scripts/lib/pipeline-stages-intake.sh +1133 -0
package/scripts/lib/pipeline-stages-monitor.sh +407 -0
package/scripts/lib/pipeline-stages-review.sh +1022 -0
package/scripts/lib/pipeline-stages.sh +59 -2929
package/scripts/lib/pipeline-state.sh +36 -5
package/scripts/lib/pipeline-util.sh +487 -0
package/scripts/lib/policy-learner.sh +438 -0
package/scripts/lib/process-reward.sh +493 -0
package/scripts/lib/project-detect.sh +649 -0
package/scripts/lib/quality-profile.sh +334 -0
package/scripts/lib/recruit-commands.sh +885 -0
package/scripts/lib/recruit-learning.sh +739 -0
package/scripts/lib/recruit-roles.sh +648 -0
package/scripts/lib/reward-aggregator.sh +458 -0
package/scripts/lib/rl-optimizer.sh +362 -0
package/scripts/lib/root-cause.sh +427 -0
package/scripts/lib/scope-enforcement.sh +445 -0
package/scripts/lib/session-restart.sh +493 -0
package/scripts/lib/skill-memory.sh +300 -0
package/scripts/lib/skill-registry.sh +775 -0
package/scripts/lib/spec-driven.sh +476 -0
package/scripts/lib/test-helpers.sh +18 -7
package/scripts/lib/test-holdout.sh +429 -0
package/scripts/lib/test-optimizer.sh +511 -0
package/scripts/shipwright-file-suggest.sh +45 -0
package/scripts/skills/adversarial-quality.md +61 -0
package/scripts/skills/api-design.md +44 -0
package/scripts/skills/architecture-design.md +50 -0
package/scripts/skills/brainstorming.md +43 -0
package/scripts/skills/data-pipeline.md +44 -0
package/scripts/skills/deploy-safety.md +64 -0
package/scripts/skills/documentation.md +38 -0
package/scripts/skills/frontend-design.md +45 -0
package/scripts/skills/generated/.gitkeep +0 -0
package/scripts/skills/generated/_refinements/.gitkeep +0 -0
package/scripts/skills/generated/_refinements/adversarial-quality.patch.md +3 -0
package/scripts/skills/generated/_refinements/architecture-design.patch.md +3 -0
package/scripts/skills/generated/_refinements/brainstorming.patch.md +3 -0
package/scripts/skills/generated/cli-version-management.md +29 -0
package/scripts/skills/generated/collection-system-validation.md +99 -0
package/scripts/skills/generated/large-scale-c-refactoring-coordination.md +97 -0
package/scripts/skills/generated/pattern-matching-similarity-scoring.md +195 -0
package/scripts/skills/generated/test-parallelization-detection.md +65 -0
package/scripts/skills/observability.md +79 -0
package/scripts/skills/performance.md +48 -0
package/scripts/skills/pr-quality.md +49 -0
package/scripts/skills/product-thinking.md +43 -0
package/scripts/skills/security-audit.md +49 -0
package/scripts/skills/systematic-debugging.md +40 -0
package/scripts/skills/testing-strategy.md +47 -0
package/scripts/skills/two-stage-review.md +52 -0
package/scripts/skills/validation-thoroughness.md +55 -0
package/scripts/sw +9 -3
package/scripts/sw-activity.sh +9 -2
package/scripts/sw-adaptive.sh +2 -1
package/scripts/sw-adversarial.sh +2 -1
package/scripts/sw-architecture-enforcer.sh +3 -1
package/scripts/sw-auth.sh +12 -2
package/scripts/sw-autonomous.sh +5 -1
package/scripts/sw-changelog.sh +4 -1
package/scripts/sw-checkpoint.sh +2 -1
package/scripts/sw-ci.sh +5 -1
package/scripts/sw-cleanup.sh +4 -26
package/scripts/sw-code-review.sh +10 -4
package/scripts/sw-connect.sh +2 -1
package/scripts/sw-context.sh +2 -1
package/scripts/sw-cost.sh +48 -3
package/scripts/sw-daemon.sh +66 -9
package/scripts/sw-dashboard.sh +3 -1
package/scripts/sw-db.sh +59 -16
package/scripts/sw-decide.sh +8 -2
package/scripts/sw-decompose.sh +360 -17
package/scripts/sw-deps.sh +4 -1
package/scripts/sw-developer-simulation.sh +4 -1
package/scripts/sw-discovery.sh +325 -2
package/scripts/sw-doc-fleet.sh +4 -1
package/scripts/sw-docs-agent.sh +3 -1
package/scripts/sw-docs.sh +2 -1
package/scripts/sw-doctor.sh +453 -2
package/scripts/sw-dora.sh +4 -1
package/scripts/sw-durable.sh +4 -3
package/scripts/sw-e2e-orchestrator.sh +17 -16
package/scripts/sw-eventbus.sh +7 -1
package/scripts/sw-evidence.sh +364 -12
package/scripts/sw-feedback.sh +550 -9
package/scripts/sw-fix.sh +20 -1
package/scripts/sw-fleet-discover.sh +6 -2
package/scripts/sw-fleet-viz.sh +4 -1
package/scripts/sw-fleet.sh +5 -1
package/scripts/sw-github-app.sh +16 -3
package/scripts/sw-github-checks.sh +3 -2
package/scripts/sw-github-deploy.sh +3 -2
package/scripts/sw-github-graphql.sh +18 -7
package/scripts/sw-guild.sh +5 -1
package/scripts/sw-heartbeat.sh +5 -30
package/scripts/sw-hello.sh +67 -0
package/scripts/sw-hygiene.sh +6 -1
package/scripts/sw-incident.sh +265 -1
package/scripts/sw-init.sh +18 -2
package/scripts/sw-instrument.sh +10 -2
package/scripts/sw-intelligence.sh +42 -6
package/scripts/sw-jira.sh +5 -1
package/scripts/sw-launchd.sh +2 -1
package/scripts/sw-linear.sh +4 -1
package/scripts/sw-logs.sh +4 -1
package/scripts/sw-loop.sh +432 -1128
package/scripts/sw-memory.sh +356 -2
package/scripts/sw-mission-control.sh +6 -1
package/scripts/sw-model-router.sh +481 -26
package/scripts/sw-otel.sh +13 -4
package/scripts/sw-oversight.sh +14 -5
package/scripts/sw-patrol-meta.sh +334 -0
package/scripts/sw-pipeline-composer.sh +5 -1
package/scripts/sw-pipeline-vitals.sh +2 -1
package/scripts/sw-pipeline.sh +53 -2664
package/scripts/sw-pm.sh +12 -5
package/scripts/sw-pr-lifecycle.sh +2 -1
package/scripts/sw-predictive.sh +7 -1
package/scripts/sw-prep.sh +185 -2
package/scripts/sw-ps.sh +5 -25
package/scripts/sw-public-dashboard.sh +15 -3
package/scripts/sw-quality.sh +2 -1
package/scripts/sw-reaper.sh +8 -25
package/scripts/sw-recruit.sh +156 -2303
package/scripts/sw-regression.sh +19 -12
package/scripts/sw-release-manager.sh +3 -1
package/scripts/sw-release.sh +4 -1
package/scripts/sw-remote.sh +3 -1
package/scripts/sw-replay.sh +7 -1
package/scripts/sw-retro.sh +158 -1
package/scripts/sw-review-rerun.sh +3 -1
package/scripts/sw-scale.sh +10 -3
package/scripts/sw-security-audit.sh +6 -1
package/scripts/sw-self-optimize.sh +6 -3
package/scripts/sw-session.sh +9 -3
package/scripts/sw-setup.sh +3 -1
package/scripts/sw-stall-detector.sh +406 -0
package/scripts/sw-standup.sh +15 -7
package/scripts/sw-status.sh +3 -1
package/scripts/sw-strategic.sh +4 -1
package/scripts/sw-stream.sh +7 -1
package/scripts/sw-swarm.sh +18 -6
package/scripts/sw-team-stages.sh +13 -6
package/scripts/sw-templates.sh +5 -29
package/scripts/sw-testgen.sh +7 -1
package/scripts/sw-tmux-pipeline.sh +4 -1
package/scripts/sw-tmux-role-color.sh +2 -0
package/scripts/sw-tmux-status.sh +1 -1
package/scripts/sw-tmux.sh +3 -1
package/scripts/sw-trace.sh +3 -1
package/scripts/sw-tracker-github.sh +3 -0
package/scripts/sw-tracker-jira.sh +3 -0
package/scripts/sw-tracker-linear.sh +3 -0
package/scripts/sw-tracker.sh +3 -1
package/scripts/sw-triage.sh +2 -1
package/scripts/sw-upgrade.sh +3 -1
package/scripts/sw-ux.sh +5 -2
package/scripts/sw-webhook.sh +3 -1
package/scripts/sw-widgets.sh +3 -1
package/scripts/sw-worktree.sh +15 -3
package/scripts/test-skill-injection.sh +1233 -0
package/templates/pipelines/autonomous.json +27 -3
package/templates/pipelines/cost-aware.json +34 -8
package/templates/pipelines/deployed.json +12 -0
package/templates/pipelines/enterprise.json +12 -0
package/templates/pipelines/fast.json +6 -0
package/templates/pipelines/full.json +27 -3
package/templates/pipelines/hotfix.json +6 -0
package/templates/pipelines/standard.json +12 -0
package/templates/pipelines/tdd.json +12 -0

package/scripts/lib/policy-learner.sh ADDED Viewed

@@ -0,0 +1,438 @@
+#!/usr/bin/env bash
+# Module guard - prevent double-sourcing
+[[ -n "${_POLICY_LEARNER_LOADED:-}" ]] && return 0
+_POLICY_LEARNER_LOADED=1
+# ╔═══════════════════════════════════════════════════════════════════════════╗
+# ║  shipwright policy-learner — Strategy Selection & Prompt Optimization   ║
+# ║  Learn optimal strategies from historical RL episodes and rewards.      ║
+# ║  Bucket by (language, issue_type, complexity), find best strategy per   ║
+# ║  bucket, optimize prompt section weights, inject into agent prompts.    ║
+# ╚═══════════════════════════════════════════════════════════════════════════╝
+# shellcheck disable=SC2034
+VERSION="3.3.0"
+# ─── Output Helpers ──────────────────────────────────────────────────────────
+# Fallback loggers, defined only when the sourcing script has not already
+# provided a function of the same name. info/success/warn print to stdout;
+# error prints to stderr.
+[[ "$(type -t info 2>/dev/null)" == "function" ]]    || info()    { echo -e "\033[38;2;0;212;255m\033[1m▸\033[0m $*"; }
+[[ "$(type -t success 2>/dev/null)" == "function" ]] || success() { echo -e "\033[38;2;74;222;128m\033[1m✓\033[0m $*"; }
+[[ "$(type -t warn 2>/dev/null)" == "function" ]]    || warn()    { echo -e "\033[38;2;250;204;21m\033[1m⚠\033[0m $*"; }
+[[ "$(type -t error 2>/dev/null)" == "function" ]]   || error()   { echo -e "\033[38;2;248;113;113m\033[1m✗\033[0m $*" >&2; }
+# Timestamp helpers. Each is guarded on its own so that a host providing only
+# one of them still ends up with both defined.
+[[ "$(type -t now_iso 2>/dev/null)" == "function" ]]   || now_iso()   { date -u +"%Y-%m-%dT%H:%M:%SZ"; }
+[[ "$(type -t now_epoch 2>/dev/null)" == "function" ]] || now_epoch() { date +%s; }
+# No-op event sink used when no emit_event function is available.
+[[ "$(type -t emit_event 2>/dev/null)" == "function" ]] || emit_event() { true; }
+# ─── Configuration ───────────────────────────────────────────────────────────
+# Each setting keeps a non-empty value inherited from the environment and
+# otherwise falls back to the default shown here.
+: "${POLICY_EPISODES_FILE:=${HOME}/.shipwright/rl-episodes.jsonl}"   # episode log (JSONL)
+: "${POLICY_REWARDS_FILE:=${HOME}/.shipwright/rewards.jsonl}"        # rewards log (JSONL)
+: "${POLICY_LEARNED_FILE:=${HOME}/.shipwright/learned-policy.json}"  # learned policy output
+: "${POLICY_MIN_EPISODES:=3}"                                        # episodes needed for a "confident" bucket
+# ─── Helpers ─────────────────────────────────────────────────────────────────
+# Create the directory that holds POLICY_LEARNED_FILE if it is missing.
+# Returns: 0 when the directory already exists, otherwise mkdir's status.
+_policy_ensure_dir() {
+    local policy_dir
+    policy_dir="$(dirname "$POLICY_LEARNED_FILE")"
+    if [[ ! -d "$policy_dir" ]]; then
+        mkdir -p "$policy_dir"
+    fi
+}
+# Build context key from language, issue_type, complexity
+# Output: "ts:bug:medium" or partial like "*:bug:*"
+_policy_context_key() {
+    local lang="${1:-*}"
+    local itype="${2:-*}"
+    local cplx="${3:-*}"
+    [[ -z "$lang" ]] && lang="*"
+    [[ -z "$itype" ]] && itype="*"
+    [[ -z "$cplx" ]] && cplx="*"
+    echo "${lang}:${itype}:${cplx}"
+}
+# ─── Core Functions ──────────────────────────────────────────────────────────
+# Learn from all historical episodes. Analyze by context bucket, find best
+# strategy per bucket, compute averages, and store in learned-policy.json.
+policy_learn_from_history() {
+    _policy_ensure_dir
+    if [[ ! -f "$POLICY_EPISODES_FILE" ]]; then
+        warn "No episodes file found at $POLICY_EPISODES_FILE"
+        return 0
+    fi
+    local episode_count
+    episode_count=$(wc -l < "$POLICY_EPISODES_FILE" | tr -d ' ')
+    if [[ "$episode_count" -eq 0 ]]; then
+        warn "No episodes recorded yet"
+        return 0
+    fi
+    local now_ts
+    now_ts="$(now_iso)"
+    # Use jq to process all episodes: bucket by context key, find best strategy
+    # per bucket, compute avg reward/iterations/cost
+    local policy_json
+    policy_json=$(jq -c -s --arg now "$now_ts" --argjson min_ep "$POLICY_MIN_EPISODES" '
+        def ctx_key:
+            ((.context.language // "*") + ":" +
+             (.context.issue_type // "*") + ":" +
+             (.context.complexity // "*"));
+        def strategy_key:
+            (.actions // [] | [.[] | if type == "object" then (.strategy // tostring) else tostring end] | sort | join(","));
+        group_by(ctx_key) |
+        [.[] | . as $bucket |
+            ($bucket[0] | ctx_key) as $key |
+            ($bucket | group_by(strategy_key)) |
+            [.[] |
+                {
+                    strategy: (.[0] | strategy_key),
+                    episodes: length,
+                    successes: ([.[] | select(.outcome.success == true)] | length),
+                    avg_reward: (
+                        [.[] | if .outcome.success == true then 1.0 else 0.0 end] |
+                        if length > 0 then (add / length)
+                        else 0 end
+                    ),
+                    avg_iterations: ([.[] | .outcome.iterations // 0] | add / length),
+                    avg_cost: ([.[] | .outcome.cost_usd // 0] | add / length)
+                } |
+                .success_rate = (if .episodes > 0 then (.successes / .episodes) else 0 end)
+            ] |
+            sort_by(-.success_rate, .avg_iterations) |
+            {
+                key: $key,
+                best: (if length > 0 then .[0].strategy else "default" end),
+                reward: (if length > 0 then .[0].success_rate else 0 end),
+                episodes: ([.[] | .episodes] | add // 0),
+                avg_iterations: (if length > 0 then .[0].avg_iterations else 0 end),
+                avg_cost: (if length > 0 then .[0].avg_cost else 0 end),
+                all_strategies: .
+            }
+        ] |
+        {
+            updated_at: $now,
+            total_episodes: ([.[].episodes] | add // 0),
+            min_episodes: $min_ep,
+            strategies: (
+                [.[] | {(.key): {
+                    best: .best,
+                    reward: (.reward * 100 | floor / 100),
+                    episodes: .episodes,
+                    avg_iterations: (.avg_iterations * 10 | floor / 10),
+                    avg_cost: (.avg_cost * 100 | floor / 100),
+                    confident: (.episodes >= $min_ep)
+                }}] | add // {}
+            ),
+            model_preferences: {},
+            prompt_weights: {}
+        }
+    ' "$POLICY_EPISODES_FILE" 2>/dev/null)
+    if [[ -z "$policy_json" ]] || [[ "$policy_json" == "null" ]]; then
+        warn "Failed to analyze episodes"
+        return 1
+    fi
+    # Note: partial matching handled at query time in policy_suggest_strategy
+    # Merge model preferences from episodes (which models correlate with success)
+    local model_prefs
+    model_prefs=$(jq -c -s '
+        [.[] | select(.context.model != null)] |
+        if length == 0 then {}
+        else
+            group_by(.context.complexity // "medium") |
+            [.[] |
+                (.[0].context.complexity // "medium") as $cplx |
+                group_by(.context.model) |
+                [.[] | {
+                    model: .[0].context.model,
+                    success_rate: (([.[] | select(.outcome.success == true)] | length) / length)
+                }] |
+                sort_by(-.success_rate) |
+                if length > 0 then {("build:" + $cplx): .[0].model} else {} end
+            ] | add // {}
+        end
+    ' "$POLICY_EPISODES_FILE" 2>/dev/null || echo "{}")
+    # Merge model preferences into policy
+    if [[ -n "$model_prefs" ]] && [[ "$model_prefs" != "{}" ]]; then
+        policy_json=$(echo "$policy_json" | jq -c --argjson mp "$model_prefs" '.model_preferences = $mp')
+    fi
+    # Compute prompt weights via policy_optimize_prompt_weights (inline)
+    local prompt_weights
+    prompt_weights=$(_policy_compute_prompt_weights)
+    if [[ -n "$prompt_weights" ]] && [[ "$prompt_weights" != "{}" ]]; then
+        policy_json=$(echo "$policy_json" | jq -c --argjson pw "$prompt_weights" '.prompt_weights = $pw')
+    fi
+    # Atomic write
+    local tmp
+    tmp="$(mktemp 2>/dev/null || echo "${TMPDIR:-/tmp}/policy-learn-$$.tmp")"
+    echo "$policy_json" | jq '.' > "$tmp" 2>/dev/null
+    if [[ -s "$tmp" ]]; then
+        mv "$tmp" "$POLICY_LEARNED_FILE"
+        local total
+        total=$(echo "$policy_json" | jq '.total_episodes // 0')
+        local strat_count
+        strat_count=$(echo "$policy_json" | jq '.strategies | keys | length')
+        success "Learned policy from $total episodes across $strat_count context buckets"
+        emit_event "policy.learned" "episodes=$total" "buckets=$strat_count"
+    else
+        rm -f "$tmp"
+        error "Failed to write learned policy"
+        return 1
+    fi
+}
+# Suggest best strategy for a given context.
+# Args: $1=language, $2=issue_type, $3=complexity
+# Output: JSON with strategy, expected_reward, confidence, evidence_count
+policy_suggest_strategy() {
+    local language="${1:-}"
+    local issue_type="${2:-}"
+    local complexity="${3:-}"
+    if [[ ! -f "$POLICY_LEARNED_FILE" ]]; then
+        echo '{"strategy":"default","expected_reward":0,"confidence":"none","evidence_count":0}'
+        return 0
+    fi
+    local exact_key partial1 partial2 partial3
+    exact_key="$(_policy_context_key "$language" "$issue_type" "$complexity")"
+    # Partial match keys for fallback
+    # ts:bug:medium → ts:bug:* → *:bug:medium → *:*:medium → default
+    partial1="$(_policy_context_key "$language" "$issue_type" "*")"
+    partial2="$(_policy_context_key "*" "$issue_type" "$complexity")"
+    partial3="$(_policy_context_key "*" "*" "$complexity")"
+    # Partial matching: try exact, then scan keys for partial matches
+    # ts:bug:medium → any key matching ts:bug:* → any matching *:bug:medium → *:*:medium
+    local result
+    result=$(jq -c \
+        --arg exact "$exact_key" \
+        --arg lang "$language" \
+        --arg itype "$issue_type" \
+        --arg cplx "$complexity" \
+        --argjson min_ep "$POLICY_MIN_EPISODES" '
+        .strategies as $s |
+        # Try exact match first
+        (if $s[$exact] then {match: $s[$exact], tier: "exact"}
+        else
+            # Scan all keys for partial matches
+            ($s | to_entries | [
+                # Match lang:type:*
+                (.[] | select((.key | split(":")[0]) == $lang and (.key | split(":")[1]) == $itype) | {match: .value, tier: "partial_type"}),
+                # Match *:type:complexity
+                (.[] | select((.key | split(":")[1]) == $itype and (.key | split(":")[2]) == $cplx) | {match: .value, tier: "partial_lang"}),
+                # Match *:*:complexity
+                (.[] | select((.key | split(":")[2]) == $cplx) | {match: .value, tier: "partial_cplx"})
+            ] | first // null)
+        end) |
+        if . == null then
+            {strategy: "default", expected_reward: 0, confidence: "none", evidence_count: 0}
+        else
+            {
+                strategy: .match.best,
+                expected_reward: .match.reward,
+                confidence: (
+                    if .match.episodes >= ($min_ep * 3) then "high"
+                    elif .match.episodes >= $min_ep then "medium"
+                    else "low" end
+                ),
+                evidence_count: .match.episodes,
+                match_tier: .tier,
+                avg_iterations: .match.avg_iterations
+            }
+        end
+    ' "$POLICY_LEARNED_FILE" 2>/dev/null)
+    if [[ -z "$result" ]] || [[ "$result" == "null" ]]; then
+        echo '{"strategy":"default","expected_reward":0,"confidence":"none","evidence_count":0}'
+    else
+        echo "$result"
+    fi
+}
+# Compute how strongly each prompt section correlates with successful
+# outcomes. Internal helper — called by policy_learn_from_history.
+# An episode counts as "with" a section when the matching boolean field in
+# its .context (has_memory, has_architecture, has_coverage, has_rl_context,
+# has_error_history) is exactly true, and as "without" otherwise.
+# Weight = 0.5 + (success rate with − success rate without) / 2, clamped to
+# [0, 1] and truncated to two decimals; 0.5 (neutral) when either group has
+# fewer than two episodes.
+# Output: JSON object of section weights on stdout, or "{}" when the episodes
+#         file is missing or jq fails.
+_policy_compute_prompt_weights() {
+    if [[ ! -f "$POLICY_EPISODES_FILE" ]]; then
+        echo "{}"
+        return 0
+    fi
+    jq -c -s '
+        # Fraction of successful episodes in the input array (non-empty).
+        def success_rate:
+            ([.[] | select(.outcome.success == true)] | length) / length;
+        def section_weight(field):
+            [.[] | select(.context[field] == true)] as $with |
+            [.[] | select(.context[field] != true)] as $without |
+            if ($with | length) < 2 then 0.5
+            elif ($without | length) < 2 then 0.5
+            else
+                (($with | success_rate) - ($without | success_rate)) |
+                (0.5 + . / 2) |
+                if . < 0 then 0 elif . > 1 then 1 else (. * 100 | floor / 100) end
+            end;
+        {
+            inject_memory: section_weight("has_memory"),
+            inject_architecture: section_weight("has_architecture"),
+            inject_coverage_baseline: section_weight("has_coverage"),
+            inject_rl_context: section_weight("has_rl_context"),
+            inject_error_history: section_weight("has_error_history")
+        }
+    ' "$POLICY_EPISODES_FILE" 2>/dev/null || echo "{}"
+}
+# Public wrapper — return the learned prompt weights, learning a policy first
+# when no policy file exists yet.
+# Output: the prompt_weights JSON object on stdout, or "{}" when no policy is
+#         available or it cannot be read.
+policy_optimize_prompt_weights() {
+    if [[ ! -f "$POLICY_LEARNED_FILE" ]]; then
+        # The learner reports progress through warn/success, whose fallbacks
+        # print to stdout; divert that to stderr so callers capturing this
+        # function's output receive JSON only. A failed learn is not fatal:
+        # it simply falls through to "{}" below.
+        policy_learn_from_history >&2 || true
+    fi
+    if [[ -f "$POLICY_LEARNED_FILE" ]]; then
+        jq -c '.prompt_weights // {}' "$POLICY_LEARNED_FILE" 2>/dev/null || echo "{}"
+    else
+        echo "{}"
+    fi
+}
+# Format the learned policy suggestion as a section for an agent prompt.
+# Args: $1=language, $2=issue_type, $3=complexity
+# Output: markdown on stdout — a heading, the suggested strategy with its
+#         success rate and average iterations, the confidence level, and
+#         optional "Include:" / "Exclude (low impact):" lines naming prompt
+#         sections whose learned weight is >= 0.7 or < 0.3. Prints nothing
+#         when the suggestion's confidence is "none".
+policy_inject_into_prompt() {
+    local language="${1:-}"
+    local issue_type="${2:-}"
+    local complexity="${3:-}"
+    local suggestion
+    suggestion="$(policy_suggest_strategy "$language" "$issue_type" "$complexity")"
+    local confidence
+    confidence=$(echo "$suggestion" | jq -r '.confidence // "none"')
+    if [[ "$confidence" == "none" ]]; then
+        return 0
+    fi
+    local strategy evidence reward avg_iters
+    strategy=$(echo "$suggestion" | jq -r '.strategy // "default"')
+    evidence=$(echo "$suggestion" | jq -r '.evidence_count // 0')
+    reward=$(echo "$suggestion" | jq -r '.expected_reward // 0')
+    avg_iters=$(echo "$suggestion" | jq -r '.avg_iterations // 0')
+    # Show the comma-joined action list as "a → b → c". This needs a string
+    # substitution: tr maps single characters one-for-one and would turn each
+    # comma into a lone space.
+    local display_strategy="${strategy//,/ → }"
+    # Round to the nearest percent; truncating with %d would print 56 for a
+    # stored reward of 0.57, because 0.57 * 100 is slightly below 57 in
+    # floating point.
+    local pct
+    pct=$(awk -v r="$reward" 'BEGIN { printf "%.0f", r * 100 }')
+    cat <<EOF
+## Policy-Learned Strategy
+Based on ${evidence} similar issues: **${display_strategy}** (${pct}% success rate, avg ${avg_iters} iterations)
+Confidence: ${confidence}
+EOF
+    # Add prompt weight guidance if available
+    if [[ -f "$POLICY_LEARNED_FILE" ]]; then
+        local weights
+        weights=$(jq -r '
+            .prompt_weights // {} |
+            to_entries |
+            [.[] | select(.value >= 0.7)] |
+            if length > 0 then
+                "Include: " + ([.[].key | gsub("inject_"; "")] | join(", "))
+            else empty end
+        ' "$POLICY_LEARNED_FILE" 2>/dev/null || true)
+        local exclude
+        exclude=$(jq -r '
+            .prompt_weights // {} |
+            to_entries |
+            [.[] | select(.value < 0.3)] |
+            if length > 0 then
+                "Exclude (low impact): " + ([.[].key | gsub("inject_"; "")] | join(", "))
+            else empty end
+        ' "$POLICY_LEARNED_FILE" 2>/dev/null || true)
+        if [[ -n "$weights" ]]; then
+            echo "$weights"
+        fi
+        if [[ -n "$exclude" ]]; then
+            echo "$exclude"
+        fi
+    fi
+}
+# Display a human-readable report of what the policy has learned.
+policy_report() {
+    if [[ ! -f "$POLICY_LEARNED_FILE" ]]; then
+        echo "No learned policy found. Run policy_learn_from_history first."
+        return 0
+    fi
+    local updated total
+    updated=$(jq -r '.updated_at // "unknown"' "$POLICY_LEARNED_FILE")
+    total=$(jq -r '.total_episodes // 0' "$POLICY_LEARNED_FILE")
+    echo "╔═══════════════════════════════════════════════════════════════╗"
+    echo "║  Learned Policy Report                                       ║"
+    echo "╚═══════════════════════════════════════════════════════════════╝"
+    echo ""
+    echo "Updated: ${updated}"
+    echo "Total episodes: ${total}"
+    echo ""
+    # Strategy buckets
+    echo "── Strategy Recommendations ──────────────────────────────────"
+    jq -r '
+        .strategies // {} | to_entries[] |
+        "  \(.key): \(.value.best) " +
+        "(\(.value.reward * 100 | floor)% success, " +
+        "\(.value.avg_iterations) avg iters, " +
+        "~$\(.value.avg_cost), " +
+        "\(.value.episodes) episodes" +
+        (if .value.confident then ", confident" else ", low data" end) +
+        ")"
+    ' "$POLICY_LEARNED_FILE" 2>/dev/null || echo "  (none)"
+    echo ""
+    # Model preferences
+    echo "── Model Preferences ─────────────────────────────────────────"
+    local mp_count
+    mp_count=$(jq '.model_preferences // {} | keys | length' "$POLICY_LEARNED_FILE" 2>/dev/null || echo "0")
+    if [[ "$mp_count" -gt 0 ]]; then
+        jq -r '.model_preferences // {} | to_entries[] | "  \(.key): \(.value)"' "$POLICY_LEARNED_FILE" 2>/dev/null
+    else
+        echo "  (no model preference data yet)"
+    fi
+    echo ""
+    # Prompt weights
+    echo "── Prompt Section Weights ────────────────────────────────────"
+    local pw_count
+    pw_count=$(jq '.prompt_weights // {} | keys | length' "$POLICY_LEARNED_FILE" 2>/dev/null || echo "0")
+    if [[ "$pw_count" -gt 0 ]]; then
+        jq -r '
+            .prompt_weights // {} | to_entries |
+            sort_by(-.value)[] |
+            "  \(.key): \(.value)" +
+            (if .value >= 0.7 then " (include)" elif .value < 0.3 then " (exclude)" else " (neutral)" end)
+        ' "$POLICY_LEARNED_FILE" 2>/dev/null
+    else
+        echo "  (no prompt weight data yet)"
+    fi
+}