npm - autonomous-coding-toolkit - Versions diffs - 1.0.0 - Mend

autonomous-coding-toolkit 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (324) hide show

package/.claude-plugin/marketplace.json +22 -0
package/.claude-plugin/plugin.json +13 -0
package/LICENSE +21 -0
package/Makefile +21 -0
package/README.md +140 -0
package/SECURITY.md +28 -0
package/agents/bash-expert.md +113 -0
package/agents/dependency-auditor.md +138 -0
package/agents/integration-tester.md +120 -0
package/agents/lesson-scanner.md +149 -0
package/agents/python-expert.md +179 -0
package/agents/service-monitor.md +141 -0
package/agents/shell-expert.md +147 -0
package/benchmarks/runner.sh +147 -0
package/benchmarks/tasks/01-rest-endpoint/rubric.sh +29 -0
package/benchmarks/tasks/01-rest-endpoint/task.md +17 -0
package/benchmarks/tasks/02-refactor-module/task.md +8 -0
package/benchmarks/tasks/03-fix-integration-bug/task.md +8 -0
package/benchmarks/tasks/04-add-test-coverage/task.md +8 -0
package/benchmarks/tasks/05-multi-file-feature/task.md +8 -0
package/bin/act.js +238 -0
package/commands/autocode.md +6 -0
package/commands/cancel-ralph.md +18 -0
package/commands/code-factory.md +53 -0
package/commands/create-prd.md +55 -0
package/commands/ralph-loop.md +18 -0
package/commands/run-plan.md +117 -0
package/commands/submit-lesson.md +122 -0
package/docs/ARCHITECTURE.md +630 -0
package/docs/CONTRIBUTING.md +125 -0
package/docs/lessons/0001-bare-exception-swallowing.md +34 -0
package/docs/lessons/0002-async-def-without-await.md +28 -0
package/docs/lessons/0003-create-task-without-callback.md +28 -0
package/docs/lessons/0004-hardcoded-test-counts.md +28 -0
package/docs/lessons/0005-sqlite-without-closing.md +33 -0
package/docs/lessons/0006-venv-pip-path.md +27 -0
package/docs/lessons/0007-runner-state-self-rejection.md +35 -0
package/docs/lessons/0008-quality-gate-blind-spot.md +33 -0
package/docs/lessons/0009-parser-overcount-empty-batches.md +36 -0
package/docs/lessons/0010-local-outside-function-bash.md +33 -0
package/docs/lessons/0011-batch-tests-for-unimplemented-code.md +36 -0
package/docs/lessons/0012-api-markdown-unescaped-chars.md +33 -0
package/docs/lessons/0013-export-prefix-env-parsing.md +33 -0
package/docs/lessons/0014-decorator-registry-import-side-effect.md +43 -0
package/docs/lessons/0015-frontend-backend-schema-drift.md +43 -0
package/docs/lessons/0016-event-driven-cold-start-seeding.md +44 -0
package/docs/lessons/0017-copy-paste-logic-diverges.md +43 -0
package/docs/lessons/0018-layer-passes-pipeline-broken.md +45 -0
package/docs/lessons/0019-systemd-envfile-ignores-export.md +41 -0
package/docs/lessons/0020-persist-state-incrementally.md +44 -0
package/docs/lessons/0021-dual-axis-testing.md +48 -0
package/docs/lessons/0022-jsx-factory-shadowing.md +43 -0
package/docs/lessons/0023-static-analysis-spiral.md +51 -0
package/docs/lessons/0024-shared-pipeline-implementation.md +55 -0
package/docs/lessons/0025-defense-in-depth-all-entry-points.md +65 -0
package/docs/lessons/0026-linter-no-rules-false-enforcement.md +54 -0
package/docs/lessons/0027-jsx-silent-prop-drop.md +64 -0
package/docs/lessons/0028-no-infrastructure-in-client-code.md +49 -0
package/docs/lessons/0029-never-write-secrets-to-files.md +61 -0
package/docs/lessons/0030-cache-merge-not-replace.md +62 -0
package/docs/lessons/0031-verify-units-at-boundaries.md +66 -0
package/docs/lessons/0032-module-lifecycle-subscribe-unsubscribe.md +89 -0
package/docs/lessons/0033-async-iteration-mutable-snapshot.md +72 -0
package/docs/lessons/0034-caller-missing-await-silent-discard.md +65 -0
package/docs/lessons/0035-duplicate-registration-silent-overwrite.md +85 -0
package/docs/lessons/0036-websocket-dirty-disconnect.md +33 -0
package/docs/lessons/0037-parallel-agents-worktree-corruption.md +31 -0
package/docs/lessons/0038-subscribe-no-stored-ref.md +36 -0
package/docs/lessons/0039-fallback-or-default-hides-bugs.md +34 -0
package/docs/lessons/0040-event-firehose-filter-first.md +36 -0
package/docs/lessons/0041-ambiguous-base-dir-path-nesting.md +32 -0
package/docs/lessons/0042-spec-compliance-insufficient.md +36 -0
package/docs/lessons/0043-exact-count-extensible-collections.md +32 -0
package/docs/lessons/0044-relative-file-deps-worktree.md +39 -0
package/docs/lessons/0045-iterative-design-improvement.md +33 -0
package/docs/lessons/0046-plan-assertion-math-bugs.md +38 -0
package/docs/lessons/0047-pytest-single-threaded-default.md +37 -0
package/docs/lessons/0048-integration-wiring-batch.md +40 -0
package/docs/lessons/0049-ab-verification.md +41 -0
package/docs/lessons/0050-editing-sourced-files-during-execution.md +33 -0
package/docs/lessons/0051-infrastructure-fixes-cant-self-heal.md +30 -0
package/docs/lessons/0052-uncommitted-changes-poison-quality-gates.md +31 -0
package/docs/lessons/0053-jq-compact-flag-inconsistency.md +31 -0
package/docs/lessons/0054-parser-matches-inside-code-blocks.md +30 -0
package/docs/lessons/0055-agents-compensate-for-garbled-prompts.md +31 -0
package/docs/lessons/0056-grep-count-exit-code-on-zero.md +42 -0
package/docs/lessons/0057-new-artifacts-break-git-clean-gates.md +42 -0
package/docs/lessons/0058-dead-config-keys-never-consumed.md +49 -0
package/docs/lessons/0059-contract-test-shared-structures.md +53 -0
package/docs/lessons/0060-set-e-silent-death-in-runners.md +53 -0
package/docs/lessons/0061-context-injection-dirty-state.md +50 -0
package/docs/lessons/0062-sibling-bug-neighborhood-scan.md +29 -0
package/docs/lessons/0063-one-flag-two-lifetimes.md +31 -0
package/docs/lessons/0064-test-passes-wrong-reason.md +31 -0
package/docs/lessons/0065-pipefail-grep-count-double-output.md +39 -0
package/docs/lessons/0066-local-keyword-outside-function.md +37 -0
package/docs/lessons/0067-stdin-hang-non-interactive-shell.md +36 -0
package/docs/lessons/0068-agent-builds-wrong-thing-correctly.md +31 -0
package/docs/lessons/0069-plan-quality-dominates-execution.md +30 -0
package/docs/lessons/0070-spec-echo-back-prevents-drift.md +31 -0
package/docs/lessons/0071-positive-instructions-outperform-negative.md +30 -0
package/docs/lessons/0072-lost-in-the-middle-context-placement.md +30 -0
package/docs/lessons/0073-unscoped-lessons-cause-false-positives.md +30 -0
package/docs/lessons/0074-stale-context-injection-wrong-batch.md +32 -0
package/docs/lessons/0075-research-artifacts-must-persist.md +32 -0
package/docs/lessons/0076-wrong-decomposition-contaminates-downstream.md +30 -0
package/docs/lessons/0077-cherry-pick-merges-need-manual-resolution.md +30 -0
package/docs/lessons/0078-static-review-without-live-test.md +30 -0
package/docs/lessons/0079-integration-wiring-batch-required.md +32 -0
package/docs/lessons/FRAMEWORK.md +161 -0
package/docs/lessons/SUMMARY.md +201 -0
package/docs/lessons/TEMPLATE.md +85 -0
package/docs/plans/2026-02-21-code-factory-v2-design.md +204 -0
package/docs/plans/2026-02-21-code-factory-v2-implementation-plan.md +2189 -0
package/docs/plans/2026-02-21-code-factory-v2-phase4-design.md +537 -0
package/docs/plans/2026-02-21-code-factory-v2-phase4-implementation-plan.md +2012 -0
package/docs/plans/2026-02-21-hardening-pass-design.md +108 -0
package/docs/plans/2026-02-21-hardening-pass-plan.md +1378 -0
package/docs/plans/2026-02-21-mab-research-report.md +406 -0
package/docs/plans/2026-02-21-marketplace-restructure-design.md +240 -0
package/docs/plans/2026-02-21-marketplace-restructure-plan.md +832 -0
package/docs/plans/2026-02-21-phase4-completion-plan.md +697 -0
package/docs/plans/2026-02-21-validator-suite-design.md +148 -0
package/docs/plans/2026-02-21-validator-suite-plan.md +540 -0
package/docs/plans/2026-02-22-mab-research-round2.md +556 -0
package/docs/plans/2026-02-22-mab-run-design.md +462 -0
package/docs/plans/2026-02-22-mab-run-plan.md +2046 -0
package/docs/plans/2026-02-22-operations-design-methodology-research.md +681 -0
package/docs/plans/2026-02-22-research-agent-failure-taxonomy.md +532 -0
package/docs/plans/2026-02-22-research-code-guideline-policies.md +886 -0
package/docs/plans/2026-02-22-research-codebase-audit-refactoring.md +908 -0
package/docs/plans/2026-02-22-research-coding-standards-documentation.md +541 -0
package/docs/plans/2026-02-22-research-competitive-landscape.md +687 -0
package/docs/plans/2026-02-22-research-comprehensive-testing.md +1076 -0
package/docs/plans/2026-02-22-research-context-utilization.md +459 -0
package/docs/plans/2026-02-22-research-cost-quality-tradeoff.md +548 -0
package/docs/plans/2026-02-22-research-lesson-transferability.md +508 -0
package/docs/plans/2026-02-22-research-multi-agent-coordination.md +312 -0
package/docs/plans/2026-02-22-research-phase-integration.md +602 -0
package/docs/plans/2026-02-22-research-plan-quality.md +428 -0
package/docs/plans/2026-02-22-research-prompt-engineering.md +558 -0
package/docs/plans/2026-02-22-research-unconventional-perspectives.md +528 -0
package/docs/plans/2026-02-22-research-user-adoption.md +638 -0
package/docs/plans/2026-02-22-research-verification-effectiveness.md +433 -0
package/docs/plans/2026-02-23-agent-suite-design.md +299 -0
package/docs/plans/2026-02-23-agent-suite-plan.md +578 -0
package/docs/plans/2026-02-23-phase3-cost-infrastructure-design.md +148 -0
package/docs/plans/2026-02-23-phase3-cost-infrastructure-plan.md +1062 -0
package/docs/plans/2026-02-23-research-bash-expert-agent.md +543 -0
package/docs/plans/2026-02-23-research-dependency-auditor-agent.md +564 -0
package/docs/plans/2026-02-23-research-improving-existing-agents.md +503 -0
package/docs/plans/2026-02-23-research-integration-tester-agent.md +454 -0
package/docs/plans/2026-02-23-research-python-expert-agent.md +429 -0
package/docs/plans/2026-02-23-research-service-monitor-agent.md +425 -0
package/docs/plans/2026-02-23-research-shell-expert-agent.md +533 -0
package/docs/plans/2026-02-23-roadmap-to-completion.md +530 -0
package/docs/plans/2026-02-24-headless-module-split-design.md +98 -0
package/docs/plans/2026-02-24-headless-module-split.md +443 -0
package/docs/plans/2026-02-24-lesson-scope-metadata-design.md +228 -0
package/docs/plans/2026-02-24-lesson-scope-metadata-plan.md +968 -0
package/docs/plans/2026-02-24-npm-packaging-design.md +841 -0
package/docs/plans/2026-02-24-npm-packaging-plan.md +1965 -0
package/docs/plans/audit-findings.md +186 -0
package/docs/telegram-notification-format.md +98 -0
package/examples/example-plan.md +51 -0
package/examples/example-prd.json +72 -0
package/examples/example-roadmap.md +33 -0
package/examples/quickstart-plan.md +63 -0
package/hooks/hooks.json +26 -0
package/hooks/setup-symlinks.sh +48 -0
package/hooks/stop-hook.sh +135 -0
package/package.json +47 -0
package/policies/bash.md +71 -0
package/policies/python.md +71 -0
package/policies/testing.md +61 -0
package/policies/universal.md +60 -0
package/scripts/analyze-report.sh +97 -0
package/scripts/architecture-map.sh +145 -0
package/scripts/auto-compound.sh +273 -0
package/scripts/batch-audit.sh +42 -0
package/scripts/batch-test.sh +101 -0
package/scripts/entropy-audit.sh +221 -0
package/scripts/failure-digest.sh +51 -0
package/scripts/generate-ast-rules.sh +96 -0
package/scripts/init.sh +112 -0
package/scripts/lesson-check.sh +428 -0
package/scripts/lib/common.sh +61 -0
package/scripts/lib/cost-tracking.sh +153 -0
package/scripts/lib/ollama.sh +60 -0
package/scripts/lib/progress-writer.sh +128 -0
package/scripts/lib/run-plan-context.sh +215 -0
package/scripts/lib/run-plan-echo-back.sh +231 -0
package/scripts/lib/run-plan-headless.sh +396 -0
package/scripts/lib/run-plan-notify.sh +57 -0
package/scripts/lib/run-plan-parser.sh +81 -0
package/scripts/lib/run-plan-prompt.sh +215 -0
package/scripts/lib/run-plan-quality-gate.sh +132 -0
package/scripts/lib/run-plan-routing.sh +315 -0
package/scripts/lib/run-plan-sampling.sh +170 -0
package/scripts/lib/run-plan-scoring.sh +146 -0
package/scripts/lib/run-plan-state.sh +142 -0
package/scripts/lib/run-plan-team.sh +199 -0
package/scripts/lib/telegram.sh +54 -0
package/scripts/lib/thompson-sampling.sh +176 -0
package/scripts/license-check.sh +74 -0
package/scripts/mab-run.sh +575 -0
package/scripts/module-size-check.sh +146 -0
package/scripts/patterns/async-no-await.yml +5 -0
package/scripts/patterns/bare-except.yml +6 -0
package/scripts/patterns/empty-catch.yml +6 -0
package/scripts/patterns/hardcoded-localhost.yml +9 -0
package/scripts/patterns/retry-loop-no-backoff.yml +12 -0
package/scripts/pipeline-status.sh +197 -0
package/scripts/policy-check.sh +226 -0
package/scripts/prior-art-search.sh +133 -0
package/scripts/promote-mab-lessons.sh +126 -0
package/scripts/prompts/agent-a-superpowers.md +29 -0
package/scripts/prompts/agent-b-ralph.md +29 -0
package/scripts/prompts/judge-agent.md +61 -0
package/scripts/prompts/planner-agent.md +44 -0
package/scripts/pull-community-lessons.sh +90 -0
package/scripts/quality-gate.sh +266 -0
package/scripts/research-gate.sh +90 -0
package/scripts/run-plan.sh +329 -0
package/scripts/scope-infer.sh +159 -0
package/scripts/setup-ralph-loop.sh +155 -0
package/scripts/telemetry.sh +230 -0
package/scripts/tests/run-all-tests.sh +52 -0
package/scripts/tests/test-act-cli.sh +46 -0
package/scripts/tests/test-agents-md.sh +87 -0
package/scripts/tests/test-analyze-report.sh +114 -0
package/scripts/tests/test-architecture-map.sh +89 -0
package/scripts/tests/test-auto-compound.sh +169 -0
package/scripts/tests/test-batch-test.sh +65 -0
package/scripts/tests/test-benchmark-runner.sh +25 -0
package/scripts/tests/test-common.sh +168 -0
package/scripts/tests/test-cost-tracking.sh +158 -0
package/scripts/tests/test-echo-back.sh +180 -0
package/scripts/tests/test-entropy-audit.sh +146 -0
package/scripts/tests/test-failure-digest.sh +66 -0
package/scripts/tests/test-generate-ast-rules.sh +145 -0
package/scripts/tests/test-helpers.sh +82 -0
package/scripts/tests/test-init.sh +47 -0
package/scripts/tests/test-lesson-check.sh +278 -0
package/scripts/tests/test-lesson-local.sh +55 -0
package/scripts/tests/test-license-check.sh +109 -0
package/scripts/tests/test-mab-run.sh +182 -0
package/scripts/tests/test-ollama-lib.sh +49 -0
package/scripts/tests/test-ollama.sh +60 -0
package/scripts/tests/test-pipeline-status.sh +198 -0
package/scripts/tests/test-policy-check.sh +124 -0
package/scripts/tests/test-prior-art-search.sh +96 -0
package/scripts/tests/test-progress-writer.sh +140 -0
package/scripts/tests/test-promote-mab-lessons.sh +110 -0
package/scripts/tests/test-pull-community-lessons.sh +149 -0
package/scripts/tests/test-quality-gate.sh +241 -0
package/scripts/tests/test-research-gate.sh +132 -0
package/scripts/tests/test-run-plan-cli.sh +86 -0
package/scripts/tests/test-run-plan-context.sh +305 -0
package/scripts/tests/test-run-plan-e2e.sh +153 -0
package/scripts/tests/test-run-plan-headless.sh +424 -0
package/scripts/tests/test-run-plan-notify.sh +124 -0
package/scripts/tests/test-run-plan-parser.sh +217 -0
package/scripts/tests/test-run-plan-prompt.sh +254 -0
package/scripts/tests/test-run-plan-quality-gate.sh +222 -0
package/scripts/tests/test-run-plan-routing.sh +178 -0
package/scripts/tests/test-run-plan-scoring.sh +148 -0
package/scripts/tests/test-run-plan-state.sh +261 -0
package/scripts/tests/test-run-plan-team.sh +157 -0
package/scripts/tests/test-scope-infer.sh +150 -0
package/scripts/tests/test-setup-ralph-loop.sh +63 -0
package/scripts/tests/test-telegram-env.sh +38 -0
package/scripts/tests/test-telegram.sh +121 -0
package/scripts/tests/test-telemetry.sh +46 -0
package/scripts/tests/test-thompson-sampling.sh +139 -0
package/scripts/tests/test-validate-all.sh +60 -0
package/scripts/tests/test-validate-commands.sh +89 -0
package/scripts/tests/test-validate-hooks.sh +98 -0
package/scripts/tests/test-validate-lessons.sh +150 -0
package/scripts/tests/test-validate-plan-quality.sh +235 -0
package/scripts/tests/test-validate-plans.sh +187 -0
package/scripts/tests/test-validate-plugin.sh +106 -0
package/scripts/tests/test-validate-prd.sh +184 -0
package/scripts/tests/test-validate-skills.sh +134 -0
package/scripts/validate-all.sh +57 -0
package/scripts/validate-commands.sh +67 -0
package/scripts/validate-hooks.sh +89 -0
package/scripts/validate-lessons.sh +98 -0
package/scripts/validate-plan-quality.sh +369 -0
package/scripts/validate-plans.sh +120 -0
package/scripts/validate-plugin.sh +86 -0
package/scripts/validate-policies.sh +42 -0
package/scripts/validate-prd.sh +118 -0
package/scripts/validate-skills.sh +96 -0
package/skills/autocode/SKILL.md +285 -0
package/skills/autocode/ab-verification.md +51 -0
package/skills/autocode/code-quality-standards.md +37 -0
package/skills/autocode/competitive-mode.md +364 -0
package/skills/brainstorming/SKILL.md +97 -0
package/skills/capture-lesson/SKILL.md +187 -0
package/skills/check-lessons/SKILL.md +116 -0
package/skills/dispatching-parallel-agents/SKILL.md +110 -0
package/skills/executing-plans/SKILL.md +85 -0
package/skills/finishing-a-development-branch/SKILL.md +201 -0
package/skills/receiving-code-review/SKILL.md +72 -0
package/skills/requesting-code-review/SKILL.md +59 -0
package/skills/requesting-code-review/code-reviewer.md +82 -0
package/skills/research/SKILL.md +145 -0
package/skills/roadmap/SKILL.md +115 -0
package/skills/subagent-driven-development/SKILL.md +98 -0
package/skills/subagent-driven-development/code-quality-reviewer-prompt.md +18 -0
package/skills/subagent-driven-development/implementer-prompt.md +73 -0
package/skills/subagent-driven-development/spec-reviewer-prompt.md +57 -0
package/skills/systematic-debugging/SKILL.md +134 -0
package/skills/systematic-debugging/condition-based-waiting.md +64 -0
package/skills/systematic-debugging/defense-in-depth.md +32 -0
package/skills/systematic-debugging/root-cause-tracing.md +55 -0
package/skills/test-driven-development/SKILL.md +167 -0
package/skills/using-git-worktrees/SKILL.md +219 -0
package/skills/using-superpowers/SKILL.md +54 -0
package/skills/verification-before-completion/SKILL.md +140 -0
package/skills/verify/SKILL.md +82 -0
package/skills/writing-plans/SKILL.md +128 -0
package/skills/writing-skills/SKILL.md +93 -0

package/scripts/tests/test-run-plan-headless.sh ADDED Viewed

@@ -0,0 +1,424 @@
+#!/usr/bin/env bash
+# Test run-plan-headless.sh extraction
+set -euo pipefail
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+RP="$SCRIPT_DIR/../run-plan.sh"
+RPH="$SCRIPT_DIR/../lib/run-plan-headless.sh"
+RPEB="$SCRIPT_DIR/../lib/run-plan-echo-back.sh"
+RPS="$SCRIPT_DIR/../lib/run-plan-sampling.sh"
+FAILURES=0
+TESTS=0
+# Compare two strings and record the outcome.
+#   $1 - description shown in the PASS/FAIL line
+#   $2 - expected value
+#   $3 - actual value
+# Always increments TESTS; on a mismatch it prints both values and
+# increments FAILURES. Returns 0 either way.
+assert_eq() {
+    local label="$1"
+    local want="$2"
+    local got="$3"
+    TESTS=$((TESTS + 1))
+    if [[ "$want" == "$got" ]]; then
+        echo "PASS: $label"
+        return 0
+    fi
+    echo "FAIL: $label"
+    echo "  expected: $want"
+    echo "  actual:   $got"
+    FAILURES=$((FAILURES + 1))
+}
+# === Extracted file exists ===
+TESTS=$((TESTS + 1))
+if [[ -f "$RPH" ]]; then
+    echo "PASS: run-plan-headless.sh exists"
+else
+    echo "FAIL: run-plan-headless.sh should exist at scripts/lib/"
+    FAILURES=$((FAILURES + 1))
+fi
+# === Extracted echo-back file exists ===
+TESTS=$((TESTS + 1))
+if [[ -f "$RPEB" ]]; then
+    echo "PASS: run-plan-echo-back.sh exists"
+else
+    echo "FAIL: run-plan-echo-back.sh should exist at scripts/lib/"
+    FAILURES=$((FAILURES + 1))
+fi
+# === Extracted sampling file exists ===
+TESTS=$((TESTS + 1))
+if [[ -f "$RPS" ]]; then
+    echo "PASS: run-plan-sampling.sh exists"
+else
+    echo "FAIL: run-plan-sampling.sh should exist at scripts/lib/"
+    FAILURES=$((FAILURES + 1))
+fi
+# === run-plan.sh sources it ===
+TESTS=$((TESTS + 1))
+if grep -q 'source.*lib/run-plan-headless.sh' "$RP"; then
+    echo "PASS: run-plan.sh sources lib/run-plan-headless.sh"
+else
+    echo "FAIL: run-plan.sh should source lib/run-plan-headless.sh"
+    FAILURES=$((FAILURES + 1))
+fi
+# === run-plan.sh sources new modules ===
+TESTS=$((TESTS + 1))
+if grep -q 'source.*lib/run-plan-echo-back.sh' "$RP"; then
+    echo "PASS: run-plan.sh sources lib/run-plan-echo-back.sh"
+else
+    echo "FAIL: run-plan.sh should source lib/run-plan-echo-back.sh"
+    FAILURES=$((FAILURES + 1))
+fi
+TESTS=$((TESTS + 1))
+if grep -q 'source.*lib/run-plan-sampling.sh' "$RP"; then
+    echo "PASS: run-plan.sh sources lib/run-plan-sampling.sh"
+else
+    echo "FAIL: run-plan.sh should source lib/run-plan-sampling.sh"
+    FAILURES=$((FAILURES + 1))
+fi
+# === run_mode_headless() lives only in the extracted file ===
+# run-plan.sh must not contain the text "run_mode_headless()" at all ...
+TESTS=$((TESTS + 1))
+if ! grep -q 'run_mode_headless()' "$RP"; then
+    echo "PASS: run_mode_headless() not defined in run-plan.sh"
+else
+    echo "FAIL: run-plan.sh should not define run_mode_headless()"
+    FAILURES=$((FAILURES + 1))
+fi
+# ... while the extracted module must contain it
+TESTS=$((TESTS + 1))
+if ! grep -q 'run_mode_headless()' "$RPH"; then
+    echo "FAIL: run-plan-headless.sh should define run_mode_headless()"
+    FAILURES=$((FAILURES + 1))
+else
+    echo "PASS: run-plan-headless.sh defines run_mode_headless()"
+fi
+# === run-plan.sh is under 330 lines ===
+line_count=$(wc -l < "$RP")
+TESTS=$((TESTS + 1))
+if [[ $line_count -le 330 ]]; then
+    echo "PASS: run-plan.sh is $line_count lines (<=330)"
+else
+    echo "FAIL: run-plan.sh is $line_count lines (should be <=330)"
+    FAILURES=$((FAILURES + 1))
+fi
+# === Extracted file has the key logic markers ===
+TESTS=$((TESTS + 1))
+if grep -q 'mkdir -p.*logs' "$RPH"; then
+    echo "PASS: headless file creates logs directory"
+else
+    echo "FAIL: headless file should create logs directory"
+    FAILURES=$((FAILURES + 1))
+fi
+TESTS=$((TESTS + 1))
+if grep -q 'claude -p' "$RPH"; then
+    echo "PASS: headless file calls claude -p"
+else
+    echo "FAIL: headless file should call claude -p"
+    FAILURES=$((FAILURES + 1))
+fi
+# === Empty batch detection ===
+# A batch header with no body must produce empty batch text while still being
+# counted as a header. Only the parser side is checked here; the headless-mode
+# integration is tested separately.
+WORK=$(mktemp -d)
+trap 'rm -rf "$WORK"' EXIT
+source "$SCRIPT_DIR/../lib/run-plan-parser.sh"
+empty_plan="$WORK/plan-empty.md"
+# Fixture: two batches with content followed by a bare "## Batch 3:" header
+printf '%s\n' \
+    '## Batch 1: Real Batch' \
+    '### Task 1: Do something' \
+    'Write some code.' \
+    '## Batch 2: Also Real' \
+    '### Task 2: Do more' \
+    'Write more code.' \
+    '## Batch 3:' > "$empty_plan"
+# Batch 3 has no body, so its text must come back empty
+batch3_text=$(get_batch_text "$empty_plan" 3)
+assert_eq "get_batch_text: empty batch returns empty" "" "$batch3_text"
+# Counting is header-based, so the empty batch is still included
+batch_total=$(count_batches "$empty_plan")
+assert_eq "count_batches: counts all headers including empty" "3" "$batch_total"
+# === Bug #4: CLAUDE.md Run-Plan section removal uses awk not sed ===
+# The sed range deletion pattern '/^## Run-Plan:/,/^## [^R]/' has no terminating
+# anchor when Run-Plan is the last section, so it deletes from Run-Plan to EOF.
+# The fix replaces it with awk which handles last-section correctly.
+TESTS=$((TESTS + 1))
+# awk plus its in_section state variable must both appear in the headless module
+if grep -q "awk" "$RPH" && grep -q 'in_section' "$RPH"; then
+    echo "PASS: CLAUDE.md section removal uses awk (last-section safe, bug #4)"
+else
+    echo "FAIL: CLAUDE.md section removal should use awk to handle last section correctly (bug #4)"
+    FAILURES=$((FAILURES + 1))
+fi
+TESTS=$((TESTS + 1))
+# The old broken sed range expression must not be present. It is matched as a
+# fixed string (-F) so none of its regex metacharacters need escaping; this
+# replaces two overlapping regexes that relied on undefined escapes such as
+# "\#" and silenced the resulting diagnostics with 2>/dev/null.
+if grep -qF -- "sed '/^## Run-Plan:/,/^## [^R]" "$RPH"; then
+    echo "FAIL: Old sed range deletion pattern still present (unbounded at last section, bug #4)"
+    FAILURES=$((FAILURES + 1))
+else
+    echo "PASS: Old unbounded sed range deletion pattern removed"
+fi
+# === Bug #16/#28: SAMPLE_COUNT resets at top of batch loop using SAMPLE_DEFAULT ===
+# User's --sample value must be preserved into SAMPLE_DEFAULT before the loop
+TESTS=$((TESTS + 1))
+if grep -q 'SAMPLE_DEFAULT=.*SAMPLE_COUNT' "$RPH"; then
+    echo "PASS: SAMPLE_DEFAULT saves user's --sample value before batch loop"
+else
+    echo "FAIL: SAMPLE_DEFAULT should save user's --sample value before batch loop (bug #16/#28)"
+    FAILURES=$((FAILURES + 1))
+fi
+# The reset inside the loop must use SAMPLE_DEFAULT, not hardcoded 0
+TESTS=$((TESTS + 1))
+batch_loop_region=$(sed -n '/for ((batch = START_BATCH/,/SAMPLE_ON_RETRY/p' "$RPH")
+if echo "$batch_loop_region" | grep -q 'SAMPLE_COUNT=\$SAMPLE_DEFAULT'; then
+    echo "PASS: SAMPLE_COUNT resets to SAMPLE_DEFAULT at start of each batch iteration"
+else
+    echo "FAIL: SAMPLE_COUNT should reset to SAMPLE_DEFAULT (not 0) at start of each batch iteration (bug #16/#28)"
+    FAILURES=$((FAILURES + 1))
+fi
+# === Bug #2/#27: Sampling block uses patch files instead of stash ===
+# The fix replaced git stash/pop with git diff > patch + git apply to
+# eliminate LIFO ordering issues. These tests verify the new approach.
+# Baseline state must be saved as a patch file (not stash)
+TESTS=$((TESTS + 1))
+if grep -q '_baseline_patch' "$RPS"; then
+    echo "PASS: run-plan-sampling.sh saves baseline state as a patch file"
+else
+    echo "FAIL: run-plan-sampling.sh should save baseline state as a patch file (bug #2/#27)"
+    FAILURES=$((FAILURES + 1))
+fi
+# Winner state must be saved as a patch file (not stash)
+TESTS=$((TESTS + 1))
+if grep -q '_winner_patch\|run-plan-winner' "$RPS"; then
+    echo "PASS: run-plan-sampling.sh saves winner state as a patch file"
+else
+    echo "FAIL: run-plan-sampling.sh should save winner state as a patch file (bug #2/#27)"
+    FAILURES=$((FAILURES + 1))
+fi
+# No executable git stash usage remaining in sampling module (patch approach replaces it).
+# Filter out comment lines (lines starting with optional whitespace + #).
+TESTS=$((TESTS + 1))
+sampling_block=$(sed -n '/^run_sampling_candidates()/,/^}/p' "$RPS")
+# Strip comment-only lines before counting stash calls
+stash_uses=$(echo "$sampling_block" | grep -v '^\s*#' | grep -c 'git stash' || true)
+if [[ "$stash_uses" -eq 0 ]]; then
+    echo "PASS: No git stash calls in run_sampling_candidates (replaced by patch approach)"
+else
+    echo "FAIL: Found $stash_uses git stash call(s) in run_sampling_candidates — should use patch files (bug #2/#27)"
+    FAILURES=$((FAILURES + 1))
+fi
+# Restore of winner uses git apply (patch approach)
+TESTS=$((TESTS + 1))
+if echo "$sampling_block" | grep -q 'git apply'; then
+    echo "PASS: run_sampling_candidates uses git apply to restore winner state"
+else
+    echo "FAIL: run_sampling_candidates should use git apply to restore winner state (bug #2/#27)"
+    FAILURES=$((FAILURES + 1))
+fi
+# === Bug #30: Echo-back gate behavior ===
+# run-plan.sh must accept --skip-echo-back without error
+TESTS=$((TESTS + 1))
+if grep -q '\-\-skip-echo-back' "$RP"; then
+    echo "PASS: run-plan.sh accepts --skip-echo-back flag"
+else
+    echo "FAIL: run-plan.sh should define --skip-echo-back flag (bug #30)"
+    FAILURES=$((FAILURES + 1))
+fi
+# run-plan.sh must accept --strict-echo-back without error
+TESTS=$((TESTS + 1))
+if grep -q '\-\-strict-echo-back' "$RP"; then
+    echo "PASS: run-plan.sh accepts --strict-echo-back flag"
+else
+    echo "FAIL: run-plan.sh should define --strict-echo-back flag (bug #30)"
+    FAILURES=$((FAILURES + 1))
+fi
+# _echo_back_check function must exist in headless file
+TESTS=$((TESTS + 1))
+if grep -q '_echo_back_check()' "$RPEB"; then
+    echo "PASS: _echo_back_check() is defined in run-plan-echo-back.sh"
+else
+    echo "FAIL: _echo_back_check() should be defined in run-plan-echo-back.sh (bug #30)"
+    FAILURES=$((FAILURES + 1))
+fi
+# Echo-back gate must be non-blocking by default (no early return when STRICT_ECHO_BACK not set)
+TESTS=$((TESTS + 1))
+if grep -q 'STRICT_ECHO_BACK' "$RPEB"; then
+    echo "PASS: STRICT_ECHO_BACK controls blocking behavior in echo-back gate"
+else
+    echo "FAIL: echo-back gate should check STRICT_ECHO_BACK for blocking mode (bug #30)"
+    FAILURES=$((FAILURES + 1))
+fi
+# echo-back gate is documented as non-blocking by default
+TESTS=$((TESTS + 1))
+if grep -q 'NON-BLOCKING' "$RPEB"; then
+    echo "PASS: run-plan-echo-back.sh documents NON-BLOCKING default behavior"
+else
+    echo "FAIL: run-plan-echo-back.sh should document NON-BLOCKING default (bug #30)"
+    FAILURES=$((FAILURES + 1))
+fi
+# _echo_back_check: SKIP_ECHO_BACK=true must cause early return without error
+TESTS=$((TESTS + 1))
+(
+    source "$RPEB" 2>/dev/null || true
+    SKIP_ECHO_BACK=true
+    STRICT_ECHO_BACK=false
+    _echo_back_check "some batch text here" "/nonexistent/log" 2>/dev/null
+) && echo "PASS: _echo_back_check returns 0 when SKIP_ECHO_BACK=true" \
+  || {
+    echo "FAIL: _echo_back_check should return 0 when SKIP_ECHO_BACK=true (bug #30)"
+    FAILURES=$((FAILURES + 1))
+}
+# _echo_back_check: missing log file does not crash
+TESTS=$((TESTS + 1))
+(
+    source "$RPEB" 2>/dev/null || true
+    SKIP_ECHO_BACK=false
+    STRICT_ECHO_BACK=false
+    _echo_back_check "some batch text here" "/nonexistent/log" 2>/dev/null
+) && echo "PASS: _echo_back_check handles missing log file gracefully" \
+  || {
+    echo "FAIL: _echo_back_check should handle missing log file gracefully (bug #30)"
+    FAILURES=$((FAILURES + 1))
+}
+# _echo_back_check: empty batch text does not crash
+TESTS=$((TESTS + 1))
+tmplog=$(mktemp)
+echo "some agent output here" > "$tmplog"
+(
+    source "$RPEB" 2>/dev/null || true
+    SKIP_ECHO_BACK=false
+    STRICT_ECHO_BACK=false
+    _echo_back_check "" "$tmplog" 2>/dev/null
+)
+ec=$?
+rm -f "$tmplog"
+if [[ $ec -eq 0 ]]; then
+    echo "PASS: _echo_back_check handles empty batch text gracefully"
+else
+    echo "FAIL: _echo_back_check should handle empty batch text without error (bug #30)"
+    FAILURES=$((FAILURES + 1))
+fi
+# === Bug #4 BEHAVIORAL: awk removes Run-Plan even when it's the last section ===
+# With the old sed range '/^## Run-Plan:/,/^## [^R]/' there was no closing
+# anchor when Run-Plan came last, so everything from Run-Plan to EOF was eaten.
+# Here the awk filter is run against a CLAUDE.md fixture whose final section is
+# "## Run-Plan:", and the surviving content is inspected.
+awk_work=$(mktemp -d)
+claude_md="$awk_work/CLAUDE.md"
+# Fixture: Run-Plan is the LAST section
+cat > "$claude_md" << 'FIXTURE'
+# Project Config
+## Conventions
+- Use pytest
+- Stage specific files
+## Run-Plan: Batch 3
+### Recent Commits
+abc1234 fix: something
+### Progress Notes
+Batch 2 done.
+FIXTURE
+# Same awk program that run-plan-headless.sh is expected to use inline:
+# drop lines from a "## Run-Plan:" header until the next "## " header.
+awk '
+    /^## Run-Plan:/ { in_section=1; next }
+    in_section && /^## / { in_section=0 }
+    !in_section { print }
+' "$claude_md" > "$claude_md.tmp"
+mv "$claude_md.tmp" "$claude_md"
+# The Run-Plan header must be gone
+TESTS=$((TESTS + 1))
+if ! grep -q "## Run-Plan:" "$claude_md"; then
+    echo "PASS: awk last-section: Run-Plan section removed"
+else
+    echo "FAIL: awk last-section: Run-Plan section should be removed"
+    FAILURES=$((FAILURES + 1))
+fi
+# The Conventions header must survive (no unbounded deletion)
+TESTS=$((TESTS + 1))
+if ! grep -q "## Conventions" "$claude_md"; then
+    echo "FAIL: awk last-section: Conventions section should survive Run-Plan removal"
+    FAILURES=$((FAILURES + 1))
+else
+    echo "PASS: awk last-section: Conventions section preserved"
+fi
+# Body text ahead of Run-Plan must survive as well
+TESTS=$((TESTS + 1))
+if ! grep -q "Use pytest" "$claude_md"; then
+    echo "FAIL: awk last-section: content before Run-Plan should be preserved"
+    FAILURES=$((FAILURES + 1))
+else
+    echo "PASS: awk last-section: content before Run-Plan preserved"
+fi
+rm -rf "$awk_work"
+# === Bug #38: Empty claude output diagnostic ===
+# The headless module must carry the "claude produced no output" warning text
+TESTS=$((TESTS + 1))
+if ! grep -q 'claude produced no output' "$RPH"; then
+    echo "FAIL: Should diagnose empty claude output (crash/no output case) (bug #38)"
+    FAILURES=$((FAILURES + 1))
+else
+    echo "PASS: Empty claude output is diagnosed with a warning message (#38)"
+fi
+# === Summary ===
+# Report passed/total, then exit 1 if anything failed
+passed=$((TESTS - FAILURES))
+echo ""
+echo "Results: $passed/$TESTS passed"
+if (( FAILURES == 0 )); then
+    echo "ALL PASSED"
+else
+    echo "FAILURES: $FAILURES"
+    exit 1
+fi

package/scripts/tests/test-run-plan-notify.sh ADDED Viewed

@@ -0,0 +1,124 @@
+#!/usr/bin/env bash
+# Test notification format functions (no actual Telegram sending)
+# Sources ../lib/run-plan-notify.sh (relative to this script) and tallies
+# results in the TESTS / FAILURES counters; exits 1 if any check failed.
+set -euo pipefail
+# Resolve this script's own directory so the library path works from any cwd.
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+source "$SCRIPT_DIR/../lib/run-plan-notify.sh"
+# Counters updated by the assert helpers and inline checks, read by the final summary.
+FAILURES=0
+TESTS=0
+assert_contains() {
+    local desc="$1" needle="$2" haystack="$3"
+    TESTS=$((TESTS + 1))
+    if [[ "$haystack" == *"$needle"* ]]; then
+        echo "PASS: $desc"
+    else
+        echo "FAIL: $desc"
+        echo "  expected to contain: $needle"
+        echo "  actual:              $haystack"
+        FAILURES=$((FAILURES + 1))
+    fi
+}
+# assert_eq DESC EXPECTED ACTUAL
+# Counts one test; prints "PASS: DESC" when the two strings are identical,
+# otherwise prints both values and bumps FAILURES.
+assert_eq() {
+    local label="$1" want="$2" got="$3"
+    TESTS=$((TESTS + 1))
+    if [[ "$want" != "$got" ]]; then
+        echo "FAIL: $label"
+        echo "  expected: $want"
+        echo "  actual:   $got"
+        FAILURES=$((FAILURES + 1))
+        return
+    fi
+    echo "PASS: $label"
+}
+# --- Test: format_success_message includes plan name ---
+# One message is rendered here and inspected by every assertion down to the
+# "with summary" case, which renders its own.
+msg=$(format_success_message "my-feature" 3 10 "Context Assembler" 2003 1953 "4m12s" "headless" "")
+assert_contains "success includes plan name" "my-feature" "$msg"
+# --- Test: format_success_message includes batch X/Y ---
+assert_contains "success includes batch X/Y" "Batch 3/10" "$msg"
+# --- Test: format_success_message includes batch title ---
+assert_contains "success includes batch title" "Context Assembler" "$msg"
+# --- Test: format_success_message includes check mark ---
+assert_contains "success includes check mark" "✓" "$msg"
+# --- Test: format_success_message includes test count ---
+assert_contains "success includes test count" "2003" "$msg"
+# --- Test: format_success_message includes delta with up arrow ---
+assert_contains "success includes delta" "↑50" "$msg"
+# --- Test: format_success_message delta calculation: 2003 - 1953 = 50 ---
+# "↑50" must not be followed by another digit. Excluding only the substring
+# "↑500" would still accept values such as ↑501 or ↑5012.
+TESTS=$((TESTS + 1))
+# Kept in a variable so the regex metacharacters are not subject to shell quoting rules.
+delta_exact_re='↑50([^0-9]|$)'
+if [[ "$msg" =~ $delta_exact_re ]]; then
+    echo "PASS: delta is exactly 50"
+else
+    echo "FAIL: delta should be exactly 50 (2003 - 1953)"
+    echo "  message: $msg"
+    FAILURES=$((FAILURES + 1))
+fi
+# --- Test: format_success_message includes duration ---
+assert_contains "success includes duration" "4m12s" "$msg"
+# --- Test: format_success_message includes mode ---
+assert_contains "success includes mode" "headless" "$msg"
+# --- Test: format_success_message with summary ---
+# Same call shape, but with a non-empty final argument that must appear in the output.
+msg=$(format_success_message "my-feature" 1 5 "Quick Fixes" 100 90 "2m30s" "headless" "Added 3 tests, fixed parser")
+assert_contains "success includes summary" "Added 3 tests, fixed parser" "$msg"
+# --- Test: format_failure_message includes plan name ---
+msg=$(format_failure_message "my-feature" 2 8 "ast-grep Rules" 45 3 "pytest failed" "Fix test_auth.py")
+assert_contains "failure includes plan name" "my-feature" "$msg"
+# --- Test: format_failure_message includes batch X/Y ---
+assert_contains "failure includes batch X/Y" "Batch 2/8" "$msg"
+# --- Test: format_failure_message includes batch title ---
+assert_contains "failure includes batch title" "ast-grep Rules" "$msg"
+# --- Test: format_failure_message includes cross mark ---
+assert_contains "failure includes cross mark" "✗" "$msg"
+# --- Test: format_failure_message includes test count ---
+assert_contains "failure includes test count" "45" "$msg"
+# --- Test: format_failure_message includes failing count ---
+assert_contains "failure includes failing count" "3 failing" "$msg"
+# --- Test: format_failure_message includes error as Issue ---
+assert_contains "failure includes issue text" "pytest failed" "$msg"
+# --- Test: format_failure_message includes action ---
+assert_contains "failure includes action" "Fix test_auth.py" "$msg"
+# --- Test: _load_telegram_env warns on missing file ---
+WORK=$(mktemp -d)
+trap 'rm -rf "$WORK"' EXIT
+msg=$(_load_telegram_env "$WORK/.env-nonexistent" 2>&1 || true)
+assert_contains "warns on missing env file" "warn" "$(echo "$msg" | tr '[:upper:]' '[:lower:]')"
+# --- Test: _send_telegram warns on missing token ---
+unset TELEGRAM_BOT_TOKEN 2>/dev/null || true
+unset TELEGRAM_CHAT_ID 2>/dev/null || true
+msg=$(_send_telegram "test message" 2>&1 || true)
+assert_contains "send warns on missing credentials" "warn" "$(echo "$msg" | tr '[:upper:]' '[:lower:]')"
+# --- Test: format_success_message with zero delta ---
+msg=$(format_success_message "zero-delta" 1 1 "Single Batch" 100 100 "1m00s" "team" "")
+assert_contains "zero delta shows ↑0" "↑0" "$msg"
+echo ""
+echo "Results: $((TESTS - FAILURES))/$TESTS passed"
+if [[ $FAILURES -gt 0 ]]; then
+    echo "FAILURES: $FAILURES"
+    exit 1
+fi
+echo "ALL PASSED"