autonomous-coding-toolkit 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (324) hide show
  1. package/.claude-plugin/marketplace.json +22 -0
  2. package/.claude-plugin/plugin.json +13 -0
  3. package/LICENSE +21 -0
  4. package/Makefile +21 -0
  5. package/README.md +140 -0
  6. package/SECURITY.md +28 -0
  7. package/agents/bash-expert.md +113 -0
  8. package/agents/dependency-auditor.md +138 -0
  9. package/agents/integration-tester.md +120 -0
  10. package/agents/lesson-scanner.md +149 -0
  11. package/agents/python-expert.md +179 -0
  12. package/agents/service-monitor.md +141 -0
  13. package/agents/shell-expert.md +147 -0
  14. package/benchmarks/runner.sh +147 -0
  15. package/benchmarks/tasks/01-rest-endpoint/rubric.sh +29 -0
  16. package/benchmarks/tasks/01-rest-endpoint/task.md +17 -0
  17. package/benchmarks/tasks/02-refactor-module/task.md +8 -0
  18. package/benchmarks/tasks/03-fix-integration-bug/task.md +8 -0
  19. package/benchmarks/tasks/04-add-test-coverage/task.md +8 -0
  20. package/benchmarks/tasks/05-multi-file-feature/task.md +8 -0
  21. package/bin/act.js +238 -0
  22. package/commands/autocode.md +6 -0
  23. package/commands/cancel-ralph.md +18 -0
  24. package/commands/code-factory.md +53 -0
  25. package/commands/create-prd.md +55 -0
  26. package/commands/ralph-loop.md +18 -0
  27. package/commands/run-plan.md +117 -0
  28. package/commands/submit-lesson.md +122 -0
  29. package/docs/ARCHITECTURE.md +630 -0
  30. package/docs/CONTRIBUTING.md +125 -0
  31. package/docs/lessons/0001-bare-exception-swallowing.md +34 -0
  32. package/docs/lessons/0002-async-def-without-await.md +28 -0
  33. package/docs/lessons/0003-create-task-without-callback.md +28 -0
  34. package/docs/lessons/0004-hardcoded-test-counts.md +28 -0
  35. package/docs/lessons/0005-sqlite-without-closing.md +33 -0
  36. package/docs/lessons/0006-venv-pip-path.md +27 -0
  37. package/docs/lessons/0007-runner-state-self-rejection.md +35 -0
  38. package/docs/lessons/0008-quality-gate-blind-spot.md +33 -0
  39. package/docs/lessons/0009-parser-overcount-empty-batches.md +36 -0
  40. package/docs/lessons/0010-local-outside-function-bash.md +33 -0
  41. package/docs/lessons/0011-batch-tests-for-unimplemented-code.md +36 -0
  42. package/docs/lessons/0012-api-markdown-unescaped-chars.md +33 -0
  43. package/docs/lessons/0013-export-prefix-env-parsing.md +33 -0
  44. package/docs/lessons/0014-decorator-registry-import-side-effect.md +43 -0
  45. package/docs/lessons/0015-frontend-backend-schema-drift.md +43 -0
  46. package/docs/lessons/0016-event-driven-cold-start-seeding.md +44 -0
  47. package/docs/lessons/0017-copy-paste-logic-diverges.md +43 -0
  48. package/docs/lessons/0018-layer-passes-pipeline-broken.md +45 -0
  49. package/docs/lessons/0019-systemd-envfile-ignores-export.md +41 -0
  50. package/docs/lessons/0020-persist-state-incrementally.md +44 -0
  51. package/docs/lessons/0021-dual-axis-testing.md +48 -0
  52. package/docs/lessons/0022-jsx-factory-shadowing.md +43 -0
  53. package/docs/lessons/0023-static-analysis-spiral.md +51 -0
  54. package/docs/lessons/0024-shared-pipeline-implementation.md +55 -0
  55. package/docs/lessons/0025-defense-in-depth-all-entry-points.md +65 -0
  56. package/docs/lessons/0026-linter-no-rules-false-enforcement.md +54 -0
  57. package/docs/lessons/0027-jsx-silent-prop-drop.md +64 -0
  58. package/docs/lessons/0028-no-infrastructure-in-client-code.md +49 -0
  59. package/docs/lessons/0029-never-write-secrets-to-files.md +61 -0
  60. package/docs/lessons/0030-cache-merge-not-replace.md +62 -0
  61. package/docs/lessons/0031-verify-units-at-boundaries.md +66 -0
  62. package/docs/lessons/0032-module-lifecycle-subscribe-unsubscribe.md +89 -0
  63. package/docs/lessons/0033-async-iteration-mutable-snapshot.md +72 -0
  64. package/docs/lessons/0034-caller-missing-await-silent-discard.md +65 -0
  65. package/docs/lessons/0035-duplicate-registration-silent-overwrite.md +85 -0
  66. package/docs/lessons/0036-websocket-dirty-disconnect.md +33 -0
  67. package/docs/lessons/0037-parallel-agents-worktree-corruption.md +31 -0
  68. package/docs/lessons/0038-subscribe-no-stored-ref.md +36 -0
  69. package/docs/lessons/0039-fallback-or-default-hides-bugs.md +34 -0
  70. package/docs/lessons/0040-event-firehose-filter-first.md +36 -0
  71. package/docs/lessons/0041-ambiguous-base-dir-path-nesting.md +32 -0
  72. package/docs/lessons/0042-spec-compliance-insufficient.md +36 -0
  73. package/docs/lessons/0043-exact-count-extensible-collections.md +32 -0
  74. package/docs/lessons/0044-relative-file-deps-worktree.md +39 -0
  75. package/docs/lessons/0045-iterative-design-improvement.md +33 -0
  76. package/docs/lessons/0046-plan-assertion-math-bugs.md +38 -0
  77. package/docs/lessons/0047-pytest-single-threaded-default.md +37 -0
  78. package/docs/lessons/0048-integration-wiring-batch.md +40 -0
  79. package/docs/lessons/0049-ab-verification.md +41 -0
  80. package/docs/lessons/0050-editing-sourced-files-during-execution.md +33 -0
  81. package/docs/lessons/0051-infrastructure-fixes-cant-self-heal.md +30 -0
  82. package/docs/lessons/0052-uncommitted-changes-poison-quality-gates.md +31 -0
  83. package/docs/lessons/0053-jq-compact-flag-inconsistency.md +31 -0
  84. package/docs/lessons/0054-parser-matches-inside-code-blocks.md +30 -0
  85. package/docs/lessons/0055-agents-compensate-for-garbled-prompts.md +31 -0
  86. package/docs/lessons/0056-grep-count-exit-code-on-zero.md +42 -0
  87. package/docs/lessons/0057-new-artifacts-break-git-clean-gates.md +42 -0
  88. package/docs/lessons/0058-dead-config-keys-never-consumed.md +49 -0
  89. package/docs/lessons/0059-contract-test-shared-structures.md +53 -0
  90. package/docs/lessons/0060-set-e-silent-death-in-runners.md +53 -0
  91. package/docs/lessons/0061-context-injection-dirty-state.md +50 -0
  92. package/docs/lessons/0062-sibling-bug-neighborhood-scan.md +29 -0
  93. package/docs/lessons/0063-one-flag-two-lifetimes.md +31 -0
  94. package/docs/lessons/0064-test-passes-wrong-reason.md +31 -0
  95. package/docs/lessons/0065-pipefail-grep-count-double-output.md +39 -0
  96. package/docs/lessons/0066-local-keyword-outside-function.md +37 -0
  97. package/docs/lessons/0067-stdin-hang-non-interactive-shell.md +36 -0
  98. package/docs/lessons/0068-agent-builds-wrong-thing-correctly.md +31 -0
  99. package/docs/lessons/0069-plan-quality-dominates-execution.md +30 -0
  100. package/docs/lessons/0070-spec-echo-back-prevents-drift.md +31 -0
  101. package/docs/lessons/0071-positive-instructions-outperform-negative.md +30 -0
  102. package/docs/lessons/0072-lost-in-the-middle-context-placement.md +30 -0
  103. package/docs/lessons/0073-unscoped-lessons-cause-false-positives.md +30 -0
  104. package/docs/lessons/0074-stale-context-injection-wrong-batch.md +32 -0
  105. package/docs/lessons/0075-research-artifacts-must-persist.md +32 -0
  106. package/docs/lessons/0076-wrong-decomposition-contaminates-downstream.md +30 -0
  107. package/docs/lessons/0077-cherry-pick-merges-need-manual-resolution.md +30 -0
  108. package/docs/lessons/0078-static-review-without-live-test.md +30 -0
  109. package/docs/lessons/0079-integration-wiring-batch-required.md +32 -0
  110. package/docs/lessons/FRAMEWORK.md +161 -0
  111. package/docs/lessons/SUMMARY.md +201 -0
  112. package/docs/lessons/TEMPLATE.md +85 -0
  113. package/docs/plans/2026-02-21-code-factory-v2-design.md +204 -0
  114. package/docs/plans/2026-02-21-code-factory-v2-implementation-plan.md +2189 -0
  115. package/docs/plans/2026-02-21-code-factory-v2-phase4-design.md +537 -0
  116. package/docs/plans/2026-02-21-code-factory-v2-phase4-implementation-plan.md +2012 -0
  117. package/docs/plans/2026-02-21-hardening-pass-design.md +108 -0
  118. package/docs/plans/2026-02-21-hardening-pass-plan.md +1378 -0
  119. package/docs/plans/2026-02-21-mab-research-report.md +406 -0
  120. package/docs/plans/2026-02-21-marketplace-restructure-design.md +240 -0
  121. package/docs/plans/2026-02-21-marketplace-restructure-plan.md +832 -0
  122. package/docs/plans/2026-02-21-phase4-completion-plan.md +697 -0
  123. package/docs/plans/2026-02-21-validator-suite-design.md +148 -0
  124. package/docs/plans/2026-02-21-validator-suite-plan.md +540 -0
  125. package/docs/plans/2026-02-22-mab-research-round2.md +556 -0
  126. package/docs/plans/2026-02-22-mab-run-design.md +462 -0
  127. package/docs/plans/2026-02-22-mab-run-plan.md +2046 -0
  128. package/docs/plans/2026-02-22-operations-design-methodology-research.md +681 -0
  129. package/docs/plans/2026-02-22-research-agent-failure-taxonomy.md +532 -0
  130. package/docs/plans/2026-02-22-research-code-guideline-policies.md +886 -0
  131. package/docs/plans/2026-02-22-research-codebase-audit-refactoring.md +908 -0
  132. package/docs/plans/2026-02-22-research-coding-standards-documentation.md +541 -0
  133. package/docs/plans/2026-02-22-research-competitive-landscape.md +687 -0
  134. package/docs/plans/2026-02-22-research-comprehensive-testing.md +1076 -0
  135. package/docs/plans/2026-02-22-research-context-utilization.md +459 -0
  136. package/docs/plans/2026-02-22-research-cost-quality-tradeoff.md +548 -0
  137. package/docs/plans/2026-02-22-research-lesson-transferability.md +508 -0
  138. package/docs/plans/2026-02-22-research-multi-agent-coordination.md +312 -0
  139. package/docs/plans/2026-02-22-research-phase-integration.md +602 -0
  140. package/docs/plans/2026-02-22-research-plan-quality.md +428 -0
  141. package/docs/plans/2026-02-22-research-prompt-engineering.md +558 -0
  142. package/docs/plans/2026-02-22-research-unconventional-perspectives.md +528 -0
  143. package/docs/plans/2026-02-22-research-user-adoption.md +638 -0
  144. package/docs/plans/2026-02-22-research-verification-effectiveness.md +433 -0
  145. package/docs/plans/2026-02-23-agent-suite-design.md +299 -0
  146. package/docs/plans/2026-02-23-agent-suite-plan.md +578 -0
  147. package/docs/plans/2026-02-23-phase3-cost-infrastructure-design.md +148 -0
  148. package/docs/plans/2026-02-23-phase3-cost-infrastructure-plan.md +1062 -0
  149. package/docs/plans/2026-02-23-research-bash-expert-agent.md +543 -0
  150. package/docs/plans/2026-02-23-research-dependency-auditor-agent.md +564 -0
  151. package/docs/plans/2026-02-23-research-improving-existing-agents.md +503 -0
  152. package/docs/plans/2026-02-23-research-integration-tester-agent.md +454 -0
  153. package/docs/plans/2026-02-23-research-python-expert-agent.md +429 -0
  154. package/docs/plans/2026-02-23-research-service-monitor-agent.md +425 -0
  155. package/docs/plans/2026-02-23-research-shell-expert-agent.md +533 -0
  156. package/docs/plans/2026-02-23-roadmap-to-completion.md +530 -0
  157. package/docs/plans/2026-02-24-headless-module-split-design.md +98 -0
  158. package/docs/plans/2026-02-24-headless-module-split.md +443 -0
  159. package/docs/plans/2026-02-24-lesson-scope-metadata-design.md +228 -0
  160. package/docs/plans/2026-02-24-lesson-scope-metadata-plan.md +968 -0
  161. package/docs/plans/2026-02-24-npm-packaging-design.md +841 -0
  162. package/docs/plans/2026-02-24-npm-packaging-plan.md +1965 -0
  163. package/docs/plans/audit-findings.md +186 -0
  164. package/docs/telegram-notification-format.md +98 -0
  165. package/examples/example-plan.md +51 -0
  166. package/examples/example-prd.json +72 -0
  167. package/examples/example-roadmap.md +33 -0
  168. package/examples/quickstart-plan.md +63 -0
  169. package/hooks/hooks.json +26 -0
  170. package/hooks/setup-symlinks.sh +48 -0
  171. package/hooks/stop-hook.sh +135 -0
  172. package/package.json +47 -0
  173. package/policies/bash.md +71 -0
  174. package/policies/python.md +71 -0
  175. package/policies/testing.md +61 -0
  176. package/policies/universal.md +60 -0
  177. package/scripts/analyze-report.sh +97 -0
  178. package/scripts/architecture-map.sh +145 -0
  179. package/scripts/auto-compound.sh +273 -0
  180. package/scripts/batch-audit.sh +42 -0
  181. package/scripts/batch-test.sh +101 -0
  182. package/scripts/entropy-audit.sh +221 -0
  183. package/scripts/failure-digest.sh +51 -0
  184. package/scripts/generate-ast-rules.sh +96 -0
  185. package/scripts/init.sh +112 -0
  186. package/scripts/lesson-check.sh +428 -0
  187. package/scripts/lib/common.sh +61 -0
  188. package/scripts/lib/cost-tracking.sh +153 -0
  189. package/scripts/lib/ollama.sh +60 -0
  190. package/scripts/lib/progress-writer.sh +128 -0
  191. package/scripts/lib/run-plan-context.sh +215 -0
  192. package/scripts/lib/run-plan-echo-back.sh +231 -0
  193. package/scripts/lib/run-plan-headless.sh +396 -0
  194. package/scripts/lib/run-plan-notify.sh +57 -0
  195. package/scripts/lib/run-plan-parser.sh +81 -0
  196. package/scripts/lib/run-plan-prompt.sh +215 -0
  197. package/scripts/lib/run-plan-quality-gate.sh +132 -0
  198. package/scripts/lib/run-plan-routing.sh +315 -0
  199. package/scripts/lib/run-plan-sampling.sh +170 -0
  200. package/scripts/lib/run-plan-scoring.sh +146 -0
  201. package/scripts/lib/run-plan-state.sh +142 -0
  202. package/scripts/lib/run-plan-team.sh +199 -0
  203. package/scripts/lib/telegram.sh +54 -0
  204. package/scripts/lib/thompson-sampling.sh +176 -0
  205. package/scripts/license-check.sh +74 -0
  206. package/scripts/mab-run.sh +575 -0
  207. package/scripts/module-size-check.sh +146 -0
  208. package/scripts/patterns/async-no-await.yml +5 -0
  209. package/scripts/patterns/bare-except.yml +6 -0
  210. package/scripts/patterns/empty-catch.yml +6 -0
  211. package/scripts/patterns/hardcoded-localhost.yml +9 -0
  212. package/scripts/patterns/retry-loop-no-backoff.yml +12 -0
  213. package/scripts/pipeline-status.sh +197 -0
  214. package/scripts/policy-check.sh +226 -0
  215. package/scripts/prior-art-search.sh +133 -0
  216. package/scripts/promote-mab-lessons.sh +126 -0
  217. package/scripts/prompts/agent-a-superpowers.md +29 -0
  218. package/scripts/prompts/agent-b-ralph.md +29 -0
  219. package/scripts/prompts/judge-agent.md +61 -0
  220. package/scripts/prompts/planner-agent.md +44 -0
  221. package/scripts/pull-community-lessons.sh +90 -0
  222. package/scripts/quality-gate.sh +266 -0
  223. package/scripts/research-gate.sh +90 -0
  224. package/scripts/run-plan.sh +329 -0
  225. package/scripts/scope-infer.sh +159 -0
  226. package/scripts/setup-ralph-loop.sh +155 -0
  227. package/scripts/telemetry.sh +230 -0
  228. package/scripts/tests/run-all-tests.sh +52 -0
  229. package/scripts/tests/test-act-cli.sh +46 -0
  230. package/scripts/tests/test-agents-md.sh +87 -0
  231. package/scripts/tests/test-analyze-report.sh +114 -0
  232. package/scripts/tests/test-architecture-map.sh +89 -0
  233. package/scripts/tests/test-auto-compound.sh +169 -0
  234. package/scripts/tests/test-batch-test.sh +65 -0
  235. package/scripts/tests/test-benchmark-runner.sh +25 -0
  236. package/scripts/tests/test-common.sh +168 -0
  237. package/scripts/tests/test-cost-tracking.sh +158 -0
  238. package/scripts/tests/test-echo-back.sh +180 -0
  239. package/scripts/tests/test-entropy-audit.sh +146 -0
  240. package/scripts/tests/test-failure-digest.sh +66 -0
  241. package/scripts/tests/test-generate-ast-rules.sh +145 -0
  242. package/scripts/tests/test-helpers.sh +82 -0
  243. package/scripts/tests/test-init.sh +47 -0
  244. package/scripts/tests/test-lesson-check.sh +278 -0
  245. package/scripts/tests/test-lesson-local.sh +55 -0
  246. package/scripts/tests/test-license-check.sh +109 -0
  247. package/scripts/tests/test-mab-run.sh +182 -0
  248. package/scripts/tests/test-ollama-lib.sh +49 -0
  249. package/scripts/tests/test-ollama.sh +60 -0
  250. package/scripts/tests/test-pipeline-status.sh +198 -0
  251. package/scripts/tests/test-policy-check.sh +124 -0
  252. package/scripts/tests/test-prior-art-search.sh +96 -0
  253. package/scripts/tests/test-progress-writer.sh +140 -0
  254. package/scripts/tests/test-promote-mab-lessons.sh +110 -0
  255. package/scripts/tests/test-pull-community-lessons.sh +149 -0
  256. package/scripts/tests/test-quality-gate.sh +241 -0
  257. package/scripts/tests/test-research-gate.sh +132 -0
  258. package/scripts/tests/test-run-plan-cli.sh +86 -0
  259. package/scripts/tests/test-run-plan-context.sh +305 -0
  260. package/scripts/tests/test-run-plan-e2e.sh +153 -0
  261. package/scripts/tests/test-run-plan-headless.sh +424 -0
  262. package/scripts/tests/test-run-plan-notify.sh +124 -0
  263. package/scripts/tests/test-run-plan-parser.sh +217 -0
  264. package/scripts/tests/test-run-plan-prompt.sh +254 -0
  265. package/scripts/tests/test-run-plan-quality-gate.sh +222 -0
  266. package/scripts/tests/test-run-plan-routing.sh +178 -0
  267. package/scripts/tests/test-run-plan-scoring.sh +148 -0
  268. package/scripts/tests/test-run-plan-state.sh +261 -0
  269. package/scripts/tests/test-run-plan-team.sh +157 -0
  270. package/scripts/tests/test-scope-infer.sh +150 -0
  271. package/scripts/tests/test-setup-ralph-loop.sh +63 -0
  272. package/scripts/tests/test-telegram-env.sh +38 -0
  273. package/scripts/tests/test-telegram.sh +121 -0
  274. package/scripts/tests/test-telemetry.sh +46 -0
  275. package/scripts/tests/test-thompson-sampling.sh +139 -0
  276. package/scripts/tests/test-validate-all.sh +60 -0
  277. package/scripts/tests/test-validate-commands.sh +89 -0
  278. package/scripts/tests/test-validate-hooks.sh +98 -0
  279. package/scripts/tests/test-validate-lessons.sh +150 -0
  280. package/scripts/tests/test-validate-plan-quality.sh +235 -0
  281. package/scripts/tests/test-validate-plans.sh +187 -0
  282. package/scripts/tests/test-validate-plugin.sh +106 -0
  283. package/scripts/tests/test-validate-prd.sh +184 -0
  284. package/scripts/tests/test-validate-skills.sh +134 -0
  285. package/scripts/validate-all.sh +57 -0
  286. package/scripts/validate-commands.sh +67 -0
  287. package/scripts/validate-hooks.sh +89 -0
  288. package/scripts/validate-lessons.sh +98 -0
  289. package/scripts/validate-plan-quality.sh +369 -0
  290. package/scripts/validate-plans.sh +120 -0
  291. package/scripts/validate-plugin.sh +86 -0
  292. package/scripts/validate-policies.sh +42 -0
  293. package/scripts/validate-prd.sh +118 -0
  294. package/scripts/validate-skills.sh +96 -0
  295. package/skills/autocode/SKILL.md +285 -0
  296. package/skills/autocode/ab-verification.md +51 -0
  297. package/skills/autocode/code-quality-standards.md +37 -0
  298. package/skills/autocode/competitive-mode.md +364 -0
  299. package/skills/brainstorming/SKILL.md +97 -0
  300. package/skills/capture-lesson/SKILL.md +187 -0
  301. package/skills/check-lessons/SKILL.md +116 -0
  302. package/skills/dispatching-parallel-agents/SKILL.md +110 -0
  303. package/skills/executing-plans/SKILL.md +85 -0
  304. package/skills/finishing-a-development-branch/SKILL.md +201 -0
  305. package/skills/receiving-code-review/SKILL.md +72 -0
  306. package/skills/requesting-code-review/SKILL.md +59 -0
  307. package/skills/requesting-code-review/code-reviewer.md +82 -0
  308. package/skills/research/SKILL.md +145 -0
  309. package/skills/roadmap/SKILL.md +115 -0
  310. package/skills/subagent-driven-development/SKILL.md +98 -0
  311. package/skills/subagent-driven-development/code-quality-reviewer-prompt.md +18 -0
  312. package/skills/subagent-driven-development/implementer-prompt.md +73 -0
  313. package/skills/subagent-driven-development/spec-reviewer-prompt.md +57 -0
  314. package/skills/systematic-debugging/SKILL.md +134 -0
  315. package/skills/systematic-debugging/condition-based-waiting.md +64 -0
  316. package/skills/systematic-debugging/defense-in-depth.md +32 -0
  317. package/skills/systematic-debugging/root-cause-tracing.md +55 -0
  318. package/skills/test-driven-development/SKILL.md +167 -0
  319. package/skills/using-git-worktrees/SKILL.md +219 -0
  320. package/skills/using-superpowers/SKILL.md +54 -0
  321. package/skills/verification-before-completion/SKILL.md +140 -0
  322. package/skills/verify/SKILL.md +82 -0
  323. package/skills/writing-plans/SKILL.md +128 -0
  324. package/skills/writing-skills/SKILL.md +93 -0
@@ -0,0 +1,681 @@
1
+ # Operations Design & Design Methodology Research
2
+
3
+ > **Purpose:** Research military and business operations design methodology to enhance the autonomous coding toolkit's research phase integration.
4
+ >
5
+ > **Date:** 2026-02-22
6
+ >
7
+ > **Builds on:** `2026-02-22-research-phase-integration.md`, `2026-02-22-mab-research-round2.md`
8
+ >
9
+ > **Sources:** 4 parallel research agents (military doctrine, business methodology, cross-domain transfers, Notion workspace), 80+ web sources, 30+ Notion pages
10
+
11
+ ---
12
+
13
+ ## Executive Summary
14
+
15
+ Military and business design methodologies converge on a single meta-insight: **you cannot plan your way to a good outcome if you have not first correctly framed the problem.** Every framework examined β€” from JP 5-0 to McKinsey's issue trees to Toyota's A3 β€” enforces a formal gate between understanding the problem and designing a solution. The autonomous coding toolkit's proposed research phase (Stage 1.5) is this gate. This report maps 18 frameworks to concrete pipeline enhancements.
16
+
17
+ ### Key Findings
18
+
19
+ 1. **The problem statement is the most leveraged investment** in the entire process. Military doctrine (ADM), McKinsey (issue trees), and IDEO (POV statements) all formalize problem definition as a distinct, gated phase.
20
+ 2. **Design and planning are different cognitive modes** that must be sequenced correctly. ADM β†’ MDMP, Define β†’ Ideate, A3 left side β†’ right side. Our pipeline already does this (brainstorm β†’ plan), but lacks the structured research that bridges them.
21
+ 3. **Adversarial review must be institutionalized**, not optional. Red teams, murder boards, ACH, and believability-weighted voting all exist because groupthink is structural, not personal.
22
+ 4. **End-state backward is the only coherent direction.** EBO, Amazon's Working Backwards, and RAND's RDM all design from desired outcome to required actions β€” never forward from available resources.
23
+ 5. **Confidence levels and alternative analysis** (ICD 203) are the most underexploited transfer opportunity. Most software design docs do not express confidence or enumerate scored alternatives.
24
+
25
+ ---
26
+
27
+ ## Part I: Military Operations Design
28
+
29
+ ### 1.1 Joint/Army Operational Design (JP 5-0, ADP 5-0)
30
+
31
+ Operational design is the cognitive work that **precedes** detailed planning. It answers: *What is the actual problem? What would success look like? What is the logical structure of the path from here to there?*
32
+
33
+ **The 13 Elements of Operational Design:**
34
+
35
+ | Element | Definition | Pipeline Analog |
36
+ |---------|-----------|-----------------|
37
+ | End State | Conditions that define success | PRD acceptance criteria |
38
+ | Center of Gravity | Source of power/capability | Core module under change |
39
+ | Decisive Points | Events/places that give marked advantage | Integration boundaries, API seams |
40
+ | Lines of Effort | Logical connections between decisive points | Batch sequences in plan |
41
+ | Direct vs. Indirect | Attack COG directly or erode supporting capabilities | Refactor vs. wrapper pattern |
42
+ | Operational Reach | Distance/duration before culmination | Context window budget |
43
+ | Culmination | Point where momentum can't be maintained | Context degradation threshold |
44
+ | Arranging Operations | Sequencing simultaneous/sequential actions | Batch ordering, parallelism |
45
+
46
+ **Center of Gravity Analysis (Strange's CG-CC-CR-CV Model):**
47
+
48
+ ```
49
+ Center of Gravity β†’ Critical Capabilities β†’ Critical Requirements β†’ Critical Vulnerabilities
50
+ ```
51
+
52
+ Attack logic: identify CVs β†’ strike them β†’ degrades CRs β†’ degrades CCs β†’ neutralizes COG. For our pipeline: identify the critical vulnerability in the codebase (the weakest integration seam, the most fragile module) and address it first, not last.
53
+
54
+ **Sources:** JP 5-0 (2020), ADP 5-0 (2019), Joint Staff J-7 Planner's Handbook for Operational Design (2011), Strange & Iron CG-CC-CR-CV paper
55
+
56
+ ### 1.2 Army Design Methodology (ADM) β€” Framing Before Planning
57
+
58
+ ADM was formalized after Iraq/Afghanistan exposed the failure of procedural planning against adaptive problems. It handles **ill-structured ("wicked") problems** β€” problems with no definitive formulation, no single correct answer, and no stopping rule.
59
+
60
+ **ADM β†’ MDMP Continuum (the key insight):**
61
+
62
+ ```
63
+ [ADM: Conceptual] [MDMP: Detailed]
64
+ ─────────────────────────────────────────►
65
+ Understand Visualize Describe Plan Prepare Execute Assess
66
+ β”‚ β”‚ β”‚
67
+ Frame OE Frame Problem Op Approach
68
+ ```
69
+
70
+ ADM outputs become MDMP inputs:
71
+ - ADM produces: problem statement + operational approach + commander's intent
72
+ - MDMP ingests those and produces: COAs, wargaming, decision, OPORD
73
+
74
+ **The Four ADM Activities:**
75
+
76
+ 1. **Frame the Operational Environment** β€” Understand the systems at play (PMESII: Political, Military, Economic, Social, Infrastructure, Information). Map known/unknown/assumed.
77
+ 2. **Frame the Problem** β€” Identify the tension between current state and desired end state. The problem statement articulates *why* the gap exists, not just that it exists.
78
+ 3. **Develop the Operational Approach** β€” Generate a broad conceptual solution. This is a hypothesis, not a plan.
79
+ 4. **Reframe** β€” When realities challenge the original frame, revise. This is doctrine, not failure.
80
+
81
+ **Pipeline mapping:** ADM's "Frame β†’ Approach β†’ Reframe" is exactly what our proposed research phase does: understand the codebase landscape (Frame OE), identify the real problem vs. the stated problem (Frame Problem), and produce a research artifact that informs PRD generation (Operational Approach).
82
+
83
+ **The Israeli Cautionary Tale (SOD):** Brigadier General Naveh's Systemic Operational Design applied critical theory (Foucault, Derrida, Deleuze) to operational art. It was intellectually ambitious but catastrophically unusable β€” in the 2006 Lebanon War, commanders were so absorbed in systems-thinking abstractions that tactical execution collapsed. **Lesson: design methodology must be sophisticated enough to handle real complexity but disciplined enough to generate actionable outputs.**
84
+
85
+ **Sources:** ATP 5-0.1 (2015), ADP 5-0 (2019), Small Wars Journal "Using ADM to Frame Problems" (2023), "Rise and Recession of Military Design Thinking" (StrategycentraI.io)
86
+
87
+ ### 1.3 OODA Loop (Boyd) β€” Orientation as Design
88
+
89
+ Boyd's OODA (Observe-Orient-Decide-Act) is often trivialized as a speed loop. In reality, **Orient is the center of gravity** of the entire model β€” the decisive node where mental models are built and destroyed.
90
+
91
+ ```
92
+ OBSERVE ──► ORIENT ──► DECIDE ──► ACT
93
+ β–² β”‚ β”‚
94
+ └── [Implicit Guidance & Control]β”‚
95
+ β—„β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”€β”˜
96
+ ```
97
+
98
+ Orient synthesizes: genetic heritage, cultural traditions, prior experience, new information, and active analysis/synthesis. The output is an **updated mental model of reality**, which shapes what gets observed next and what gets decided.
99
+
100
+ **"Destruction and Creation" (Boyd, 1976):** The epistemological engine β€” drawing on Godel, Heisenberg, and thermodynamics:
101
+ - **Destructive deduction**: Breaking existing mental models apart (analysis)
102
+ - **Creative induction**: Recombining elements into new, more accurate models (synthesis)
103
+
104
+ Every model degrades as conditions change. Effective orientation requires continuously destroying and rebuilding mental models. **This maps directly to ADM's "reframe" and to our pipeline's context degradation problem** β€” stale context is a degraded mental model.
105
+
106
+ **Sources:** Boyd's "Discourse on Winning and Losing," OODA Loop Wikipedia, DAU "Revisiting Boyd" (2021)
107
+
108
+ ### 1.4 Effects-Based Operations (EBO) β€” Designing Around Outcomes
109
+
110
+ EBO reverses the traditional planning direction:
111
+
112
+ ```
113
+ Traditional: Forces Available β†’ Targets β†’ Effects (hoped for)
114
+ EBO: Desired Strategic End State β†’ Required Effects β†’ Targets/Actions
115
+ ```
116
+
117
+ This is pure backwards planning from end state. It introduced the Effects Matrix: for each strategic objective, specify the required effect, target system, desired behavioral outcome, and assessment criteria.
118
+
119
+ **Mattis killed institutionalized EBO in 2008** β€” not because the concept was wrong, but because the tooling promised deterministic prediction in complex adaptive systems. The underlying logic (design from end state backward) survived and is embedded in current JP 5-0 doctrine.
120
+
121
+ **Pipeline mapping:** Our PRD already does backwards planning (acceptance criteria β†’ implementation tasks). EBO's lesson is that the criteria must describe **effects** (behavioral changes in the system), not **targets** (files to modify).
122
+
123
+ **Sources:** Deptula "EBO: Change in the Nature of Warfare," Air & Space Forces "Assault on EBO," Mattis criticism (Air University)
124
+
125
+ ### 1.5 Intelligence Preparation of the Battlefield (IPB)
126
+
127
+ IPB is the intelligence community's contribution to operational design β€” it structures environment analysis **before** planning begins.
128
+
129
+ **Four-Step IPB Process:**
130
+
131
+ | Step | Activity | Pipeline Analog |
132
+ |------|----------|-----------------|
133
+ | 1. Define the OE | Identify geographic area and time horizons | Identify affected files, modules, APIs |
134
+ | 2. Describe Environmental Effects | Analyze terrain using OAKOC | Map dependencies, integration seams, test coverage |
135
+ | 3. Evaluate the Threat | Build threat models and doctrine templates | Identify failure patterns, anti-patterns, tech debt |
136
+ | 4. Determine Threat COAs | Predict adversary courses of action | Predict where integration will break, where tests will fail |
137
+
138
+ **The pipeline connection:** IPB is literally what the research phase should produce β€” a structured analysis of the codebase landscape that feeds into PRD generation. The research artifact's `latent_issues` and `reuse_components` fields are IPB Steps 3 and 4.
139
+
140
+ **Sources:** FM 34-130, ATP 2-01.3, GlobalSecurity.org IPB Overview
141
+
142
+ ### 1.6 Red Teaming and Adversarial Review
143
+
144
+ Formalized after post-9/11 planning failures. The Army stood up UFMCS (University of Foreign Military and Cultural Studies) at Fort Leavenworth in 2004.
145
+
146
+ **Four Red Team Functions:**
147
+ 1. **Devil's Advocacy** β€” argue the strongest case against the current plan
148
+ 2. **Alternative Analysis** β€” generate alternative interpretations
149
+ 3. **Team A/Team B** β€” two competing teams argue opposite conclusions
150
+ 4. **Cultural Empathy Analysis** β€” model how adversaries will perceive and respond
151
+
152
+ **Cognitive Biases Targeted:** Mirror imaging, groupthink, confirmation bias, cultural missteps.
153
+
154
+ **Murder boards:** Before a plan goes to the commander, a senior officer (often outside the chain of command) attacks the plan mercilessly. This is the military's institutionalized pre-mortem.
155
+
156
+ **Pipeline mapping:** Our MAB competitive mode is Team A/Team B. The lesson scanner is Devil's Advocacy. What's missing: **a formal alternative analysis step** in the research phase that enumerates competing approaches with explicit scoring.
157
+
158
+ **Sources:** UFMCS Red Team Handbook, Applied Critical Thinking Handbook v8.1, Army Press "Group Psychology of Red Teaming"
159
+
160
+ ### 1.7 Mission Command β€” Design Through Intent
161
+
162
+ **Centralized intent, decentralized execution.** Commander's intent has three mandatory components:
163
+
164
+ 1. **Purpose (Why)** β€” how the operation contributes to higher objectives
165
+ 2. **Method (What/How broadly)** β€” enough frame without over-specifying
166
+ 3. **End State** β€” desired conditions at conclusion
167
+
168
+ Mission Command acknowledges that **no plan survives contact**. Design compensates not by making the plan more detailed, but by ensuring everyone understands the logic well enough to adapt.
169
+
170
+ **Pipeline mapping:** The plan header (Goal, Architecture, Tech Stack) is commander's intent. The batch structure is mission orders. The quality gates are decision support templates. The agent executing each batch is the subordinate commander exercising disciplined initiative within intent.
171
+
172
+ **Sources:** ADP 6-0 (2019), Army.mil "Mission Command Requires Sharp Commander's Intent"
173
+
174
+ ### 1.8 NATO COPD β€” The Full Pipeline
175
+
176
+ **Comprehensive Operations Planning Directive (COPD v3.1, 2023):**
177
+
178
+ | Phase | Name | Pipeline Stage |
179
+ |-------|------|---------------|
180
+ | 1 | Initial Situational Awareness | Brainstorming (explore context) |
181
+ | 2 | Strategic Assessment | Research phase (understand landscape) |
182
+ | 3 | Military Response Options | PRD generation (define options) |
183
+ | 4 | Strategic CONOPS Development | Plan writing (detailed execution) |
184
+ | 5 | Execution | Batch execution |
185
+ | 6 | Transition | Finishing branch (merge/PR/discard) |
186
+
187
+ The CPOE (Comprehensive Preparation of the Environment) is NATO's equivalent of IPB β€” adding political, economic, social, and information dimensions. **Our research phase is CPOE for code.**
188
+
189
+ **Sources:** NATO AJP-5, COPD V3.0 Implications paper, Major Roche "Using COPD at Tactical Level"
190
+
191
+ ---
192
+
193
+ ## Part II: Business Design Methodology
194
+
195
+ ### 2.1 McKinsey/BCG β€” Hypothesis-Driven Design
196
+
197
+ **The 7-Step Problem-Solving Process:**
198
+
199
+ 1. Define the problem (one-sentence key question)
200
+ 2. Structure the problem (MECE issue tree / hypothesis tree)
201
+ 3. Prioritize issues (impact Γ— ease matrix)
202
+ 4. Develop work plan (analysis, end-product, source, owner, timing per issue)
203
+ 5. Conduct analyses
204
+ 6. Synthesize findings (Pyramid Principle β€” answer first, then support)
205
+ 7. Communicate
206
+
207
+ **MECE (Mutually Exclusive, Collectively Exhaustive):** Invented by Barbara Minto at McKinsey in the 1970s. If you cannot make your issue tree MECE, you do not understand the problem structure. This is a design forcing function.
208
+
209
+ **Day 1 Answer:** Form a testable initial hypothesis within 48-72 hours. The entire workplan is built to confirm or kill that hypothesis. This is not guessing β€” it is structured prediction from problem decomposition.
210
+
211
+ **Pyramid Principle:** Level 1 = governing thought (one sentence). Level 2 = 3-5 supporting arguments. Level 3 = underlying data. Answer-first communication β€” no building to a conclusion.
212
+
213
+ **Pipeline mapping:** The research artifact should produce a MECE decomposition of the problem space. The "Day 1 Answer" maps to the research phase's initial hypothesis about which approach will work. The hypothesis tree feeds PRD generation.
214
+
215
+ **Sources:** Minto "The Pyramid Principle," McKinsey "Seven-Step Problem-Solving Process," IGotAnOffer MECE Framework
216
+
217
+ ### 2.2 IDEO/Stanford d.school β€” Design Thinking
218
+
219
+ **The Define Phase as Structured Research:**
220
+
221
+ The d.school's insight: "Define" is not writing a problem statement at a whiteboard. It is a synthesis discipline that transforms messy qualitative data into an actionable problem frame.
222
+
223
+ **Key tools:**
224
+ - **POV Statement:** `[User] needs [need] because [insight]` β€” user + need + insight, all three required
225
+ - **How Might We (HMW):** Reframe insights as design opportunities
226
+ - **Affinity Diagram:** Cluster observations into themes
227
+ - **Journey Map:** Visual timeline with emotional highs/lows
228
+
229
+ **Quality bar:** POV statements must be grounded in observed behavior, not assumptions. The "insight" must be non-obvious β€” something discovered, not assumed.
230
+
231
+ **Pipeline mapping:** The brainstorming phase already does empathize + define. The research phase adds rigor: POV statements become research questions, HMW questions become design alternatives, affinity diagrams become the structured research artifact.
232
+
233
+ **Sources:** Stanford d.school Process Guide, IxDF "5 Stages in Design Thinking"
234
+
235
+ ### 2.3 Toyota β€” Genchi Genbutsu and A3
236
+
237
+ **Genchi genbutsu (go and see for yourself):** Before any countermeasure is proposed, Toyota requires physical presence at the actual site, direct observation, and handling of actual data. This is a quality gate, not a suggestion.
238
+
239
+ **A3 Problem Solving (fits on one sheet β€” the constraint is the point):**
240
+
241
+ | Left Side (Understanding) | Right Side (Action) |
242
+ |--------------------------|-------------------|
243
+ | Background/context | Target condition |
244
+ | Current condition (metrics, photos from gemba) | Countermeasures |
245
+ | Problem statement (measurable delta) | Implementation plan |
246
+ | Root cause analysis (5 Whys, Ishikawa) | Follow-up/confirmation |
247
+
248
+ **Value Stream Mapping:** Walk the stream physically. Map every step. Record cycle time, changeover time, uptime, batch size, WIP. Calculate lead time vs. value-added time ratio. The gap between current and future state maps defines the design scope.
249
+
250
+ **Pipeline mapping:** The research phase is our gemba walk β€” direct codebase observation before proposing changes. The A3's left side (current condition + root cause) maps to `reuse_components` and `latent_issues` in the research artifact. The constraint of fitting on one page maps to our 6000-char context budget.
251
+
252
+ **Sources:** Lean Enterprise Institute A3 Guide, Toyota A3 Problem-Solving website
253
+
254
+ ### 2.4 Amazon β€” Working Backwards
255
+
256
+ **PR-FAQ:** Write the press release before building. Forces clarity because writing requires making implicit assumptions explicit.
257
+
258
+ **Press Release structure:** Headline (customer benefit), problem paragraph (pain being solved), solution paragraph (how it solves it), customer quote (captures experience).
259
+
260
+ **Internal FAQ:** The hard questions β€” how big is the market, what's the business model, what are the top 3 risks, how do we measure success, what does the team need?
261
+
262
+ **6-Page Narrative Memo:** Meetings begin with 20-30 minutes of silent reading. Questions only after everyone has read. This eliminates the HiPPO problem (Highest Paid Person's Opinion dominating).
263
+
264
+ **Disagree and Commit:** Disagree loudly with evidence before the decision. Once decided, execute fully. The memo creates a decision audit trail.
265
+
266
+ **Pipeline mapping:** Our PRD is a lightweight PR-FAQ (acceptance criteria = customer benefits as shell commands). The research artifact is the internal FAQ (what are the risks, what have we missed, what do we need). The plan document is the 6-pager.
267
+
268
+ **Sources:** The PRFAQ "Amazon Writing Culture," Writing Cooperative "Anatomy of an Amazon 6-pager"
269
+
270
+ ### 2.5 Bridgewater β€” Systematized Disagreement
271
+
272
+ **Idea Meritocracy = Radical Truth + Radical Transparency + Believability-Weighted Decision Making**
273
+
274
+ **Issue Log:** Every mistake, disagreement, or problem is entered into a centralized log visible to the whole firm. Problems surface immediately. Patterns become training data.
275
+
276
+ **Believability-Weighted Voting:** Not all opinions are equal. Opinions weighted by demonstrated track record (Baseball Cards). If equal-weighted and believability-weighted votes diverge, discussion resumes.
277
+
278
+ **Pipeline mapping:** Our `logs/failure-patterns.json` is a lightweight Issue Log. The MAB's Thompson Sampling is believability-weighted voting β€” arms that have demonstrated better outcomes get more weight. The lesson system compounds learning like Baseball Cards.
279
+
280
+ **Sources:** Bridgewater Principles website, Bastian Moritz "Believability-Weighted System"
281
+
282
+ ### 2.6 RAND Corporation β€” Research-to-Recommendation Pipeline
283
+
284
+ **Ten Practical Principles for Policy Analysis:**
285
+
286
+ 1. Fit tools to the problem (simplest that work)
287
+ 2. Define the problem before selecting methods
288
+ 3. Identify the decision maker
289
+ 4. Explain how the choice depends on key judgments
290
+ 5. Open and explicit analysis (hidden assumptions = persistent error)
291
+ 6. Use multiple methods (triangulate)
292
+ 7. Examine uncertainty explicitly (sensitivity analysis)
293
+ 8. Consider feasibility (political, organizational, technical)
294
+ 9. Communicate clearly
295
+ 10. Document (reproducible and auditable)
296
+
297
+ **Robust Decision Making (RDM):** Instead of optimizing under expected conditions, generate a wide range of possible futures and find strategies that perform acceptably across the widest range. Design for robustness, not optimality.
298
+
299
+ **Key insight:** Findings, Implications, and Recommendations are strictly separated. Conflating them is an analytical error.
300
+
301
+ **Pipeline mapping:** The research phase should separate findings (what the codebase analysis shows) from implications (what this means for the design) from recommendations (what we should do). RDM maps to our MAB β€” instead of picking the "best" approach, find one that degrades gracefully.
302
+
303
+ **Sources:** RAND "Ten Practical Principles" (PEA3956-1), RAND "Systems Analysis: A Tool for Choice" (P4860)
304
+
305
+ ### 2.7 Wardley Mapping β€” Situational Awareness Before Strategy
306
+
307
+ **Core insight:** You cannot have a strategy without a map.
308
+
309
+ **Two axes:**
310
+ - Y-axis: Value Chain (visibility to user β€” top = user needs, bottom = infrastructure)
311
+ - X-axis: Evolution (Genesis β†’ Custom β†’ Product β†’ Commodity)
312
+
313
+ **Why evolution matters:** The evolutionary stage determines the correct design approach:
314
+ - Genesis: explore, expect failure, protect from efficiency pressure
315
+ - Custom Built: develop capability, understand best practices
316
+ - Product: optimize, differentiate, watch for commoditization
317
+ - Commodity: buy don't build, focus on operational efficiency
318
+
319
+ **Strategic error:** Applying the wrong approach to the evolutionary stage. Innovating on commodity components wastes resources. Standardizing genesis components destroys competitive advantage.
320
+
321
+ **Pipeline mapping:** The research phase should classify components by maturity. A new module being built from scratch (genesis) needs different treatment than wiring into an existing well-tested library (commodity). This classification informs batch ordering and risk assessment.
322
+
323
+ **Sources:** Wardley Maps Wikipedia, Aktia Solutions "Introduction to Wardley Maps"
324
+
325
+ ### 2.8 TOGAF ADM β€” Separation of Concerns
326
+
327
+ Enterprise architecture's contribution: separate "what the business needs" from "how technology delivers it."
328
+
329
+ **Phase A (Architecture Vision)** must be approved before **Phase B (Business Architecture)** which must be approved before **Phase C (Technology Architecture)**. Each is a gate.
330
+
331
+ **Pipeline mapping:** Our pipeline already enforces this: brainstorm (what) β†’ plan (how) β†’ execute (build). The research phase strengthens Phase A by adding structured codebase analysis.
332
+
333
+ ### 2.9 Stage-Gate β€” The Innovation Pipeline
334
+
335
+ Robert Cooper's foundational research: **most product failures are failures of front-end definition, not execution.**
336
+
337
+ **The Fuzzy Front End (Stages 0-2):**
338
+ - Stage 0: Discovery/Ideation (generate candidate ideas)
339
+ - Stage 1: Scoping (rapid, low-cost preliminary assessment)
340
+ - Stage 2: Build the Business Case (primary design phase β€” product definition)
341
+
342
+ **Gate anatomy:** Deliverables (quality, not completion) + Criteria (Must-Meet pass/fail + Should-Meet scored) + Outputs (Go/Kill/Hold/Recycle).
343
+
344
+ **The Product Definition document (Gate 2)** is the key quality gate artifact. Cooper's research: projects with a stable, well-defined product definition before development are **3x more likely to succeed**.
345
+
346
+ **Pipeline mapping:** Our quality gates are Stage-Gate gates. The research phase is Stage 1 (scoping). The PRD is the Product Definition at Gate 2. The Go/Kill/Hold/Recycle decision maps to our research gate (proceed / block / defer).
347
+
348
+ **Sources:** Stage-Gate International overview, Toolshero "Stage Gate Process by Robert Cooper"
349
+
350
+ ---
351
+
352
+ ## Part III: Cross-Domain Transfers
353
+
354
+ ### 3.1 Agile's Military Roots
355
+
356
+ **The lineage is biographical, not metaphorical.** Jeff Sutherland graduated West Point (1964), flew 100 combat missions over North Vietnam, was personally trained by John Boyd.
357
+
358
+ **OODA β†’ Scrum mapping:**
359
+
360
+ | OODA | Scrum |
361
+ |------|-------|
362
+ | Observe | Sprint Review, Daily Standup |
363
+ | Orient | Backlog Refinement, Retrospective |
364
+ | Decide | Sprint Planning |
365
+ | Act | Sprint execution |
366
+
367
+ **Auftragstaktik β†’ "Self-organizing teams":** Commanders specify intent and objective (what/why), leave method (how) to subordinates. Product Owners set the mission, teams determine execution.
368
+
369
+ **Full lineage:** US military WWII quality programs β†’ Deming β†’ Toyota TPS β†’ Lean Manufacturing β†’ Lean Software Development β†’ Agile Manifesto (2001).
370
+
371
+ ### 3.2 Chaos Engineering = Civilian Red Teaming
372
+
373
+ **Origin:** Prussian Kriegsspiel (1824) β†’ RAND Cold War simulations β†’ NSA Multics evaluation (1970s) β†’ SEAL Team Six Red Cell β†’ Netflix Chaos Monkey (2010).
374
+
375
+ | Simian Army Tool | Military Equivalent |
376
+ |-----------------|-------------------|
377
+ | Chaos Monkey (kills instances) | Attrition wargame |
378
+ | Latency Monkey (injects delays) | Communications degradation exercise |
379
+ | Chaos Kong (kills regions) | Theater-level degraded ops |
380
+
381
+ **The proof case:** Netflix's 2015 DynamoDB outage β€” Netflix experienced far less downtime than peers because chaos engineering had already forced them to solve the exact failure modes. This is "train as you fight."
382
+
383
+ ### 3.3 ICD 203 β€” The Underexploited Transfer
384
+
385
+ **Nine Analytic Tradecraft Standards:**
386
+
387
+ 1. Describe quality and credibility of sources
388
+ 2. Express uncertainties with explicit probability language
389
+ 3. Distinguish information from assumptions and judgments
390
+ 4. Incorporate alternative analysis (enumerate competing hypotheses)
391
+ 5. Demonstrate relevance and address implications
392
+ 6. Use clear argumentation
393
+ 7. Explain change from previous judgments
394
+ 8. Make accurate assessments
395
+ 9. Use effective visual information
396
+
397
+ **Analysis of Competing Hypotheses (ACH):** List all hypotheses; score evidence against each; identify which hypothesis has the **least contradicting evidence** (not the most supporting β€” a critical logical distinction).
398
+
399
+ **The gap:** Most software design docs do not express confidence levels, do not enumerate scored alternatives, and do not apply ACH. This is the single highest-value transfer opportunity from military/intelligence to software design.
400
+
401
+ **Pipeline mapping:** The research artifact should include confidence levels on latent issues and design changes, scored alternatives for architectural decisions, and explicit distinction between findings (data), implications (meaning), and recommendations (action).
402
+
403
+ ### 3.4 Cynefin β€” Match Design Approach to Problem Type
404
+
405
+ | Domain | Characteristics | Design Approach |
406
+ |--------|---------------|----------------|
407
+ | Clear | Known cause-effect; best practices exist | Sense β†’ Categorize β†’ Respond |
408
+ | Complicated | Knowable; requires expert analysis | Sense β†’ Analyze β†’ Respond |
409
+ | Complex | Emergent; cause-effect only in retrospect | Probe β†’ Sense β†’ Respond |
410
+ | Chaotic | No discernible cause-effect | Act β†’ Sense β†’ Respond |
411
+
412
+ **The critical insight:** Applying Complicated-domain thinking (expert analysis, detailed upfront design) to Complex-domain problems is a primary cause of software project failure. Waterfall's failure mode is treating product development as Complicated when it's Complex.
413
+
414
+ **Pipeline mapping:** The research phase should classify the problem domain. A well-understood CRUD endpoint is Clear/Complicated β€” spec it, build it. A novel ML pipeline integration is Complex β€” probe with spikes, learn, then plan. This classification should influence batch strategy (detailed plan vs. exploratory spike).
415
+
416
+ ### 3.5 NASA V-Model and Formal Design Reviews
417
+
418
+ **Review sequence:** MCR β†’ SRR β†’ PDR β†’ CDR β†’ TRR β†’ ORR. Each is a gate.
419
+
420
+ **The lesson commercial software ignores:** Requirements traceability. NASA traces every design decision to a requirement and every requirement to a test. Most commercial software cannot.
421
+
422
+ **Columbia lesson:** Dissenting technical voices were filtered out before reaching decision-makers. Now codified: the design review process must create conditions for technical dissent to surface.
423
+
424
+ **Pipeline mapping:** Our PRD β†’ plan β†’ test structure is a lightweight V-model. Requirements traceability = PRD task IDs referenced in plan steps. The lesson about dissent = why the lesson scanner and MAB competitive mode exist.
425
+
426
+ ### 3.6 Verified Transfer Cases
427
+
428
+ | Transfer | Origin | Destination | Vector |
429
+ |----------|--------|-------------|--------|
430
+ | OODA β†’ Scrum | Boyd/USAF | Agile | Biographical (Sutherland) |
431
+ | AAR β†’ Blameless Postmortem | Army NTC | Google SRE | Cultural (aviation CRM) |
432
+ | Red Team β†’ Threat Modeling | RAND/NSA | Microsoft STRIDE, MITRE ATT&CK | Institutional (FFRDCs) |
433
+ | V-Model β†’ Regulated Software | NASA/DoD | DO-178C, ISO 26262, IEC 62304 | Regulatory pressure |
434
+ | Kill Chain β†’ DevSecOps | DoD | Platform One, Kessel Run | Bidirectional (Palantir/Anduril) |
435
+ | Red Cell β†’ Penetration Testing | SEAL Team Six | Commercial security | Personnel migration |
436
+
437
+ ---
438
+
439
+ ## Part IV: Notion Workspace Findings
440
+
441
+ Your workspace contains deep applied coverage of military doctrine β€” primarily applied to career transition planning, not software pipeline design. Key assets:
442
+
443
+ ### 4.1 Military Doctrine (Deep Coverage)
444
+
445
+ | Asset | File | Content |
446
+ |-------|------|---------|
447
+ | JP 5-0 Operational Design Reference | `notion/.../2fc24971-...ab9b-...` | Full 13 elements, MOP vs. MOE |
448
+ | ODF Generator Agent v1 | `notion/.../81382326-...` | AI agent grounded in JP 5-0, ADP 5-0, FM 3-05.20 |
449
+ | ODF Generator Agent v2 (JADC2) | `notion/.../efa33bcd-...` | JADC2 Sense-Make-Act, Mission Command, speed-of-relevance |
450
+ | Dynamic ODF System | `notion/.../29e24971-...` | Multi-agent architecture: Intake β†’ Research β†’ 6 LOE Agents β†’ Risk β†’ Decision β†’ Sync |
451
+ | Strategic Frameworks & Methodologies | `notion/.../2a524971-...` | MDMP 7-step, IPB 4-step, CARVER matrix with scored examples |
452
+ | Military Intelligence System Prompt | `notion/.../29c24971-...` | IPB, F3EAD, CARVER, PMESII-PT, COG analysis, ICD 203 |
453
+
454
+ ### 4.2 Decision Science (Deep Coverage)
455
+
456
+ | Asset | Content |
457
+ |-------|---------|
458
+ | Kahneman Deep Dive | System 1/2, prospect theory, planning fallacy, pre-mortem, reference-class forecasting |
459
+ | Superforecasting Brief | Tetlock's 10 Commandments, Brier scoring, granular belief updating |
460
+ | 20 Cognitive Biases | Individual and team debiasing: pre-mortem, outside view, devil's advocate |
461
+ | 8 Elements of Thought | Richard Paul/Linda Elder critical thinking framework |
462
+ | Think Like a Rocket Scientist | First principles ↔ IPB, backcasting ↔ MDMP reverse planning |
463
+
464
+ ### 4.3 Business/Program Frameworks (Broad Coverage)
465
+
466
+ | Asset | Content |
467
+ |-------|---------|
468
+ | Framework Encyclopedia | Product (JTBD, RICE), Ops (OKRs, Lean, Six Sigma), PM (PMBOK, Agile), Program (SAFe, Stage-Gate, EVM) |
469
+ | Lean Six Sigma Green Belt | Job Instruction 4-Step, SWOT, FMEA, VSM, A3/Kaizen |
470
+ | SAFe Portfolio Vision | Maps to Commander's Intent β€” stable strategic direction enabling tactical flexibility |
471
+ | Policy Analysis | Bardach's Eightfold Path, Gil's Framework, 6-E Framework |
472
+
473
+ ### 4.4 Coverage Gaps (Opportunities)
474
+
475
+ | Framework | Workspace Status | Opportunity |
476
+ |-----------|-----------------|-------------|
477
+ | Wardley Mapping | One shallow reference | Deep dive would complement strategic planning |
478
+ | Cynefin | Book in library, no applied page | Critical for problem classification |
479
+ | Amazon Working Backwards | Not present | PR-FAQ methodology applicable to PRD generation |
480
+ | RAND RDM | Not present | Robust decision-making under uncertainty |
481
+ | ICD 203 full implementation | Referenced but not applied | Confidence levels for design decisions |
482
+
483
+ ---
484
+
485
+ ## Part V: Cross-Framework Synthesis
486
+
487
+ ### 5.1 The Universal Design Phase Meta-Pattern
488
+
489
+ Every framework has a distinct gate between "understanding the problem" and "designing a solution":
490
+
491
+ | Framework | Problem Definition Artifact | Gate |
492
+ |-----------|----------------------------|------|
493
+ | JP 5-0 / ADM | Problem statement + operational approach | ADM β†’ MDMP transition |
494
+ | McKinsey | MECE issue tree + Day 1 Answer | Week 1 hypothesis review |
495
+ | IDEO d.school | POV statement (user + need + insight) | POV validation |
496
+ | Toyota | A3 left side (current condition + root cause) | A3 review |
497
+ | Amazon | PR-FAQ (customer pain + internal FAQ) | PR-FAQ review |
498
+ | Bridgewater | Issue Log + believability-weighted framing | Believability vote |
499
+ | RAND | Problem framing document | Peer review |
500
+ | Wardley | Value chain map + evolution placement | Doctrine check |
501
+ | TOGAF | Business Architecture baseline + gap analysis | Architecture Vision approval |
502
+ | Stage-Gate | Product Definition document | Gate 2 (Go to Development) |
503
+ | ICD 203 | ACH matrix + confidence levels | Alternative analysis review |
504
+
505
+ **Our pipeline currently:** Brainstorm (problem definition) β†’ PRD (acceptance criteria) β†’ Plan (detailed tasks). The research phase fills the gap between brainstorm and PRD β€” it is the structured analysis that every framework above demands before solution commitment.
506
+
507
+ ### 5.2 What Military Doctrine Knows That Most Frameworks Don't
508
+
509
+ 1. **The plan will fail contact.** Design for intent, not method. Commander's intent matters more than the synchronization matrix. Our plan header (Goal, Architecture) is intent; the batch details are the synchronization matrix.
510
+
511
+ 2. **Orientation is the competitive advantage.** Boyd: the OODA loop is won or lost in Orient. The quality of pre-execution cognitive work determines execution quality more than execution technique.
512
+
513
+ 3. **Adversarial review must be structural, not optional.** Groupthink is a property of cohesive teams under pressure, not a personality failure. Red teams exist because the alternative consistently produces plans with unexamined fatal assumptions.
514
+
515
+ 4. **Reframing is doctrine, not failure.** ADM's fourth activity (Reframe) acknowledges that the initial problem frame will be wrong. The pipeline must support mid-execution reframing without treating it as a failure.
516
+
517
+ ### 5.3 The Underexploited Transfers
518
+
519
+ **Highest-value transfers not yet in our pipeline:**
520
+
521
+ | Transfer | Source | Application | Impact |
522
+ |----------|--------|-------------|--------|
523
+ | Confidence levels | ICD 203 | Research artifact fields get `confidence: high/medium/low` | Prevents false precision in design decisions |
524
+ | ACH scoring | ICD 203 | Enumerate design alternatives, score against evidence | Prevents premature convergence |
525
+ | Cynefin classification | Snowden | Classify problem domain per batch β†’ choose execution strategy | Prevents waterfall-on-complex errors |
526
+ | Wardley evolution | Wardley | Classify components by maturity β†’ inform build-vs-reuse | Prevents innovating on commodity |
527
+ | COG-CC-CR-CV analysis | Strange | Identify critical vulnerability in codebase β†’ address first | Prevents leaving worst risk for last |
528
+ | RDM robustness | RAND | Design for acceptable performance across futures, not optimal in one | Prevents brittle architecture |
529
+ | Murder board | Military | Formal adversarial review of plan before execution | Prevents groupthink in plan generation |
530
+
531
+ ### 5.4 Revised Pipeline with Operations Design Integration
532
+
533
+ ```
534
+ Stage 0 : Roadmap (multi-feature sequencing)
535
+ Stage 0.5 : Problem Framing ← NEW (ADM "Frame the Problem")
536
+ - MECE decomposition of problem space
537
+ - Cynefin domain classification
538
+ - COG-CC-CR-CV analysis of codebase
539
+ Stage 1 : Brainstorm (explore intent β†’ design β†’ approval)
540
+ Stage 1.5 : Research ← ENHANCED
541
+ - IPB-style codebase analysis (4-step)
542
+ - ACH scoring of design alternatives
543
+ - Confidence levels on all findings
544
+ - Wardley evolution classification of components
545
+ - Findings / Implications / Recommendations separation (RAND)
546
+ - Research gate (Go/Kill/Hold)
547
+ Stage 2 : PRD (machine-verifiable acceptance criteria)
548
+ Stage 2.5 : Murder Board ← NEW (formal adversarial plan review)
549
+ - Red team attacks the plan
550
+ - Alternative analysis required
551
+ - Pre-mortem: "imagine this failed β€” what went wrong?"
552
+ Stage 3 : Plan (TDD-structured tasks at 2-5 minute granularity)
553
+ Stage 3.5 : Isolate (git worktree)
554
+ Stage 4 : Execute (batch execution with quality gates)
555
+ Stage 5 : Verify (evidence-based gate)
556
+ Stage 5.5 : AAR ← NEW (after-action review)
557
+ - What was planned vs. what happened
558
+ - Root causes of deviations
559
+ - Lessons for failure-patterns.json
560
+ Stage 6 : Finish (merge / PR / keep / discard)
561
+ ```
562
+
563
+ ### 5.5 Research Artifact Schema (Enhanced)
564
+
565
+ Based on the cross-framework synthesis, the research artifact should include:
566
+
567
+ ```json
568
+ {
569
+ "feature": "string",
570
+ "date": "YYYY-MM-DD",
571
+ "domain_classification": "clear | complicated | complex | chaotic",
572
+ "problem_frame": {
573
+ "current_state": "string (A3 left side β€” what is happening now)",
574
+ "desired_state": "string (end state β€” what success looks like)",
575
+ "gap": "string (why the gap exists, not just that it exists)",
576
+ "root_causes": ["string (5 Whys / Ishikawa results)"]
577
+ },
578
+ "mece_decomposition": [
579
+ {"branch": "string", "sub_branches": ["string"], "priority": "high|medium|low"}
580
+ ],
581
+ "alternatives": [
582
+ {
583
+ "approach": "string",
584
+ "evidence_for": ["string"],
585
+ "evidence_against": ["string"],
586
+ "confidence": "high|medium|low",
587
+ "recommended": true
588
+ }
589
+ ],
590
+ "cog_analysis": {
591
+ "center_of_gravity": "string (core module/capability under change)",
592
+ "critical_capabilities": ["string"],
593
+ "critical_requirements": ["string"],
594
+ "critical_vulnerabilities": ["string (address these first)"]
595
+ },
596
+ "reuse_components": [
597
+ {"requirement": "string", "file": "string", "gap": "none|partial|full", "evolution": "genesis|custom|product|commodity"}
598
+ ],
599
+ "latent_issues": [
600
+ {"file": "string", "line": 0, "description": "string", "severity": "critical|high|medium|low", "confidence": "high|medium|low", "blocking": true}
601
+ ],
602
+ "design_changes": [
603
+ {"change": "string", "rationale": "string", "blocking": true, "alternatives_considered": ["string"]}
604
+ ],
605
+ "findings_vs_implications_vs_recommendations": {
606
+ "findings": ["string (what the data shows)"],
607
+ "implications": ["string (what this means for the design)"],
608
+ "recommendations": ["string (what we should do)"]
609
+ },
610
+ "prd_scope_delta": {"tasks_removable": [], "tasks_added": [], "estimated_task_reduction": 0}
611
+ }
612
+ ```
613
+
614
+ ---
615
+
616
+ ## Part VI: Implementation Priorities
617
+
618
+ ### Tier 1 (Highest value, lowest effort β€” enhance existing stages)
619
+
620
+ 1. **Add confidence levels to research artifact** β€” every finding gets `high/medium/low` confidence
621
+ 2. **Add alternatives scoring** β€” enumerate 2-3 approaches with evidence for/against (ACH-lite)
622
+ 3. **Separate findings/implications/recommendations** in research output (RAND discipline)
623
+ 4. **Add Cynefin classification** to plan header β€” determines execution strategy per batch
624
+
625
+ ### Tier 2 (High value, moderate effort β€” new lightweight stages)
626
+
627
+ 5. **Murder Board script** β€” adversarial review of generated plan before execution (pre-mortem + devil's advocacy)
628
+ 6. **AAR step** after execution β€” structured what-planned-vs-what-happened with root cause β†’ failure-patterns.json
629
+ 7. **COG-CC-CR-CV analysis** in research phase β€” identify critical vulnerabilities to address first
630
+
631
+ ### Tier 3 (High value, significant effort β€” new capabilities)
632
+
633
+ 8. **Problem Framing stage** (Stage 0.5) β€” MECE decomposition + Cynefin classification before brainstorming
634
+ 9. **Wardley evolution classification** of components β€” inform build-vs-reuse decisions
635
+ 10. **Full ICD 203 implementation** β€” confidence vocabulary, source credibility, alternative analysis mandated
636
+
637
+ ---
638
+
639
+ ## Sources
640
+
641
+ ### Military Doctrine
642
+ - JP 5-0 Joint Planning (2020)
643
+ - ADP 5-0 The Operations Process (2019)
644
+ - ATP 5-0.1 Army Design Methodology (2015)
645
+ - Joint Staff J-7 Planner's Handbook for Operational Design (2011)
646
+ - FM 34-130 Intelligence Preparation of the Battlefield
647
+ - ADP 6-0 Mission Command (2019)
648
+ - NATO AJP-5 Allied Joint Doctrine for Planning
649
+ - NATO COPD v3.1 (2023)
650
+ - UFMCS Red Team Handbook / Applied Critical Thinking Handbook v8.1
651
+ - Boyd, "Discourse on Winning and Losing" / "Destruction and Creation" (1976)
652
+ - Strange & Iron, "Understanding Centers of Gravity and Critical Vulnerabilities"
653
+
654
+ ### Business Methodology
655
+ - Minto, "The Pyramid Principle" (McKinsey)
656
+ - Stanford d.school Design Thinking Process Guide
657
+ - Lean Enterprise Institute A3 Guide / Toyota Production System
658
+ - Amazon PR-FAQ / Working Backwards methodology
659
+ - Dalio, "Principles" (Bridgewater)
660
+ - RAND "Ten Practical Principles for Policy Analysis" (PEA3956-1)
661
+ - Wardley, "Wardley Maps" (Creative Commons)
662
+ - TOGAF Standard (The Open Group)
663
+ - Cooper, "Winning at New Products" (Stage-Gate)
664
+
665
+ ### Cross-Domain
666
+ - Sutherland/Boyd OODA-to-Scrum lineage (Scrum Inc.)
667
+ - Netflix Chaos Monkey / Simian Army (Gremlin, SEI CMU)
668
+ - ICD 203 Analytic Standards (DNI)
669
+ - NASA Systems Engineering Handbook (NASA-HDBK-2203)
670
+ - Snowden, Cynefin Framework (Wikipedia, Deakin University)
671
+ - DoD Enterprise DevSecOps Fundamentals v2.5 (dodcio.defense.gov)
672
+ - Google Design Docs (Industrial Empathy / Malte Ubl)
673
+ - Team Topologies (Skelton & Pais)
674
+
675
+ ### Notion Workspace
676
+ - JP 5-0 Operational Design Reference, ODF Generator Agents v1/v2
677
+ - Strategic Frameworks & Methodologies (MDMP, IPB, CARVER applied)
678
+ - Military Intelligence System Prompt (IPB, F3EAD, ICD 203)
679
+ - Kahneman Deep Dive, Superforecasting Brief
680
+ - Framework Encyclopedia, Lean Six Sigma Green Belt
681
+ - Think Like a Rocket Scientist, Kill Chain, Hundred-Year Marathon