tribunal-kit 4.4.1 → 4.4.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (141) hide show
  1. package/.agent/history/architecture-graph.yaml +140 -0
  2. package/.agent/history/graph-cache.json +262 -0
  3. package/.agent/history/snapshots/bin__tribunal-kit.js.json +19 -0
  4. package/.agent/history/snapshots/eslint.config.js.json +9 -0
  5. package/.agent/history/snapshots/migrate_refs.js.json +11 -0
  6. package/.agent/history/snapshots/scripts__changelog.js.json +13 -0
  7. package/.agent/history/snapshots/scripts__sync-version.js.json +12 -0
  8. package/.agent/history/snapshots/scripts__validate-payload.js.json +12 -0
  9. package/.agent/history/snapshots/test__integration__bridges.test.js.json +14 -0
  10. package/.agent/history/snapshots/test__integration__init.test.js.json +14 -0
  11. package/.agent/history/snapshots/test__integration__routing.test.js.json +12 -0
  12. package/.agent/history/snapshots/test__integration__swarm_dispatcher.test.js.json +14 -0
  13. package/.agent/history/snapshots/test__integration__wave2.test.js.json +14 -0
  14. package/.agent/history/snapshots/test__unit__args.test.js.json +20 -0
  15. package/.agent/history/snapshots/test__unit__case_law_manager.test.js.json +11 -0
  16. package/.agent/history/snapshots/test__unit__context_broker.test.js.json +11 -0
  17. package/.agent/history/snapshots/test__unit__copyDir.test.js.json +23 -0
  18. package/.agent/history/snapshots/test__unit__graph_tools.test.js.json +12 -0
  19. package/.agent/history/snapshots/test__unit__inner_loop_validator.test.js.json +11 -0
  20. package/.agent/history/snapshots/test__unit__selfInstall.test.js.json +23 -0
  21. package/.agent/history/snapshots/test__unit__semver.test.js.json +20 -0
  22. package/.agent/history/snapshots/test__unit__swarm_dispatcher.test.js.json +12 -0
  23. package/.agent/scripts/_colors.js +170 -18
  24. package/.agent/scripts/_utils.js +244 -42
  25. package/.agent/scripts/bundle_analyzer.js +261 -290
  26. package/.agent/scripts/case_law_manager.js +1 -7
  27. package/.agent/scripts/checklist.js +278 -266
  28. package/.agent/scripts/colors.js +11 -17
  29. package/.agent/scripts/context_broker.js +1 -7
  30. package/.agent/scripts/dependency_analyzer.js +234 -272
  31. package/.agent/scripts/graph_builder.js +46 -18
  32. package/.agent/scripts/graph_visualizer.js +10 -4
  33. package/.agent/scripts/graph_zoom.js +6 -4
  34. package/.agent/scripts/inner_loop_validator.js +2 -8
  35. package/.agent/scripts/lint_runner.js +186 -187
  36. package/.agent/scripts/marathon_harness.js +799 -0
  37. package/.agent/scripts/prompt_compiler.js +56 -0
  38. package/.agent/scripts/schema_validator.js +8 -25
  39. package/.agent/scripts/security_scan.js +276 -303
  40. package/.agent/scripts/session_manager.js +1 -7
  41. package/.agent/scripts/skill_evolution.js +1 -8
  42. package/.agent/scripts/skill_integrator.js +1 -7
  43. package/.agent/scripts/test_runner.js +186 -193
  44. package/.agent/scripts/utils.js +17 -32
  45. package/.agent/scripts/verify_all.js +248 -257
  46. package/.agent/skills/agent-organizer/SKILL.md +42 -0
  47. package/.agent/skills/agentic-patterns/SKILL.md +42 -0
  48. package/.agent/skills/ai-prompt-injection-defense/SKILL.md +42 -0
  49. package/.agent/skills/api-patterns/SKILL.md +42 -0
  50. package/.agent/skills/api-security-auditor/SKILL.md +42 -0
  51. package/.agent/skills/app-builder/SKILL.md +42 -0
  52. package/.agent/skills/appflow-wireframe/SKILL.md +42 -0
  53. package/.agent/skills/architecture/SKILL.md +42 -0
  54. package/.agent/skills/authentication-best-practices/SKILL.md +42 -0
  55. package/.agent/skills/backend-security-expert/SKILL.md +122 -0
  56. package/.agent/skills/bash-linux/SKILL.md +42 -0
  57. package/.agent/skills/behavioral-modes/SKILL.md +42 -0
  58. package/.agent/skills/brainstorming/SKILL.md +42 -0
  59. package/.agent/skills/building-native-ui/SKILL.md +42 -0
  60. package/.agent/skills/clean-code/SKILL.md +42 -0
  61. package/.agent/skills/code-review-checklist/SKILL.md +42 -0
  62. package/.agent/skills/config-validator/SKILL.md +42 -0
  63. package/.agent/skills/csharp-developer/SKILL.md +42 -0
  64. package/.agent/skills/data-validation-schemas/SKILL.md +42 -0
  65. package/.agent/skills/database-design/SKILL.md +42 -0
  66. package/.agent/skills/deployment-procedures/SKILL.md +42 -0
  67. package/.agent/skills/devops-engineer/SKILL.md +42 -0
  68. package/.agent/skills/devops-incident-responder/SKILL.md +42 -0
  69. package/.agent/skills/documentation-templates/SKILL.md +42 -0
  70. package/.agent/skills/edge-computing/SKILL.md +42 -0
  71. package/.agent/skills/error-resilience/SKILL.md +42 -0
  72. package/.agent/skills/extract-design-system/SKILL.md +42 -0
  73. package/.agent/skills/framer-motion-expert/SKILL.md +42 -0
  74. package/.agent/skills/frontend-design/SKILL.md +42 -0
  75. package/.agent/skills/frontend-security-expert/SKILL.md +123 -0
  76. package/.agent/skills/game-design-expert/SKILL.md +42 -0
  77. package/.agent/skills/game-engineering-expert/SKILL.md +42 -0
  78. package/.agent/skills/geo-fundamentals/SKILL.md +42 -0
  79. package/.agent/skills/github-operations/SKILL.md +42 -0
  80. package/.agent/skills/gsap-core/SKILL.md +42 -0
  81. package/.agent/skills/gsap-frameworks/SKILL.md +42 -0
  82. package/.agent/skills/gsap-performance/SKILL.md +42 -0
  83. package/.agent/skills/gsap-plugins/SKILL.md +42 -0
  84. package/.agent/skills/gsap-react/SKILL.md +42 -0
  85. package/.agent/skills/gsap-scrolltrigger/SKILL.md +42 -0
  86. package/.agent/skills/gsap-timeline/SKILL.md +42 -0
  87. package/.agent/skills/gsap-utils/SKILL.md +42 -0
  88. package/.agent/skills/i18n-localization/SKILL.md +42 -0
  89. package/.agent/skills/intelligent-routing/SKILL.md +42 -0
  90. package/.agent/skills/knowledge-graph/SKILL.md +42 -0
  91. package/.agent/skills/lint-and-validate/SKILL.md +42 -0
  92. package/.agent/skills/llm-engineering/SKILL.md +42 -0
  93. package/.agent/skills/local-first/SKILL.md +42 -0
  94. package/.agent/skills/mcp-builder/SKILL.md +42 -0
  95. package/.agent/skills/mobile-design/SKILL.md +42 -0
  96. package/.agent/skills/monorepo-management/SKILL.md +42 -0
  97. package/.agent/skills/motion-engineering/SKILL.md +42 -0
  98. package/.agent/skills/nextjs-react-expert/SKILL.md +42 -0
  99. package/.agent/skills/nodejs-best-practices/SKILL.md +42 -0
  100. package/.agent/skills/observability/SKILL.md +42 -0
  101. package/.agent/skills/parallel-agents/SKILL.md +42 -0
  102. package/.agent/skills/performance-profiling/SKILL.md +42 -0
  103. package/.agent/skills/plan-writing/SKILL.md +42 -0
  104. package/.agent/skills/platform-engineer/SKILL.md +42 -0
  105. package/.agent/skills/playwright-best-practices/SKILL.md +42 -0
  106. package/.agent/skills/powershell-windows/SKILL.md +42 -0
  107. package/.agent/skills/project-idioms/SKILL.md +42 -0
  108. package/.agent/skills/python-patterns/SKILL.md +42 -0
  109. package/.agent/skills/python-pro/SKILL.md +42 -0
  110. package/.agent/skills/react-specialist/SKILL.md +42 -0
  111. package/.agent/skills/readme-builder/SKILL.md +42 -0
  112. package/.agent/skills/realtime-patterns/SKILL.md +42 -0
  113. package/.agent/skills/red-team-tactics/SKILL.md +42 -0
  114. package/.agent/skills/rust-pro/SKILL.md +42 -0
  115. package/.agent/skills/seo-fundamentals/SKILL.md +42 -0
  116. package/.agent/skills/server-management/SKILL.md +42 -0
  117. package/.agent/skills/shadcn-ui-expert/SKILL.md +42 -0
  118. package/.agent/skills/skill-creator/SKILL.md +42 -0
  119. package/.agent/skills/sql-pro/SKILL.md +42 -0
  120. package/.agent/skills/supabase-postgres-best-practices/SKILL.md +42 -0
  121. package/.agent/skills/swiftui-expert/SKILL.md +42 -0
  122. package/.agent/skills/systematic-debugging/SKILL.md +42 -0
  123. package/.agent/skills/tailwind-patterns/SKILL.md +42 -0
  124. package/.agent/skills/tdd-workflow/SKILL.md +42 -0
  125. package/.agent/skills/test-result-analyzer/SKILL.md +42 -0
  126. package/.agent/skills/testing-patterns/SKILL.md +42 -0
  127. package/.agent/skills/trend-researcher/SKILL.md +42 -0
  128. package/.agent/skills/typescript-advanced/SKILL.md +42 -0
  129. package/.agent/skills/ui-ux-pro-max/SKILL.md +42 -0
  130. package/.agent/skills/ui-ux-researcher/SKILL.md +42 -0
  131. package/.agent/skills/vue-expert/SKILL.md +42 -0
  132. package/.agent/skills/vulnerability-scanner/SKILL.md +42 -0
  133. package/.agent/skills/web-accessibility-auditor/SKILL.md +42 -0
  134. package/.agent/skills/web-design-guidelines/SKILL.md +42 -0
  135. package/.agent/skills/webapp-testing/SKILL.md +42 -0
  136. package/.agent/skills/whimsy-injector/SKILL.md +42 -0
  137. package/.agent/skills/workflow-optimizer/SKILL.md +42 -0
  138. package/.agent/workflows/marathon.md +247 -0
  139. package/.agent/workflows/super-prompt.md +27 -0
  140. package/bin/tribunal-kit.js +47 -1
  141. package/package.json +3 -2
@@ -560,3 +560,45 @@ Review these questions before confirming output:
560
560
 
561
561
  ## VBC Protocol (Verification-Before-Completion)
562
562
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
563
+
564
+
565
+ ---
566
+
567
+ ## 🤖 LLM-Specific Traps
568
+
569
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
570
+
571
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
572
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
573
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
574
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
575
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
576
+
577
+ ---
578
+
579
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
580
+
581
+ **Slash command: `/review` or `/tribunal-full`**
582
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
583
+
584
+ ### ❌ Forbidden AI Tropes
585
+
586
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
587
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
588
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
589
+
590
+ ### ✅ Pre-Flight Self-Audit
591
+
592
+ Review these questions before confirming output:
593
+ ```
594
+ ✅ Did I rely ONLY on real, verified tools and methods?
595
+ ✅ Is this solution appropriately scoped to the user's constraints?
596
+ ✅ Did I handle potential failure modes and edge cases?
597
+ ✅ Have I avoided generic boilerplate that doesn't add value?
598
+ ```
599
+
600
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
601
+
602
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
603
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
604
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -242,3 +242,45 @@ Review these questions before confirming output:
242
242
 
243
243
  ## VBC Protocol (Verification-Before-Completion)
244
244
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
245
+
246
+
247
+ ---
248
+
249
+ ## 🤖 LLM-Specific Traps
250
+
251
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
252
+
253
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
254
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
255
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
256
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
257
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
258
+
259
+ ---
260
+
261
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
262
+
263
+ **Slash command: `/review` or `/tribunal-full`**
264
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
265
+
266
+ ### ❌ Forbidden AI Tropes
267
+
268
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
269
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
270
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
271
+
272
+ ### ✅ Pre-Flight Self-Audit
273
+
274
+ Review these questions before confirming output:
275
+ ```
276
+ ✅ Did I rely ONLY on real, verified tools and methods?
277
+ ✅ Is this solution appropriately scoped to the user's constraints?
278
+ ✅ Did I handle potential failure modes and edge cases?
279
+ ✅ Have I avoided generic boilerplate that doesn't add value?
280
+ ```
281
+
282
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
283
+
284
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
285
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
286
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -273,3 +273,45 @@ Review these questions before confirming output:
273
273
 
274
274
  ## VBC Protocol (Verification-Before-Completion)
275
275
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
276
+
277
+
278
+ ---
279
+
280
+ ## 🤖 LLM-Specific Traps
281
+
282
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
283
+
284
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
285
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
286
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
287
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
288
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
289
+
290
+ ---
291
+
292
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
293
+
294
+ **Slash command: `/review` or `/tribunal-full`**
295
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
296
+
297
+ ### ❌ Forbidden AI Tropes
298
+
299
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
300
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
301
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
302
+
303
+ ### ✅ Pre-Flight Self-Audit
304
+
305
+ Review these questions before confirming output:
306
+ ```
307
+ ✅ Did I rely ONLY on real, verified tools and methods?
308
+ ✅ Is this solution appropriately scoped to the user's constraints?
309
+ ✅ Did I handle potential failure modes and edge cases?
310
+ ✅ Have I avoided generic boilerplate that doesn't add value?
311
+ ```
312
+
313
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
314
+
315
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
316
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
317
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -402,3 +402,45 @@ Review these questions before confirming output:
402
402
 
403
403
  ## VBC Protocol (Verification-Before-Completion)
404
404
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
405
+
406
+
407
+ ---
408
+
409
+ ## 🤖 LLM-Specific Traps
410
+
411
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
412
+
413
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
414
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
415
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
416
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
417
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
418
+
419
+ ---
420
+
421
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
422
+
423
+ **Slash command: `/review` or `/tribunal-full`**
424
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
425
+
426
+ ### ❌ Forbidden AI Tropes
427
+
428
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
429
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
430
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
431
+
432
+ ### ✅ Pre-Flight Self-Audit
433
+
434
+ Review these questions before confirming output:
435
+ ```
436
+ ✅ Did I rely ONLY on real, verified tools and methods?
437
+ ✅ Is this solution appropriately scoped to the user's constraints?
438
+ ✅ Did I handle potential failure modes and edge cases?
439
+ ✅ Have I avoided generic boilerplate that doesn't add value?
440
+ ```
441
+
442
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
443
+
444
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
445
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
446
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -216,3 +216,45 @@ Review these questions before confirming output:
216
216
 
217
217
  ## VBC Protocol (Verification-Before-Completion)
218
218
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
219
+
220
+
221
+ ---
222
+
223
+ ## 🤖 LLM-Specific Traps
224
+
225
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
226
+
227
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
228
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
229
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
230
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
231
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
232
+
233
+ ---
234
+
235
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
236
+
237
+ **Slash command: `/review` or `/tribunal-full`**
238
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
239
+
240
+ ### ❌ Forbidden AI Tropes
241
+
242
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
243
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
244
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
245
+
246
+ ### ✅ Pre-Flight Self-Audit
247
+
248
+ Review these questions before confirming output:
249
+ ```
250
+ ✅ Did I rely ONLY on real, verified tools and methods?
251
+ ✅ Is this solution appropriately scoped to the user's constraints?
252
+ ✅ Did I handle potential failure modes and edge cases?
253
+ ✅ Have I avoided generic boilerplate that doesn't add value?
254
+ ```
255
+
256
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
257
+
258
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
259
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
260
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -184,3 +184,45 @@ Review these questions before confirming output:
184
184
 
185
185
  ## VBC Protocol (Verification-Before-Completion)
186
186
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
187
+
188
+
189
+ ---
190
+
191
+ ## 🤖 LLM-Specific Traps
192
+
193
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
194
+
195
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
196
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
197
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
198
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
199
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
200
+
201
+ ---
202
+
203
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
204
+
205
+ **Slash command: `/review` or `/tribunal-full`**
206
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
207
+
208
+ ### ❌ Forbidden AI Tropes
209
+
210
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
211
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
212
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
213
+
214
+ ### ✅ Pre-Flight Self-Audit
215
+
216
+ Review these questions before confirming output:
217
+ ```
218
+ ✅ Did I rely ONLY on real, verified tools and methods?
219
+ ✅ Is this solution appropriately scoped to the user's constraints?
220
+ ✅ Did I handle potential failure modes and edge cases?
221
+ ✅ Have I avoided generic boilerplate that doesn't add value?
222
+ ```
223
+
224
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
225
+
226
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
227
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
228
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -167,3 +167,45 @@ Review these questions before confirming output:
167
167
 
168
168
  ## VBC Protocol (Verification-Before-Completion)
169
169
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
170
+
171
+
172
+ ---
173
+
174
+ ## 🤖 LLM-Specific Traps
175
+
176
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
177
+
178
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
179
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
180
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
181
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
182
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
183
+
184
+ ---
185
+
186
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
187
+
188
+ **Slash command: `/review` or `/tribunal-full`**
189
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
190
+
191
+ ### ❌ Forbidden AI Tropes
192
+
193
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
194
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
195
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
196
+
197
+ ### ✅ Pre-Flight Self-Audit
198
+
199
+ Review these questions before confirming output:
200
+ ```
201
+ ✅ Did I rely ONLY on real, verified tools and methods?
202
+ ✅ Is this solution appropriately scoped to the user's constraints?
203
+ ✅ Did I handle potential failure modes and edge cases?
204
+ ✅ Have I avoided generic boilerplate that doesn't add value?
205
+ ```
206
+
207
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
208
+
209
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
210
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
211
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -323,3 +323,45 @@ Review these questions before confirming output:
323
323
 
324
324
  ## VBC Protocol (Verification-Before-Completion)
325
325
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
326
+
327
+
328
+ ---
329
+
330
+ ## 🤖 LLM-Specific Traps
331
+
332
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
333
+
334
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
335
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
336
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
337
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
338
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
339
+
340
+ ---
341
+
342
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
343
+
344
+ **Slash command: `/review` or `/tribunal-full`**
345
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
346
+
347
+ ### ❌ Forbidden AI Tropes
348
+
349
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
350
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
351
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
352
+
353
+ ### ✅ Pre-Flight Self-Audit
354
+
355
+ Review these questions before confirming output:
356
+ ```
357
+ ✅ Did I rely ONLY on real, verified tools and methods?
358
+ ✅ Is this solution appropriately scoped to the user's constraints?
359
+ ✅ Did I handle potential failure modes and edge cases?
360
+ ✅ Have I avoided generic boilerplate that doesn't add value?
361
+ ```
362
+
363
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
364
+
365
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
366
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
367
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -227,3 +227,45 @@ Review these questions before confirming output:
227
227
 
228
228
  ## VBC Protocol (Verification-Before-Completion)
229
229
  You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
230
+
231
+
232
+ ---
233
+
234
+ ## 🤖 LLM-Specific Traps
235
+
236
+ AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
237
+
238
+ 1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
239
+ 2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
240
+ 3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
241
+ 4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
242
+ 5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
243
+
244
+ ---
245
+
246
+ ## 🏛️ Tribunal Integration (Anti-Hallucination)
247
+
248
+ **Slash command: `/review` or `/tribunal-full`**
249
+ **Active reviewers: `logic-reviewer` · `security-auditor`**
250
+
251
+ ### ❌ Forbidden AI Tropes
252
+
253
+ 1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
254
+ 2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
255
+ 3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
256
+
257
+ ### ✅ Pre-Flight Self-Audit
258
+
259
+ Review these questions before confirming output:
260
+ ```
261
+ ✅ Did I rely ONLY on real, verified tools and methods?
262
+ ✅ Is this solution appropriately scoped to the user's constraints?
263
+ ✅ Did I handle potential failure modes and edge cases?
264
+ ✅ Have I avoided generic boilerplate that doesn't add value?
265
+ ```
266
+
267
+ ### 🛑 Verification-Before-Completion (VBC) Protocol
268
+
269
+ **CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
270
+ - ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
271
+ - ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
@@ -0,0 +1,247 @@
1
+ ---
2
+ description: Long-running agent harness for multi-session projects. Decomposes specs into atomic features tracked in JSON, ensures clean handoffs between sessions, and provides structured progress tracking. Based on Anthropic's long-running agent patterns.
3
+ ---
4
+
5
+ # /marathon — Long-Running Agent Harness
6
+
7
+ $ARGUMENTS
8
+
9
+ ---
10
+
11
+ ## When to Use /marathon
12
+
13
+ |Use `/marathon` when...|Use something else when...|
14
+ |:---|:---|
15
+ |A project requires multiple sessions to complete|Quick one-shot task → `/generate`|
16
+ |You need structured progress tracking across context windows|Single feature addition → `/enhance`|
17
+ |Building a complex app from a high-level spec|Planning without execution → `/plan`|
18
+ |Previous agent sessions lost context or declared victory too early|Brainstorming options → `/brainstorm`|
19
+
20
+ ---
21
+
22
+ ## Sub-Commands
23
+
24
+ ```
25
+ /marathon init [spec] Start a new marathon from a specification
26
+ /marathon continue Resume work: read progress, pick next feature, implement
27
+ /marathon status Show progress dashboard
28
+ /marathon reset Archive current marathon and start fresh
29
+ ```
30
+
31
+ ---
32
+
33
+ ## Phase 1: Initialize (First Session Only)
34
+
35
+ **Trigger:** `/marathon init "Build X"`
36
+
37
+ This phase runs the **Initializer Agent** pattern — a specialized first session that sets up the foundation for all future sessions.
38
+
39
+ ### Steps
40
+
41
+ 1. **Parse the specification** — Read the user's spec carefully
42
+ 2. **Decompose into atomic features** — Generate 30–200 features depending on project complexity
43
+ - Each feature must be **independently testable**
44
+ - Each must have clear **done criteria** (verification steps)
45
+ - Group by category: `core`, `auth`, `ui`, `data`, `integration`, `polish`
46
+ - All features start with `passes: false`
47
+ 3. **Create the marathon state:**
48
+ ```bash
49
+ node .agent/scripts/marathon_harness.js init "Build X"
50
+ # Then add features one by one:
51
+ node .agent/scripts/marathon_harness.js add-feature "core" "User can open a new chat" "Navigate to main page" "Click New Chat" "Verify welcome state"
52
+ node .agent/scripts/marathon_harness.js add-feature "core" "User can type and send a message" "Open chat" "Type in input" "Press Enter" "See message appear"
53
+ # ... repeat for all features
54
+ ```
55
+ 4. **Scaffold the project** — Create initial files, install dependencies
56
+ 5. **Create init.sh** — Write a bootstrap script that starts the dev environment
57
+ 6. **Initial git commit:** `git commit -m "marathon: initial scaffold for [spec]"`
58
+ 7. **Human Gate:** User reviews the feature list before proceeding
59
+
60
+ ### Feature JSON Format
61
+
62
+ Features are stored in `.agent/history/marathon/feature_list.json` as structured JSON. JSON is used instead of Markdown because agents are less likely to inappropriately modify JSON structures.
63
+
64
+ ```json
65
+ {
66
+ "id": 1,
67
+ "category": "core",
68
+ "description": "User can open a new chat and see a welcome screen",
69
+ "steps": [
70
+ "Navigate to main page",
71
+ "Click 'New Chat' button",
72
+ "Verify welcome state renders"
73
+ ],
74
+ "passes": false,
75
+ "sessionCompleted": null
76
+ }
77
+ ```
78
+
79
+ > [!CAUTION]
80
+ > **Feature descriptions are immutable.** After initialization, agents may ONLY change the `passes` field and `sessionCompleted` timestamp. It is unacceptable to remove, edit, or reorder features — this could lead to missing or buggy functionality.
81
+
82
+ ---
83
+
84
+ ## Phase 2: Get Bearings (Every Session Start)
85
+
86
+ **Trigger:** `/marathon continue`
87
+
88
+ Every new session starts by orienting the agent. This is the **Coding Agent** pattern — understanding state before making changes.
89
+
90
+ ### Steps
91
+
92
+ 1. **Read marathon state:**
93
+ ```bash
94
+ node .agent/scripts/marathon_harness.js session-start
95
+ ```
96
+ This automatically:
97
+ - Reads `progress.json` and shows what was done in previous sessions
98
+ - Reads `git log --oneline -20` for recent commits
99
+ - Shows the next unfinished feature
100
+ - Records the session start time
101
+
102
+ 2. **Start the dev environment:**
103
+ ```bash
104
+ node .agent/scripts/auto_preview.js start
105
+ ```
106
+
107
+ 3. **Smoke test basic functionality:**
108
+ - If a web app: navigate to the main page, verify it loads without errors
109
+ - If a CLI tool: run the help command, verify it outputs correctly
110
+ - If an API: hit the health check endpoint
111
+ - If browser MCP tools are available (Puppeteer), use them for visual verification
112
+
113
+ 4. **If smoke test fails:** Fix the broken state FIRST before implementing new features. The codebase must be clean before new work begins.
114
+
115
+ 5. **Announce bearings:**
116
+ ```
117
+ Session N. Progress: 12/47 features (25%).
118
+ Working on: Feature #13 [ui] — "User can toggle dark mode"
119
+ ```
120
+
121
+ ---
122
+
123
+ ## Phase 3: Implement (One Feature Per Cycle)
124
+
125
+ Work on exactly **one feature at a time**. This incremental approach prevents the common failure mode of trying to do too much at once.
126
+
127
+ ### Steps
128
+
129
+ 1. **Impact analysis** — Identify files that will be affected (per `/enhance` workflow)
130
+ 2. **Implement the feature** — Write code, following Tribunal code quality standards
131
+ 3. **Self-verify the feature:**
132
+ - Run the verification steps listed in the feature's `steps` array
133
+ - Test as a human user would (browser for web, CLI for CLI)
134
+ - Run existing tests to ensure no regressions: `npm test` or equivalent
135
+ 4. **Mark as passing:**
136
+ ```bash
137
+ node .agent/scripts/marathon_harness.js mark <id> pass
138
+ ```
139
+ 5. **Git commit** with a descriptive message:
140
+ ```bash
141
+ git commit -m "marathon: implement feature #13 — dark mode toggle"
142
+ ```
143
+ 6. **Check context budget:**
144
+ - If context allows → return to Phase 2, step 5 (pick next feature)
145
+ - If nearing context limit → proceed to Phase 4
146
+
147
+ ### If a feature cannot be completed
148
+
149
+ If a feature is blocked or too complex for the current session:
150
+ 1. Leave it as `passes: false`
151
+ 2. Add a log note explaining why:
152
+ ```bash
153
+ node .agent/scripts/marathon_harness.js log "Feature #13 blocked: requires OAuth integration not yet set up"
154
+ ```
155
+ 3. Move to the next feature or proceed to Phase 4
156
+
157
+ ---
158
+
159
+ ## Phase 4: Clean Exit (Session End)
160
+
161
+ Every session MUST leave the codebase in a clean, merge-ready state.
162
+
163
+ ### Steps
164
+
165
+ 1. **Verify clean state:**
166
+ - All code compiles without errors
167
+ - All existing tests pass
168
+ - No half-implemented features left in an intermediate state
169
+ - If something is half-done, either complete it or revert it
170
+
171
+ 2. **Record session end:**
172
+ ```bash
173
+ node .agent/scripts/marathon_harness.js session-end "Implemented dark mode, user settings page, and notification bell"
174
+ ```
175
+
176
+ 3. **Final git commit:**
177
+ ```bash
178
+ git commit -m "marathon: session N complete, 15/47 features passing"
179
+ ```
180
+
181
+ 4. **Display status dashboard** — The session-end command automatically shows progress
182
+
183
+ ---
184
+
185
+ ## Marathon Guards
186
+
187
+ ```
188
+ ❌ Never delete or edit feature descriptions — only change the passes status
189
+ ❌ Never skip the smoke test at session start — broken code must be fixed first
190
+ ❌ Never mark a feature as passing without testing it end-to-end
191
+ ❌ Never work on more than one feature at a time
192
+ ❌ Never leave the codebase in a broken state at session end
193
+ ❌ Never declare the project "done" if any feature has passes: false
194
+ ❌ Never try to one-shot the entire project — always work incrementally
195
+ ❌ Never guess what happened in previous sessions — read progress.json and git log
196
+ ```
197
+
198
+ ---
199
+
200
+ ## State Files
201
+
202
+ All marathon state is stored in `.agent/history/marathon/` (preserved on `tk update`):
203
+
204
+ ```
205
+ .agent/history/marathon/
206
+ ├── feature_list.json ← Structured feature backlog (immutable descriptions)
207
+ ├── progress.json ← Session log + progress notes
208
+ └── archive/ ← Previous marathons (after reset)
209
+ ```
210
+
211
+ ---
212
+
213
+ ## Script Reference
214
+
215
+ ```bash
216
+ # Initialize
217
+ node .agent/scripts/marathon_harness.js init "Build a task management app"
218
+
219
+ # Add features (during init phase)
220
+ node .agent/scripts/marathon_harness.js add-feature "core" "User can create a task" "Click add" "Type title" "Save"
221
+
222
+ # Session lifecycle
223
+ node .agent/scripts/marathon_harness.js session-start
224
+ node .agent/scripts/marathon_harness.js session-end "Completed auth and dashboard"
225
+
226
+ # During implementation
227
+ node .agent/scripts/marathon_harness.js next
228
+ node .agent/scripts/marathon_harness.js mark 5 pass
229
+ node .agent/scripts/marathon_harness.js log "Refactored auth to use JWT"
230
+
231
+ # Status
232
+ node .agent/scripts/marathon_harness.js status
233
+
234
+ # Archive and restart
235
+ node .agent/scripts/marathon_harness.js reset
236
+ ```
237
+
238
+ ---
239
+
240
+ ## Usage Examples
241
+
242
+ ```
243
+ /marathon init Build a full-stack clone of claude.ai with chat, settings, and themes
244
+ /marathon continue
245
+ /marathon status
246
+ /marathon reset
247
+ ```