tribunal-kit 4.4.1 → 4.4.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.agent/history/architecture-graph.yaml +140 -0
- package/.agent/history/graph-cache.json +262 -0
- package/.agent/history/snapshots/bin__tribunal-kit.js.json +19 -0
- package/.agent/history/snapshots/eslint.config.js.json +9 -0
- package/.agent/history/snapshots/migrate_refs.js.json +11 -0
- package/.agent/history/snapshots/scripts__changelog.js.json +13 -0
- package/.agent/history/snapshots/scripts__sync-version.js.json +12 -0
- package/.agent/history/snapshots/scripts__validate-payload.js.json +12 -0
- package/.agent/history/snapshots/test__integration__bridges.test.js.json +14 -0
- package/.agent/history/snapshots/test__integration__init.test.js.json +14 -0
- package/.agent/history/snapshots/test__integration__routing.test.js.json +12 -0
- package/.agent/history/snapshots/test__integration__swarm_dispatcher.test.js.json +14 -0
- package/.agent/history/snapshots/test__integration__wave2.test.js.json +14 -0
- package/.agent/history/snapshots/test__unit__args.test.js.json +20 -0
- package/.agent/history/snapshots/test__unit__case_law_manager.test.js.json +11 -0
- package/.agent/history/snapshots/test__unit__context_broker.test.js.json +11 -0
- package/.agent/history/snapshots/test__unit__copyDir.test.js.json +23 -0
- package/.agent/history/snapshots/test__unit__graph_tools.test.js.json +12 -0
- package/.agent/history/snapshots/test__unit__inner_loop_validator.test.js.json +11 -0
- package/.agent/history/snapshots/test__unit__selfInstall.test.js.json +23 -0
- package/.agent/history/snapshots/test__unit__semver.test.js.json +20 -0
- package/.agent/history/snapshots/test__unit__swarm_dispatcher.test.js.json +12 -0
- package/.agent/scripts/_colors.js +170 -18
- package/.agent/scripts/_utils.js +244 -42
- package/.agent/scripts/bundle_analyzer.js +261 -290
- package/.agent/scripts/case_law_manager.js +1 -7
- package/.agent/scripts/checklist.js +278 -266
- package/.agent/scripts/colors.js +11 -17
- package/.agent/scripts/context_broker.js +1 -7
- package/.agent/scripts/dependency_analyzer.js +234 -272
- package/.agent/scripts/graph_builder.js +46 -18
- package/.agent/scripts/graph_visualizer.js +10 -4
- package/.agent/scripts/graph_zoom.js +6 -4
- package/.agent/scripts/inner_loop_validator.js +2 -8
- package/.agent/scripts/lint_runner.js +186 -187
- package/.agent/scripts/marathon_harness.js +799 -0
- package/.agent/scripts/prompt_compiler.js +56 -0
- package/.agent/scripts/schema_validator.js +8 -25
- package/.agent/scripts/security_scan.js +276 -303
- package/.agent/scripts/session_manager.js +1 -7
- package/.agent/scripts/skill_evolution.js +1 -8
- package/.agent/scripts/skill_integrator.js +1 -7
- package/.agent/scripts/test_runner.js +186 -193
- package/.agent/scripts/utils.js +17 -32
- package/.agent/scripts/verify_all.js +248 -257
- package/.agent/skills/agent-organizer/SKILL.md +42 -0
- package/.agent/skills/agentic-patterns/SKILL.md +42 -0
- package/.agent/skills/ai-prompt-injection-defense/SKILL.md +42 -0
- package/.agent/skills/api-patterns/SKILL.md +42 -0
- package/.agent/skills/api-security-auditor/SKILL.md +42 -0
- package/.agent/skills/app-builder/SKILL.md +42 -0
- package/.agent/skills/appflow-wireframe/SKILL.md +42 -0
- package/.agent/skills/architecture/SKILL.md +42 -0
- package/.agent/skills/authentication-best-practices/SKILL.md +42 -0
- package/.agent/skills/backend-security-expert/SKILL.md +122 -0
- package/.agent/skills/bash-linux/SKILL.md +42 -0
- package/.agent/skills/behavioral-modes/SKILL.md +42 -0
- package/.agent/skills/brainstorming/SKILL.md +42 -0
- package/.agent/skills/building-native-ui/SKILL.md +42 -0
- package/.agent/skills/clean-code/SKILL.md +42 -0
- package/.agent/skills/code-review-checklist/SKILL.md +42 -0
- package/.agent/skills/config-validator/SKILL.md +42 -0
- package/.agent/skills/csharp-developer/SKILL.md +42 -0
- package/.agent/skills/data-validation-schemas/SKILL.md +42 -0
- package/.agent/skills/database-design/SKILL.md +42 -0
- package/.agent/skills/deployment-procedures/SKILL.md +42 -0
- package/.agent/skills/devops-engineer/SKILL.md +42 -0
- package/.agent/skills/devops-incident-responder/SKILL.md +42 -0
- package/.agent/skills/documentation-templates/SKILL.md +42 -0
- package/.agent/skills/edge-computing/SKILL.md +42 -0
- package/.agent/skills/error-resilience/SKILL.md +42 -0
- package/.agent/skills/extract-design-system/SKILL.md +42 -0
- package/.agent/skills/framer-motion-expert/SKILL.md +42 -0
- package/.agent/skills/frontend-design/SKILL.md +42 -0
- package/.agent/skills/frontend-security-expert/SKILL.md +123 -0
- package/.agent/skills/game-design-expert/SKILL.md +42 -0
- package/.agent/skills/game-engineering-expert/SKILL.md +42 -0
- package/.agent/skills/geo-fundamentals/SKILL.md +42 -0
- package/.agent/skills/github-operations/SKILL.md +42 -0
- package/.agent/skills/gsap-core/SKILL.md +42 -0
- package/.agent/skills/gsap-frameworks/SKILL.md +42 -0
- package/.agent/skills/gsap-performance/SKILL.md +42 -0
- package/.agent/skills/gsap-plugins/SKILL.md +42 -0
- package/.agent/skills/gsap-react/SKILL.md +42 -0
- package/.agent/skills/gsap-scrolltrigger/SKILL.md +42 -0
- package/.agent/skills/gsap-timeline/SKILL.md +42 -0
- package/.agent/skills/gsap-utils/SKILL.md +42 -0
- package/.agent/skills/i18n-localization/SKILL.md +42 -0
- package/.agent/skills/intelligent-routing/SKILL.md +42 -0
- package/.agent/skills/knowledge-graph/SKILL.md +42 -0
- package/.agent/skills/lint-and-validate/SKILL.md +42 -0
- package/.agent/skills/llm-engineering/SKILL.md +42 -0
- package/.agent/skills/local-first/SKILL.md +42 -0
- package/.agent/skills/mcp-builder/SKILL.md +42 -0
- package/.agent/skills/mobile-design/SKILL.md +42 -0
- package/.agent/skills/monorepo-management/SKILL.md +42 -0
- package/.agent/skills/motion-engineering/SKILL.md +42 -0
- package/.agent/skills/nextjs-react-expert/SKILL.md +42 -0
- package/.agent/skills/nodejs-best-practices/SKILL.md +42 -0
- package/.agent/skills/observability/SKILL.md +42 -0
- package/.agent/skills/parallel-agents/SKILL.md +42 -0
- package/.agent/skills/performance-profiling/SKILL.md +42 -0
- package/.agent/skills/plan-writing/SKILL.md +42 -0
- package/.agent/skills/platform-engineer/SKILL.md +42 -0
- package/.agent/skills/playwright-best-practices/SKILL.md +42 -0
- package/.agent/skills/powershell-windows/SKILL.md +42 -0
- package/.agent/skills/project-idioms/SKILL.md +42 -0
- package/.agent/skills/python-patterns/SKILL.md +42 -0
- package/.agent/skills/python-pro/SKILL.md +42 -0
- package/.agent/skills/react-specialist/SKILL.md +42 -0
- package/.agent/skills/readme-builder/SKILL.md +42 -0
- package/.agent/skills/realtime-patterns/SKILL.md +42 -0
- package/.agent/skills/red-team-tactics/SKILL.md +42 -0
- package/.agent/skills/rust-pro/SKILL.md +42 -0
- package/.agent/skills/seo-fundamentals/SKILL.md +42 -0
- package/.agent/skills/server-management/SKILL.md +42 -0
- package/.agent/skills/shadcn-ui-expert/SKILL.md +42 -0
- package/.agent/skills/skill-creator/SKILL.md +42 -0
- package/.agent/skills/sql-pro/SKILL.md +42 -0
- package/.agent/skills/supabase-postgres-best-practices/SKILL.md +42 -0
- package/.agent/skills/swiftui-expert/SKILL.md +42 -0
- package/.agent/skills/systematic-debugging/SKILL.md +42 -0
- package/.agent/skills/tailwind-patterns/SKILL.md +42 -0
- package/.agent/skills/tdd-workflow/SKILL.md +42 -0
- package/.agent/skills/test-result-analyzer/SKILL.md +42 -0
- package/.agent/skills/testing-patterns/SKILL.md +42 -0
- package/.agent/skills/trend-researcher/SKILL.md +42 -0
- package/.agent/skills/typescript-advanced/SKILL.md +42 -0
- package/.agent/skills/ui-ux-pro-max/SKILL.md +42 -0
- package/.agent/skills/ui-ux-researcher/SKILL.md +42 -0
- package/.agent/skills/vue-expert/SKILL.md +42 -0
- package/.agent/skills/vulnerability-scanner/SKILL.md +42 -0
- package/.agent/skills/web-accessibility-auditor/SKILL.md +42 -0
- package/.agent/skills/web-design-guidelines/SKILL.md +42 -0
- package/.agent/skills/webapp-testing/SKILL.md +42 -0
- package/.agent/skills/whimsy-injector/SKILL.md +42 -0
- package/.agent/skills/workflow-optimizer/SKILL.md +42 -0
- package/.agent/workflows/marathon.md +247 -0
- package/.agent/workflows/super-prompt.md +27 -0
- package/bin/tribunal-kit.js +47 -1
- package/package.json +3 -2
|
@@ -560,3 +560,45 @@ Review these questions before confirming output:
|
|
|
560
560
|
|
|
561
561
|
## VBC Protocol (Verification-Before-Completion)
|
|
562
562
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
563
|
+
|
|
564
|
+
|
|
565
|
+
---
|
|
566
|
+
|
|
567
|
+
## 🤖 LLM-Specific Traps
|
|
568
|
+
|
|
569
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
570
|
+
|
|
571
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
572
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
573
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
574
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
575
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
576
|
+
|
|
577
|
+
---
|
|
578
|
+
|
|
579
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
580
|
+
|
|
581
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
582
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
583
|
+
|
|
584
|
+
### ❌ Forbidden AI Tropes
|
|
585
|
+
|
|
586
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
587
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
588
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
589
|
+
|
|
590
|
+
### ✅ Pre-Flight Self-Audit
|
|
591
|
+
|
|
592
|
+
Review these questions before confirming output:
|
|
593
|
+
```
|
|
594
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
595
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
596
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
597
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
598
|
+
```
|
|
599
|
+
|
|
600
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
601
|
+
|
|
602
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
603
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
604
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -242,3 +242,45 @@ Review these questions before confirming output:
|
|
|
242
242
|
|
|
243
243
|
## VBC Protocol (Verification-Before-Completion)
|
|
244
244
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
245
|
+
|
|
246
|
+
|
|
247
|
+
---
|
|
248
|
+
|
|
249
|
+
## 🤖 LLM-Specific Traps
|
|
250
|
+
|
|
251
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
252
|
+
|
|
253
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
254
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
255
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
256
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
257
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
258
|
+
|
|
259
|
+
---
|
|
260
|
+
|
|
261
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
262
|
+
|
|
263
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
264
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
265
|
+
|
|
266
|
+
### ❌ Forbidden AI Tropes
|
|
267
|
+
|
|
268
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
269
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
270
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
271
|
+
|
|
272
|
+
### ✅ Pre-Flight Self-Audit
|
|
273
|
+
|
|
274
|
+
Review these questions before confirming output:
|
|
275
|
+
```
|
|
276
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
277
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
278
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
279
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
280
|
+
```
|
|
281
|
+
|
|
282
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
283
|
+
|
|
284
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
285
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
286
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -273,3 +273,45 @@ Review these questions before confirming output:
|
|
|
273
273
|
|
|
274
274
|
## VBC Protocol (Verification-Before-Completion)
|
|
275
275
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
276
|
+
|
|
277
|
+
|
|
278
|
+
---
|
|
279
|
+
|
|
280
|
+
## 🤖 LLM-Specific Traps
|
|
281
|
+
|
|
282
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
283
|
+
|
|
284
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
285
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
286
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
287
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
288
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
289
|
+
|
|
290
|
+
---
|
|
291
|
+
|
|
292
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
293
|
+
|
|
294
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
295
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
296
|
+
|
|
297
|
+
### ❌ Forbidden AI Tropes
|
|
298
|
+
|
|
299
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
300
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
301
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
302
|
+
|
|
303
|
+
### ✅ Pre-Flight Self-Audit
|
|
304
|
+
|
|
305
|
+
Review these questions before confirming output:
|
|
306
|
+
```
|
|
307
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
308
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
309
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
310
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
311
|
+
```
|
|
312
|
+
|
|
313
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
314
|
+
|
|
315
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
316
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
317
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -402,3 +402,45 @@ Review these questions before confirming output:
|
|
|
402
402
|
|
|
403
403
|
## VBC Protocol (Verification-Before-Completion)
|
|
404
404
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
405
|
+
|
|
406
|
+
|
|
407
|
+
---
|
|
408
|
+
|
|
409
|
+
## 🤖 LLM-Specific Traps
|
|
410
|
+
|
|
411
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
412
|
+
|
|
413
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
414
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
415
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
416
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
417
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
418
|
+
|
|
419
|
+
---
|
|
420
|
+
|
|
421
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
422
|
+
|
|
423
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
424
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
425
|
+
|
|
426
|
+
### ❌ Forbidden AI Tropes
|
|
427
|
+
|
|
428
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
429
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
430
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
431
|
+
|
|
432
|
+
### ✅ Pre-Flight Self-Audit
|
|
433
|
+
|
|
434
|
+
Review these questions before confirming output:
|
|
435
|
+
```
|
|
436
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
437
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
438
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
439
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
440
|
+
```
|
|
441
|
+
|
|
442
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
443
|
+
|
|
444
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
445
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
446
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -216,3 +216,45 @@ Review these questions before confirming output:
|
|
|
216
216
|
|
|
217
217
|
## VBC Protocol (Verification-Before-Completion)
|
|
218
218
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
219
|
+
|
|
220
|
+
|
|
221
|
+
---
|
|
222
|
+
|
|
223
|
+
## 🤖 LLM-Specific Traps
|
|
224
|
+
|
|
225
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
226
|
+
|
|
227
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
228
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
229
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
230
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
231
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
232
|
+
|
|
233
|
+
---
|
|
234
|
+
|
|
235
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
236
|
+
|
|
237
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
238
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
239
|
+
|
|
240
|
+
### ❌ Forbidden AI Tropes
|
|
241
|
+
|
|
242
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
243
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
244
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
245
|
+
|
|
246
|
+
### ✅ Pre-Flight Self-Audit
|
|
247
|
+
|
|
248
|
+
Review these questions before confirming output:
|
|
249
|
+
```
|
|
250
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
251
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
252
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
253
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
254
|
+
```
|
|
255
|
+
|
|
256
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
257
|
+
|
|
258
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
259
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
260
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -184,3 +184,45 @@ Review these questions before confirming output:
|
|
|
184
184
|
|
|
185
185
|
## VBC Protocol (Verification-Before-Completion)
|
|
186
186
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
187
|
+
|
|
188
|
+
|
|
189
|
+
---
|
|
190
|
+
|
|
191
|
+
## 🤖 LLM-Specific Traps
|
|
192
|
+
|
|
193
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
194
|
+
|
|
195
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
196
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
197
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
198
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
199
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
200
|
+
|
|
201
|
+
---
|
|
202
|
+
|
|
203
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
204
|
+
|
|
205
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
206
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
207
|
+
|
|
208
|
+
### ❌ Forbidden AI Tropes
|
|
209
|
+
|
|
210
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
211
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
212
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
213
|
+
|
|
214
|
+
### ✅ Pre-Flight Self-Audit
|
|
215
|
+
|
|
216
|
+
Review these questions before confirming output:
|
|
217
|
+
```
|
|
218
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
219
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
220
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
221
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
222
|
+
```
|
|
223
|
+
|
|
224
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
225
|
+
|
|
226
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
227
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
228
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -167,3 +167,45 @@ Review these questions before confirming output:
|
|
|
167
167
|
|
|
168
168
|
## VBC Protocol (Verification-Before-Completion)
|
|
169
169
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
170
|
+
|
|
171
|
+
|
|
172
|
+
---
|
|
173
|
+
|
|
174
|
+
## 🤖 LLM-Specific Traps
|
|
175
|
+
|
|
176
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
177
|
+
|
|
178
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
179
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
180
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
181
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
182
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
183
|
+
|
|
184
|
+
---
|
|
185
|
+
|
|
186
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
187
|
+
|
|
188
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
189
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
190
|
+
|
|
191
|
+
### ❌ Forbidden AI Tropes
|
|
192
|
+
|
|
193
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
194
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
195
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
196
|
+
|
|
197
|
+
### ✅ Pre-Flight Self-Audit
|
|
198
|
+
|
|
199
|
+
Review these questions before confirming output:
|
|
200
|
+
```
|
|
201
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
202
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
203
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
204
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
205
|
+
```
|
|
206
|
+
|
|
207
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
208
|
+
|
|
209
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
210
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
211
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -323,3 +323,45 @@ Review these questions before confirming output:
|
|
|
323
323
|
|
|
324
324
|
## VBC Protocol (Verification-Before-Completion)
|
|
325
325
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
326
|
+
|
|
327
|
+
|
|
328
|
+
---
|
|
329
|
+
|
|
330
|
+
## 🤖 LLM-Specific Traps
|
|
331
|
+
|
|
332
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
333
|
+
|
|
334
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
335
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
336
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
337
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
338
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
339
|
+
|
|
340
|
+
---
|
|
341
|
+
|
|
342
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
343
|
+
|
|
344
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
345
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
346
|
+
|
|
347
|
+
### ❌ Forbidden AI Tropes
|
|
348
|
+
|
|
349
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
350
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
351
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
352
|
+
|
|
353
|
+
### ✅ Pre-Flight Self-Audit
|
|
354
|
+
|
|
355
|
+
Review these questions before confirming output:
|
|
356
|
+
```
|
|
357
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
358
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
359
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
360
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
361
|
+
```
|
|
362
|
+
|
|
363
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
364
|
+
|
|
365
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
366
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
367
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -227,3 +227,45 @@ Review these questions before confirming output:
|
|
|
227
227
|
|
|
228
228
|
## VBC Protocol (Verification-Before-Completion)
|
|
229
229
|
You MUST verify existing code signatures and variables before attempting to modify or call them. No hallucination is permitted.
|
|
230
|
+
|
|
231
|
+
|
|
232
|
+
---
|
|
233
|
+
|
|
234
|
+
## 🤖 LLM-Specific Traps
|
|
235
|
+
|
|
236
|
+
AI coding assistants often fall into specific bad habits when dealing with this domain. These are strictly forbidden:
|
|
237
|
+
|
|
238
|
+
1. **Over-engineering:** Proposing complex abstractions or distributed systems when a simpler approach suffices.
|
|
239
|
+
2. **Hallucinated Libraries/Methods:** Using non-existent methods or packages. Always `// VERIFY` or check `package.json` / `requirements.txt`.
|
|
240
|
+
3. **Skipping Edge Cases:** Writing the "happy path" and ignoring error handling, timeouts, or data validation.
|
|
241
|
+
4. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
242
|
+
5. **Silent Degradation:** Catching and suppressing errors without logging or re-raising.
|
|
243
|
+
|
|
244
|
+
---
|
|
245
|
+
|
|
246
|
+
## 🏛️ Tribunal Integration (Anti-Hallucination)
|
|
247
|
+
|
|
248
|
+
**Slash command: `/review` or `/tribunal-full`**
|
|
249
|
+
**Active reviewers: `logic-reviewer` · `security-auditor`**
|
|
250
|
+
|
|
251
|
+
### ❌ Forbidden AI Tropes
|
|
252
|
+
|
|
253
|
+
1. **Blind Assumptions:** Never make an assumption without documenting it clearly with `// VERIFY: [reason]`.
|
|
254
|
+
2. **Silent Degradation:** Catching and suppressing errors without logging or handling.
|
|
255
|
+
3. **Context Amnesia:** Forgetting the user's constraints and offering generic advice instead of tailored solutions.
|
|
256
|
+
|
|
257
|
+
### ✅ Pre-Flight Self-Audit
|
|
258
|
+
|
|
259
|
+
Review these questions before confirming output:
|
|
260
|
+
```
|
|
261
|
+
✅ Did I rely ONLY on real, verified tools and methods?
|
|
262
|
+
✅ Is this solution appropriately scoped to the user's constraints?
|
|
263
|
+
✅ Did I handle potential failure modes and edge cases?
|
|
264
|
+
✅ Have I avoided generic boilerplate that doesn't add value?
|
|
265
|
+
```
|
|
266
|
+
|
|
267
|
+
### 🛑 Verification-Before-Completion (VBC) Protocol
|
|
268
|
+
|
|
269
|
+
**CRITICAL:** You must follow a strict "evidence-based closeout" state machine.
|
|
270
|
+
- ❌ **Forbidden:** Declaring a task complete because the output "looks correct."
|
|
271
|
+
- ✅ **Required:** You are explicitly forbidden from finalizing any task without providing **concrete evidence** (terminal output, passing tests, compile success, or equivalent proof) that your output works as intended.
|
|
@@ -0,0 +1,247 @@
|
|
|
1
|
+
---
|
|
2
|
+
description: Long-running agent harness for multi-session projects. Decomposes specs into atomic features tracked in JSON, ensures clean handoffs between sessions, and provides structured progress tracking. Based on Anthropic's long-running agent patterns.
|
|
3
|
+
---
|
|
4
|
+
|
|
5
|
+
# /marathon — Long-Running Agent Harness
|
|
6
|
+
|
|
7
|
+
$ARGUMENTS
|
|
8
|
+
|
|
9
|
+
---
|
|
10
|
+
|
|
11
|
+
## When to Use /marathon
|
|
12
|
+
|
|
13
|
+
|Use `/marathon` when...|Use something else when...|
|
|
14
|
+
|:---|:---|
|
|
15
|
+
|A project requires multiple sessions to complete|Quick one-shot task → `/generate`|
|
|
16
|
+
|You need structured progress tracking across context windows|Single feature addition → `/enhance`|
|
|
17
|
+
|Building a complex app from a high-level spec|Planning without execution → `/plan`|
|
|
18
|
+
|Previous agent sessions lost context or declared victory too early|Brainstorming options → `/brainstorm`|
|
|
19
|
+
|
|
20
|
+
---
|
|
21
|
+
|
|
22
|
+
## Sub-Commands
|
|
23
|
+
|
|
24
|
+
```
|
|
25
|
+
/marathon init [spec] Start a new marathon from a specification
|
|
26
|
+
/marathon continue Resume work: read progress, pick next feature, implement
|
|
27
|
+
/marathon status Show progress dashboard
|
|
28
|
+
/marathon reset Archive current marathon and start fresh
|
|
29
|
+
```
|
|
30
|
+
|
|
31
|
+
---
|
|
32
|
+
|
|
33
|
+
## Phase 1: Initialize (First Session Only)
|
|
34
|
+
|
|
35
|
+
**Trigger:** `/marathon init "Build X"`
|
|
36
|
+
|
|
37
|
+
This phase runs the **Initializer Agent** pattern — a specialized first session that sets up the foundation for all future sessions.
|
|
38
|
+
|
|
39
|
+
### Steps
|
|
40
|
+
|
|
41
|
+
1. **Parse the specification** — Read the user's spec carefully
|
|
42
|
+
2. **Decompose into atomic features** — Generate 30–200 features depending on project complexity
|
|
43
|
+
- Each feature must be **independently testable**
|
|
44
|
+
- Each must have clear **done criteria** (verification steps)
|
|
45
|
+
- Group by category: `core`, `auth`, `ui`, `data`, `integration`, `polish`
|
|
46
|
+
- All features start with `passes: false`
|
|
47
|
+
3. **Create the marathon state:**
|
|
48
|
+
```bash
|
|
49
|
+
node .agent/scripts/marathon_harness.js init "Build X"
|
|
50
|
+
# Then add features one by one:
|
|
51
|
+
node .agent/scripts/marathon_harness.js add-feature "core" "User can open a new chat" "Navigate to main page" "Click New Chat" "Verify welcome state"
|
|
52
|
+
node .agent/scripts/marathon_harness.js add-feature "core" "User can type and send a message" "Open chat" "Type in input" "Press Enter" "See message appear"
|
|
53
|
+
# ... repeat for all features
|
|
54
|
+
```
|
|
55
|
+
4. **Scaffold the project** — Create initial files, install dependencies
|
|
56
|
+
5. **Create init.sh** — Write a bootstrap script that starts the dev environment
|
|
57
|
+
6. **Initial git commit:** `git commit -m "marathon: initial scaffold for [spec]"`
|
|
58
|
+
7. **Human Gate:** User reviews the feature list before proceeding
|
|
59
|
+
|
|
60
|
+
### Feature JSON Format
|
|
61
|
+
|
|
62
|
+
Features are stored in `.agent/history/marathon/feature_list.json` as structured JSON. JSON is used instead of Markdown because agents are less likely to inappropriately modify JSON structures.
|
|
63
|
+
|
|
64
|
+
```json
|
|
65
|
+
{
|
|
66
|
+
"id": 1,
|
|
67
|
+
"category": "core",
|
|
68
|
+
"description": "User can open a new chat and see a welcome screen",
|
|
69
|
+
"steps": [
|
|
70
|
+
"Navigate to main page",
|
|
71
|
+
"Click 'New Chat' button",
|
|
72
|
+
"Verify welcome state renders"
|
|
73
|
+
],
|
|
74
|
+
"passes": false,
|
|
75
|
+
"sessionCompleted": null
|
|
76
|
+
}
|
|
77
|
+
```
|
|
78
|
+
|
|
79
|
+
> [!CAUTION]
|
|
80
|
+
> **Feature descriptions are immutable.** After initialization, agents may ONLY change the `passes` field and `sessionCompleted` timestamp. It is unacceptable to remove, edit, or reorder features — this could lead to missing or buggy functionality.
|
|
81
|
+
|
|
82
|
+
---
|
|
83
|
+
|
|
84
|
+
## Phase 2: Get Bearings (Every Session Start)
|
|
85
|
+
|
|
86
|
+
**Trigger:** `/marathon continue`
|
|
87
|
+
|
|
88
|
+
Every new session starts by orienting the agent. This is the **Coding Agent** pattern — understanding state before making changes.
|
|
89
|
+
|
|
90
|
+
### Steps
|
|
91
|
+
|
|
92
|
+
1. **Read marathon state:**
|
|
93
|
+
```bash
|
|
94
|
+
node .agent/scripts/marathon_harness.js session-start
|
|
95
|
+
```
|
|
96
|
+
This automatically:
|
|
97
|
+
- Reads `progress.json` and shows what was done in previous sessions
|
|
98
|
+
- Reads `git log --oneline -20` for recent commits
|
|
99
|
+
- Shows the next unfinished feature
|
|
100
|
+
- Records the session start time
|
|
101
|
+
|
|
102
|
+
2. **Start the dev environment:**
|
|
103
|
+
```bash
|
|
104
|
+
node .agent/scripts/auto_preview.js start
|
|
105
|
+
```
|
|
106
|
+
|
|
107
|
+
3. **Smoke test basic functionality:**
|
|
108
|
+
- If a web app: navigate to the main page, verify it loads without errors
|
|
109
|
+
- If a CLI tool: run the help command, verify it outputs correctly
|
|
110
|
+
- If an API: hit the health check endpoint
|
|
111
|
+
- If browser MCP tools are available (Puppeteer), use them for visual verification
|
|
112
|
+
|
|
113
|
+
4. **If smoke test fails:** Fix the broken state FIRST before implementing new features. The codebase must be clean before new work begins.
|
|
114
|
+
|
|
115
|
+
5. **Announce bearings:**
|
|
116
|
+
```
|
|
117
|
+
Session N. Progress: 12/47 features (25%).
|
|
118
|
+
Working on: Feature #13 [ui] — "User can toggle dark mode"
|
|
119
|
+
```
|
|
120
|
+
|
|
121
|
+
---
|
|
122
|
+
|
|
123
|
+
## Phase 3: Implement (One Feature Per Cycle)
|
|
124
|
+
|
|
125
|
+
Work on exactly **one feature at a time**. This incremental approach prevents the common failure mode of trying to do too much at once.
|
|
126
|
+
|
|
127
|
+
### Steps
|
|
128
|
+
|
|
129
|
+
1. **Impact analysis** — Identify files that will be affected (per `/enhance` workflow)
|
|
130
|
+
2. **Implement the feature** — Write code, following Tribunal code quality standards
|
|
131
|
+
3. **Self-verify the feature:**
|
|
132
|
+
- Run the verification steps listed in the feature's `steps` array
|
|
133
|
+
- Test as a human user would (browser for web, CLI for CLI)
|
|
134
|
+
- Run existing tests to ensure no regressions: `npm test` or equivalent
|
|
135
|
+
4. **Mark as passing:**
|
|
136
|
+
```bash
|
|
137
|
+
node .agent/scripts/marathon_harness.js mark <id> pass
|
|
138
|
+
```
|
|
139
|
+
5. **Git commit** with a descriptive message:
|
|
140
|
+
```bash
|
|
141
|
+
git commit -m "marathon: implement feature #13 — dark mode toggle"
|
|
142
|
+
```
|
|
143
|
+
6. **Check context budget:**
|
|
144
|
+
- If context allows → return to Phase 2, step 5 (pick next feature)
|
|
145
|
+
- If nearing context limit → proceed to Phase 4
|
|
146
|
+
|
|
147
|
+
### If a feature cannot be completed
|
|
148
|
+
|
|
149
|
+
If a feature is blocked or too complex for the current session:
|
|
150
|
+
1. Leave it as `passes: false`
|
|
151
|
+
2. Add a log note explaining why:
|
|
152
|
+
```bash
|
|
153
|
+
node .agent/scripts/marathon_harness.js log "Feature #13 blocked: requires OAuth integration not yet set up"
|
|
154
|
+
```
|
|
155
|
+
3. Move to the next feature or proceed to Phase 4
|
|
156
|
+
|
|
157
|
+
---
|
|
158
|
+
|
|
159
|
+
## Phase 4: Clean Exit (Session End)
|
|
160
|
+
|
|
161
|
+
Every session MUST leave the codebase in a clean, merge-ready state.
|
|
162
|
+
|
|
163
|
+
### Steps
|
|
164
|
+
|
|
165
|
+
1. **Verify clean state:**
|
|
166
|
+
- All code compiles without errors
|
|
167
|
+
- All existing tests pass
|
|
168
|
+
- No half-implemented features left in an intermediate state
|
|
169
|
+
- If something is half-done, either complete it or revert it
|
|
170
|
+
|
|
171
|
+
2. **Record session end:**
|
|
172
|
+
```bash
|
|
173
|
+
node .agent/scripts/marathon_harness.js session-end "Implemented dark mode, user settings page, and notification bell"
|
|
174
|
+
```
|
|
175
|
+
|
|
176
|
+
3. **Final git commit:**
|
|
177
|
+
```bash
|
|
178
|
+
git commit -m "marathon: session N complete, 15/47 features passing"
|
|
179
|
+
```
|
|
180
|
+
|
|
181
|
+
4. **Display status dashboard** — The session-end command automatically shows progress
|
|
182
|
+
|
|
183
|
+
---
|
|
184
|
+
|
|
185
|
+
## Marathon Guards
|
|
186
|
+
|
|
187
|
+
```
|
|
188
|
+
❌ Never delete or edit feature descriptions — only change the passes status
|
|
189
|
+
❌ Never skip the smoke test at session start — broken code must be fixed first
|
|
190
|
+
❌ Never mark a feature as passing without testing it end-to-end
|
|
191
|
+
❌ Never work on more than one feature at a time
|
|
192
|
+
❌ Never leave the codebase in a broken state at session end
|
|
193
|
+
❌ Never declare the project "done" if any feature has passes: false
|
|
194
|
+
❌ Never try to one-shot the entire project — always work incrementally
|
|
195
|
+
❌ Never guess what happened in previous sessions — read progress.json and git log
|
|
196
|
+
```
|
|
197
|
+
|
|
198
|
+
---
|
|
199
|
+
|
|
200
|
+
## State Files
|
|
201
|
+
|
|
202
|
+
All marathon state is stored in `.agent/history/marathon/` (preserved on `tk update`):
|
|
203
|
+
|
|
204
|
+
```
|
|
205
|
+
.agent/history/marathon/
|
|
206
|
+
├── feature_list.json ← Structured feature backlog (immutable descriptions)
|
|
207
|
+
├── progress.json ← Session log + progress notes
|
|
208
|
+
└── archive/ ← Previous marathons (after reset)
|
|
209
|
+
```
|
|
210
|
+
|
|
211
|
+
---
|
|
212
|
+
|
|
213
|
+
## Script Reference
|
|
214
|
+
|
|
215
|
+
```bash
|
|
216
|
+
# Initialize
|
|
217
|
+
node .agent/scripts/marathon_harness.js init "Build a task management app"
|
|
218
|
+
|
|
219
|
+
# Add features (during init phase)
|
|
220
|
+
node .agent/scripts/marathon_harness.js add-feature "core" "User can create a task" "Click add" "Type title" "Save"
|
|
221
|
+
|
|
222
|
+
# Session lifecycle
|
|
223
|
+
node .agent/scripts/marathon_harness.js session-start
|
|
224
|
+
node .agent/scripts/marathon_harness.js session-end "Completed auth and dashboard"
|
|
225
|
+
|
|
226
|
+
# During implementation
|
|
227
|
+
node .agent/scripts/marathon_harness.js next
|
|
228
|
+
node .agent/scripts/marathon_harness.js mark 5 pass
|
|
229
|
+
node .agent/scripts/marathon_harness.js log "Refactored auth to use JWT"
|
|
230
|
+
|
|
231
|
+
# Status
|
|
232
|
+
node .agent/scripts/marathon_harness.js status
|
|
233
|
+
|
|
234
|
+
# Archive and restart
|
|
235
|
+
node .agent/scripts/marathon_harness.js reset
|
|
236
|
+
```
|
|
237
|
+
|
|
238
|
+
---
|
|
239
|
+
|
|
240
|
+
## Usage Examples
|
|
241
|
+
|
|
242
|
+
```
|
|
243
|
+
/marathon init Build a full-stack clone of claude.ai with chat, settings, and themes
|
|
244
|
+
/marathon continue
|
|
245
|
+
/marathon status
|
|
246
|
+
/marathon reset
|
|
247
|
+
```
|