mindforge-cc 2.0.0 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (115) hide show
  1. package/.agent/mindforge/add-backlog.md +32 -0
  2. package/.agent/mindforge/agent.md +31 -0
  3. package/.agent/mindforge/do.md +31 -0
  4. package/.agent/mindforge/note.md +35 -0
  5. package/.agent/mindforge/plant-seed.md +31 -0
  6. package/.agent/mindforge/review-backlog.md +34 -0
  7. package/.agent/mindforge/session-report.md +39 -0
  8. package/.agent/mindforge/ui-phase.md +34 -0
  9. package/.agent/mindforge/ui-review.md +36 -0
  10. package/.agent/mindforge/validate-phase.md +31 -0
  11. package/.agent/mindforge/workstreams.md +35 -0
  12. package/.claude/commands/mindforge/add-backlog.md +32 -0
  13. package/.claude/commands/mindforge/agent.md +31 -0
  14. package/.claude/commands/mindforge/approve.md +27 -15
  15. package/.claude/commands/mindforge/audit.md +30 -26
  16. package/.claude/commands/mindforge/auto.md +29 -18
  17. package/.claude/commands/mindforge/benchmark.md +26 -29
  18. package/.claude/commands/mindforge/browse.md +24 -22
  19. package/.claude/commands/mindforge/complete-milestone.md +28 -14
  20. package/.claude/commands/mindforge/costs.md +26 -9
  21. package/.claude/commands/mindforge/cross-review.md +27 -13
  22. package/.claude/commands/mindforge/dashboard.md +35 -98
  23. package/.claude/commands/mindforge/debug.md +34 -126
  24. package/.claude/commands/mindforge/discuss-phase.md +36 -138
  25. package/.claude/commands/mindforge/do.md +31 -0
  26. package/.claude/commands/mindforge/execute-phase.md +37 -190
  27. package/.claude/commands/mindforge/health.md +27 -17
  28. package/.claude/commands/mindforge/help.md +25 -19
  29. package/.claude/commands/mindforge/init-org.md +37 -131
  30. package/.claude/commands/mindforge/init-project.md +40 -155
  31. package/.claude/commands/mindforge/install-skill.md +32 -15
  32. package/.claude/commands/mindforge/learn.md +36 -142
  33. package/.claude/commands/mindforge/map-codebase.md +36 -298
  34. package/.claude/commands/mindforge/marketplace.md +33 -120
  35. package/.claude/commands/mindforge/metrics.md +29 -18
  36. package/.claude/commands/mindforge/migrate.md +33 -40
  37. package/.claude/commands/mindforge/milestone.md +35 -12
  38. package/.claude/commands/mindforge/new-runtime.md +25 -15
  39. package/.claude/commands/mindforge/next.md +34 -105
  40. package/.claude/commands/mindforge/note.md +35 -0
  41. package/.claude/commands/mindforge/plan-phase.md +34 -125
  42. package/.claude/commands/mindforge/plant-seed.md +31 -0
  43. package/.claude/commands/mindforge/plugins.md +30 -36
  44. package/.claude/commands/mindforge/pr-review.md +32 -41
  45. package/.claude/commands/mindforge/profile-team.md +26 -19
  46. package/.claude/commands/mindforge/publish-skill.md +28 -17
  47. package/.claude/commands/mindforge/qa.md +27 -12
  48. package/.claude/commands/mindforge/quick.md +35 -135
  49. package/.claude/commands/mindforge/release.md +27 -8
  50. package/.claude/commands/mindforge/remember.md +25 -10
  51. package/.claude/commands/mindforge/research.md +27 -9
  52. package/.claude/commands/mindforge/retrospective.md +28 -22
  53. package/.claude/commands/mindforge/review-backlog.md +34 -0
  54. package/.claude/commands/mindforge/review.md +37 -157
  55. package/.claude/commands/mindforge/security-scan.md +34 -233
  56. package/.claude/commands/mindforge/session-report.md +39 -0
  57. package/.claude/commands/mindforge/ship.md +34 -100
  58. package/.claude/commands/mindforge/skills.md +36 -141
  59. package/.claude/commands/mindforge/status.md +30 -104
  60. package/.claude/commands/mindforge/steer.md +25 -10
  61. package/.claude/commands/mindforge/sync-confluence.md +28 -9
  62. package/.claude/commands/mindforge/sync-jira.md +32 -12
  63. package/.claude/commands/mindforge/tokens.md +25 -6
  64. package/.claude/commands/mindforge/ui-phase.md +34 -0
  65. package/.claude/commands/mindforge/ui-review.md +36 -0
  66. package/.claude/commands/mindforge/update.md +33 -42
  67. package/.claude/commands/mindforge/validate-phase.md +31 -0
  68. package/.claude/commands/mindforge/verify-phase.md +30 -62
  69. package/.claude/commands/mindforge/workspace.md +28 -25
  70. package/.claude/commands/mindforge/workstreams.md +35 -0
  71. package/.mindforge/memory/decision-library.jsonl +0 -0
  72. package/.mindforge/memory/knowledge-base.jsonl +7 -0
  73. package/.mindforge/memory/pattern-library.jsonl +1 -0
  74. package/.mindforge/memory/team-preferences.jsonl +4 -0
  75. package/.mindforge/personas/advisor-researcher.md +89 -0
  76. package/.mindforge/personas/analyst.md +112 -52
  77. package/.mindforge/personas/architect.md +100 -67
  78. package/.mindforge/personas/assumptions-analyzer-extend.md +87 -0
  79. package/.mindforge/personas/assumptions-analyzer.md +109 -0
  80. package/.mindforge/personas/codebase-mapper-extend.md +93 -0
  81. package/.mindforge/personas/codebase-mapper.md +770 -0
  82. package/.mindforge/personas/coverage-specialist.md +104 -0
  83. package/.mindforge/personas/debug-specialist.md +118 -52
  84. package/.mindforge/personas/debugger.md +97 -0
  85. package/.mindforge/personas/decision-architect.md +102 -0
  86. package/.mindforge/personas/developer.md +97 -85
  87. package/.mindforge/personas/executor.md +88 -0
  88. package/.mindforge/personas/integration-checker.md +92 -0
  89. package/.mindforge/personas/nyquist-auditor.md +84 -0
  90. package/.mindforge/personas/phase-researcher.md +107 -0
  91. package/.mindforge/personas/plan-checker.md +92 -0
  92. package/.mindforge/personas/planner.md +105 -0
  93. package/.mindforge/personas/project-researcher.md +99 -0
  94. package/.mindforge/personas/qa-engineer.md +113 -61
  95. package/.mindforge/personas/release-manager.md +102 -64
  96. package/.mindforge/personas/research-agent.md +108 -24
  97. package/.mindforge/personas/research-synthesizer.md +101 -0
  98. package/.mindforge/personas/roadmapper-extend.md +100 -0
  99. package/.mindforge/personas/roadmapper.md +103 -0
  100. package/.mindforge/personas/security-reviewer.md +114 -91
  101. package/.mindforge/personas/tech-writer.md +118 -51
  102. package/.mindforge/personas/ui-auditor.md +94 -0
  103. package/.mindforge/personas/ui-checker.md +89 -0
  104. package/.mindforge/personas/ui-researcher.md +99 -0
  105. package/.mindforge/personas/user-profiler.md +93 -0
  106. package/.mindforge/personas/verifier.md +101 -0
  107. package/.planning/browser-daemon.log +32 -0
  108. package/CHANGELOG.md +26 -0
  109. package/MINDFORGE.md +2 -0
  110. package/README.md +38 -1
  111. package/bin/installer-core.js +3 -4
  112. package/docs/Context/Master-Context.md +6 -13
  113. package/docs/PERSONAS.md +611 -0
  114. package/docs/reference/commands.md +53 -43
  115. package/package.json +1 -1
@@ -1,33 +1,30 @@
1
- # MindForge — Benchmark Command
2
- # Usage: /mindforge:benchmark [--skill skill-name] [--compare skill-a skill-b]
1
+ ---
2
+ name: mindforge:benchmark
3
+ description: Measure skill effectiveness and project metrics over time
4
+ argument-hint: [--skill skill-name] [--compare skill-a skill-b]
5
+ allowed-tools:
6
+ - view_file
7
+ - list_dir
8
+ ---
3
9
 
4
- Measure skill effectiveness over time.
10
+ <objective>
11
+ Analyze command and skill performance by correlating usage data with verify pass rates and project quality scores, facilitating data-driven decisions on tool improvements.
12
+ </objective>
5
13
 
6
- ## Single skill benchmark
7
- For a named skill, analyse AUDIT.jsonl and skill-usage.jsonl:
8
- - How many times was the skill loaded this month?
9
- - What is the verify pass rate for tasks where this skill was loaded?
10
- - Are there anti-patterns less common after this skill is loaded?
11
- - What is the average session quality score when this skill is active?
14
+ <execution_context>
15
+ .claude/commands/mindforge/benchmark.md
16
+ </execution_context>
12
17
 
13
- Report:
14
- ```
15
- Skill Benchmark: security-review v1.0.0
16
- ────────────────────────────────────────
17
- Usage (last 30 days): 47 task loads
18
- Trigger distribution: text match 68%, file-path 22%, file-name 10%
19
- Verify pass rate: 91% (vs. 84% baseline without this skill)
20
- Security findings: 8 HIGH caught (0 CRITICAL missed in tasks using this skill)
21
- Session quality lift: +6.2 points average when loaded
18
+ <context>
19
+ Sources: AUDIT.jsonl, skill-usage.jsonl
20
+ Metrics: Pass rate, load frequency, anti-pattern reduction, quality lift.
21
+ </context>
22
22
 
23
- Assessment: HIGH VALUE — clear quality improvement signal
24
- ```
25
-
26
- ## Skill comparison
27
- Compare two skills head-to-head:
28
- - Load frequency
29
- - Verify pass rate improvement
30
- - Anti-pattern detection rate
31
- - Context budget cost (token estimate)
32
-
33
- Helps decide: should you keep both skills, or deprecate the lower-performer?
23
+ <process>
24
+ 1. **Gather Data**: Extract usage and outcome logs for the target skill(s).
25
+ 2. **Calculate Trends**: Determine pass rate vs baseline and session quality improvement.
26
+ 3. **Generate Assessment**:
27
+ - For single skill: Provide a usage distribution and quality lift report.
28
+ - For comparison: Provide a head-to-head comparison on cost and effectiveness.
29
+ 4. **Recommendation**: Advise on whether to keep, improve, or deprecate the targeted skills.
30
+ </process>
@@ -1,26 +1,28 @@
1
- # /mindforge:browse
1
+ ---
2
+ name: mindforge:browse
3
+ description: Control the persistent MindForge browser daemon for visual verification
4
+ argument-hint: <url | action>
5
+ allowed-tools:
6
+ - open_browser_url
7
+ - run_command
8
+ ---
2
9
 
3
- ## Usage
4
- `@mindforge browse <url | action>`
10
+ <objective>
11
+ Enable the agent to interact with web interfaces, maintain persistent sessions, and perform visual audits of UI changes using an automated browser daemon.
12
+ </objective>
5
13
 
6
- ## Description
7
- Controls the persistent MindForge browser daemon.
8
- Maintains session state (cookies/localStorage) for the AI.
14
+ <execution_context>
15
+ .claude/commands/mindforge/browse.md
16
+ </execution_context>
9
17
 
10
- ## Actions
11
- | Action | Description |
12
- |---|---|
13
- | `--start` | Initialize browser daemon |
14
- | `--stop` | Kill browser daemon |
15
- | `--status` | Show daemon health and active sessions |
16
- | `--session <name>` | Switch browser context |
17
- | `--import-session <name> --from <browser>` | Import cookies from host browser (chrome, arc, etc) |
18
- | `<url>` | Navigate the current page to URL |
19
- | `click <selector>` | Trigger click event |
20
- | `type <sel> <text>` | Fill input field |
21
- | `screenshot` | Capture current viewport |
18
+ <context>
19
+ Security: Daemon binds to 127.0.0.1. Sessions are gitignored.
20
+ State: Supports cookie/localStorage persistence via named sessions.
21
+ </context>
22
22
 
23
- ## Security
24
- - Daemon binds to `127.0.0.1` only.
25
- - Session files are gitignored.
26
- - Use only for debugging and visual verification.
23
+ <process>
24
+ 1. **Control Daemon**: Start, stop, or query the health/active sessions of the browser daemon.
25
+ 2. **Session Management**: Switch between browser contexts or import sessions from the host (Chrome/Arc).
26
+ 3. **Navigate & Interact**: Load URLs, click selectors, and type text into input fields.
27
+ 4. **Verify**: Capture screenshots of the current viewport for visual confirmation.
28
+ </process>
@@ -1,18 +1,32 @@
1
- Archive a completed milestone, generate a release report, and prepare the next
2
- milestone. Usage: `/mindforge:complete-milestone <name> <version>`
1
+ ---
2
+ name: mindforge:complete-milestone
3
+ description: Archive a completed milestone and prepare the next version
4
+ argument-hint: <name> <version>
5
+ allowed-tools:
6
+ - list_dir
7
+ - view_file
8
+ - write_to_file
9
+ - run_command
10
+ ---
3
11
 
4
- ## Step 1 — Validate milestone completion
5
- Ensure every included phase is verified and has no pending blocking approvals.
12
+ <objective>
13
+ Finalize a project milestone by summarizing shipped value, archiving phase artifacts, and preparing the environment for the next development cycle.
14
+ </objective>
6
15
 
7
- ## Step 2 — Generate milestone report
8
- Summarise shipped phases, notable changes, risks, approvals, and unresolved
9
- follow-ups.
16
+ <execution_context>
17
+ .claude/commands/mindforge/complete-milestone.md
18
+ </execution_context>
10
19
 
11
- ## Step 3 — Archive milestone artifacts
12
- Archive only the phases included in the milestone, not the entire
13
- `.planning/phases/` directory. Preserve history in the archive while keeping
14
- active planning files available in place.
20
+ <context>
21
+ Validation: Ensures all included phases are verified and have no pending approvals.
22
+ Storage: Moves phase files to a milestone-specific archive.
23
+ </context>
15
24
 
16
- ## Step 4 — Release metadata
17
- Create the release tag, update `STATE.md` with milestone summary, and mark the
18
- project ready for the next version.
25
+ <process>
26
+ 1. **Validate**: Confirm every phase in the milestone is signed off and verified.
27
+ 2. **Summarize**: Generate a MILESTONE-REPORT with shipped functionality, risks, and follow-ups.
28
+ 3. **Archive**: Move only the phase directories included in the milestone from `.planning/phases/` to a persistent milestone archive.
29
+ 4. **Tag**: Create a git release tag for the milestone.
30
+ 5. **State Reset**: Update `STATE.md` to reflect the milestone completion and target the next version.
31
+ 6. **Audit**: Log `milestone_completed` event.
32
+ </process>
@@ -1,11 +1,28 @@
1
- # MindForge v2 — Costs Command
2
- # Usage: /mindforge:costs [--phase N] [--session ID] [--window 7d]
1
+ ---
2
+ name: mindforge:costs
3
+ description: Real-time cost tracking for AI model usage
4
+ argument-hint: [--phase N] [--session ID] [--window 7d]
5
+ allowed-tools:
6
+ - view_file
7
+ - run_command
8
+ ---
3
9
 
4
- ## Purpose
5
- Real-time cost tracking for all AI model usage.
6
- Enforce daily budgets and see per-model spend.
10
+ <objective>
11
+ Monitor and control project expenses related to AI model usage, enforcing budget guardrails and providing granular spend analysis.
12
+ </objective>
7
13
 
8
- ## Metrics
9
- - Total spend: $X.XX
10
- - Daily limit usage: XX%
11
- - Per-model breakdown (Tokens/Cost)
14
+ <execution_context>
15
+ .claude/commands/mindforge/costs.md
16
+ </execution_context>
17
+
18
+ <context>
19
+ Metrics: Total spend, daily limit usage, per-model breakdown.
20
+ Sources: AUDIT.jsonl and local token logs.
21
+ </context>
22
+
23
+ <process>
24
+ 1. **Gather Usage Data**: Parse logs for the specified phase, session, or time window.
25
+ 2. **Calculate Spend**: Apply pricing models to the detected token counts per model.
26
+ 3. **Enforce Budgets**: Compare current spend against configured daily and project limits.
27
+ 4. **Display Report**: Present the total spend, the daily limit usage as a percentage, and the per-model breakdown.
28
+ </process>
@@ -1,17 +1,31 @@
1
- # MindForge v2 — Cross-Review Command
2
- # Usage: /mindforge:cross-review [--phase N] [--models list] [--focus area]
1
+ ---
2
+ name: mindforge:cross-review
3
+ description: Get code reviewed by multiple AI models simultaneously for consensus validation
4
+ argument-hint: [--phase N] [--models list] [--focus area]
5
+ allowed-tools:
6
+ - run_command
7
+ - view_file
8
+ - write_to_file
9
+ ---
3
10
 
4
- ## Purpose
5
- Get the same code diff reviewed by multiple AI models simultaneously.
6
- Claude finds what Claude finds. GPT-4o finds what GPT-4o finds.
7
- Consensus findings = high confidence issues.
11
+ <objective>
12
+ Increase review confidence by aggregating findings from multiple diverse AI models, identifying consensus issues and providing a multi-perspective quality assessment.
13
+ </objective>
8
14
 
9
- ## Round 1: Primary (Claude)
10
- Senior architect review.
15
+ <execution_context>
16
+ .claude/commands/mindforge/cross-review.md
17
+ </execution_context>
11
18
 
12
- ## Round 2: Adversarial (GPT-4o)
13
- Critical security and edge case review.
19
+ <context>
20
+ Models: Claude (Primary/Architectural), GPT-4o (Adversarial/Security).
21
+ Focus: Specific area like "security", "performance", or "consistency".
22
+ Pre-check: Models must be available via existing API integrations.
23
+ </context>
14
24
 
15
- ## Synthesis
16
- Consensus detector filters findings.
17
- Verdict is gating for `/mindforge:ship`.
25
+ <process>
26
+ 1. **Round 1 (Primary)**: Execute architectural review using the primary model.
27
+ 2. **Round 2 (Adversarial)**: Execute security-focused review using the secondary model.
28
+ 3. **Synthesis**: Compare findings from both rounds. Identify consensus "high confidence" issues.
29
+ 4. **Final Verdict**: Issue a final verdict that gates `/mindforge:ship`.
30
+ 5. **Log**: Record the multi-model review results in the audit trail.
31
+ </process>
@@ -1,98 +1,35 @@
1
- # MindForge v2 — Dashboard Command
2
- # Usage: /mindforge:dashboard [--port 7339] [--open] [--stop] [--status]
3
- # Version: v2.0.0-alpha.5
4
-
5
- ## Purpose
6
- Start the MindForge real-time web dashboard — a live observability UI for the
7
- entire team. Shows execution progress, quality metrics, pending approvals,
8
- knowledge graph, and team activity without requiring CLI access.
9
-
10
- ## Design
11
- The dashboard is a localhost-only web server:
12
- - No build step — single HTML file, no bundler, no npm packages on client
13
- - No authentication — binding to 127.0.0.1 is the security model
14
- - Live updates via Server-Sent Events — no WebSocket library needed
15
- - Designed for screensharing at standups, not external access
16
-
17
- ## Usage
18
-
19
- ### Start the dashboard
20
- ```
21
- /mindforge:dashboard
22
- Dashboard running at: http://localhost:7339
23
- Press CTRL+C to stop (or /mindforge:dashboard --stop)
24
- ```
25
-
26
- ### Start and open in browser
27
- ```
28
- /mindforge:dashboard --open
29
- Opens http://localhost:7339 in your default browser
30
- ```
31
-
32
- ### Custom port
33
- ```
34
- /mindforge:dashboard --port 7340
35
- → Useful if 7339 is already in use
36
- ```
37
-
38
- ### Stop the dashboard
39
- ```
40
- /mindforge:dashboard --stop
41
- → Finds the running dashboard process (from PID file) and sends SIGTERM
42
- ```
43
-
44
- ### Check dashboard status
45
- ```
46
- /mindforge:dashboard --status
47
- → Checks if dashboard is running, shows port and PID
48
- → Also shows: http://localhost:7339/api/status
49
- ```
50
-
51
- ## Dashboard pages
52
-
53
- ### Activity (default)
54
- - Phase name, auto mode status (RUNNING/PAUSED/ESCALATED/IDLE)
55
- - Wave progress bar (tasks completed / total)
56
- - Live AUDIT event feed with color-coded event types
57
- - Steering input: send guidance to auto mode without touching the CLI
58
-
59
- ### Quality Metrics
60
- - Session quality score trend (last 20 sessions)
61
- - Verify pass rate over time
62
- - Security findings by severity (CRITICAL/HIGH/MEDIUM/LOW)
63
- - Cost per session trend
64
-
65
- ### Approvals
66
- - All pending Tier 2/3 governance requests
67
- - [Approve] and [Reject] buttons — no CLI needed for approval
68
- - Tier, phase/plan, description, time since requested, expiry warning
69
- - Recent approval history
70
-
71
- ### Knowledge
72
- - Search the knowledge graph from the browser
73
- - Entries filtered by confidence, type, tags
74
- - Color-coded by knowledge type
75
-
76
- ### Team
77
- - Active developers (by git email, from AUDIT.jsonl)
78
- - What each person is working on (last task)
79
- - File conflict warnings (two developers recently touching the same file)
80
-
81
- ## Security rules
82
- 1. Never expose the dashboard on 0.0.0.0 — localhost only
83
- 2. Never forward the port externally (no ngrok, no port forwarding)
84
- 3. For remote team visibility: screenshare your browser instead
85
- 4. The dashboard shows project details including code patterns and decisions
86
-
87
- ## Integration with auto mode
88
- When `/mindforge:auto` is running and the dashboard is open:
89
- - Activity feed updates live as tasks complete
90
- - Wave progress bar advances in real-time
91
- - Any escalations appear immediately with red indicator
92
- - The Steering input is active — inject guidance without a second terminal
93
-
94
- ## AUDIT entry
95
- ```json
96
- { "event": "dashboard_started", "port": 7339, "pid": 12345 }
97
- { "event": "dashboard_stopped", "pid": 12345 }
98
- ```
1
+ ---
2
+ name: mindforge:dashboard
3
+ description: Start the MindForge real-time web dashboard
4
+ argument-hint: [--port N] [--open] [--stop] [--status]
5
+ allowed-tools:
6
+ - run_command
7
+ - list_dir
8
+ - view_file
9
+ - open_browser_url
10
+ ---
11
+
12
+ <objective>
13
+ Provide a real-time web-based observability interface for the project, allowing the team to monitor execution progress, quality metrics, pending approvals, and team activity.
14
+ </objective>
15
+
16
+ <execution_context>
17
+ .claude/commands/mindforge/dashboard.md
18
+ </execution_context>
19
+
20
+ <context>
21
+ Port: Default 7339 (configurable via --port).
22
+ Security: Binding to 127.0.0.1 (local only).
23
+ Features: Server-Sent Events for live updates, no-auth by design.
24
+ </context>
25
+
26
+ <process>
27
+ 1. **Handle Flags**:
28
+ - If `--stop`: Find the PID from the PID file and terminate the process.
29
+ - If `--status`: Check if the dashboard is running and report the URL/PID.
30
+ - Default: Start the server.
31
+ 2. **Start Server**: Execute the dashboard binary/script on the specified port.
32
+ 3. **Open Browser**: If `--open` is provided, trigger the default system browser to the dashboard URL.
33
+ 4. **Monitor**: Listen for steering inputs from the dashboard and route them to the active MindForge session.
34
+ 5. **Log**: Record `dashboard_started` or `dashboard_stopped` in the audit log.
35
+ </process>
@@ -1,126 +1,34 @@
1
- # MindForge — Debug Command
2
- # Usage: /mindforge:debug [description]
3
-
4
- Systematic debugging using the Debug Specialist persona with full RCA protocol.
5
-
6
- ## Activation
7
-
8
- Load `.mindforge/personas/debug-specialist.md` immediately.
9
- This command runs entirely in that persona for its full duration.
10
-
11
- ## Step 1 — Intake
12
-
13
- Ask the user:
14
- 1. "Describe the problem. What is happening vs. what should happen?"
15
- 2. "Can you reproduce it reliably? If yes: what are the exact steps?"
16
- 3. "When did this start? Was it working before? What changed?"
17
- 4. "Do you have an error message or stack trace? Paste it here."
18
-
19
- Capture all answers before proceeding.
20
-
21
- ## Step 2 — Triage
22
-
23
- Classify the issue immediately:
24
- - **Regression** (was working, now broken) → check recent commits
25
- - **Never worked** (new feature failing) → check the plan and verify step
26
- - **Environment issue** (works locally, fails in CI) → check environment diffs
27
- - **Data issue** (specific data causes failure) → check data shape assumptions
28
- - **Integration issue** (fails when calling external service) → check contracts
29
-
30
- Report classification to user: "This looks like a [type] issue. Here's my approach..."
31
-
32
- ## Step 3 — Follow Debug Specialist protocol
33
-
34
- Execute the full protocol from `debug-specialist.md`:
35
- 1. Reproduce
36
- 2. Isolate
37
- 3. Read the error
38
- 4. Check recent changes
39
- 5. Instrument
40
- 6. Form hypothesis
41
- 7. Test hypothesis (write a failing test)
42
- 8. Fix
43
- 9. Verify (test from step 7 now passes, no regressions)
44
- 10. Document
45
-
46
- At each step, report what was found before moving to the next step.
47
- Do not skip steps or combine them.
48
-
49
- ## Step 3b — Full test suite verification (mandatory)
50
- After the fix and targeted verify pass, run the project's full test suite.
51
- Do not mark the debug task complete if any tests fail.
52
-
53
- ## Step 4 — Check recent git history
54
-
55
- ```bash
56
- git log --oneline -20
57
- git diff HEAD~[N] HEAD -- [suspected file]
58
- ```
59
-
60
- If a recent commit is the likely cause, show the user the specific diff.
61
-
62
- ## Step 5 — Write the RCA report
63
-
64
- Create `.planning/phases/[current-phase]/DEBUG-[timestamp].md`:
65
-
66
- ```markdown
67
- # Debug Report — [short description]
68
-
69
- ## Date
70
- [ISO-8601]
71
-
72
- ## Problem
73
- [User's description + what was verified during debugging]
74
-
75
- ## Root cause category
76
- [Logic error / Data error / Integration error / Concurrency error /
77
- Configuration error / Dependency error]
78
-
79
- ## Root cause
80
- [Precise description of what the actual cause was]
81
-
82
- ## Evidence
83
- - [How the root cause was confirmed]
84
- - [Failing test that proved the bug: file:line]
85
-
86
- ## Fix applied
87
- - File: [path]
88
- - Change: [description]
89
- - Commit: [SHA]
90
-
91
- ## Regression test
92
- [Test written to prevent this from recurring: file:line]
93
-
94
- ## Prevention
95
- [What should change in process/code to prevent this class of bug]
96
- ```
97
-
98
- ## Step 6 — Write AUDIT entry
99
-
100
- ```json
101
- {
102
- "id": "uuid",
103
- "timestamp": "ISO-8601",
104
- "event": "debug_completed",
105
- "agent": "mindforge-debug-specialist",
106
- "phase": [current phase or null],
107
- "session_id": "sess_abc",
108
- "issue_type": "regression",
109
- "root_cause_category": "Logic error",
110
- "root_cause_summary": "[one sentence]",
111
- "commit_sha": "[fix commit sha]",
112
- "regression_test_added": true,
113
- "report_path": ".planning/phases/[N]/DEBUG-[timestamp].md"
114
- }
115
- ```
116
-
117
- ## When the bug cannot be reproduced
118
-
119
- Ask:
120
- 1. "Does it happen every time or intermittently?"
121
- 2. "Does it happen in specific environments only? (dev/staging/prod)"
122
- 3. "Does it happen for specific users or all users?"
123
-
124
- If intermittent: focus on concurrency, caching, and race conditions.
125
- Write a monitoring/logging plan to catch the next occurrence.
126
- Document the inconclusive investigation in the DEBUG report with evidence gathered.
1
+ ---
2
+ name: mindforge:debug
3
+ description: Perform systematic debugging using the RCA protocol
4
+ argument-hint: [description]
5
+ allowed-tools:
6
+ - run_command
7
+ - view_file
8
+ - write_to_file
9
+ - list_dir
10
+ ---
11
+
12
+ <objective>
13
+ Resolve complex software defects by following a rigorous Root Cause Analysis (RCA) protocol, including reproduction, isolation, instrumentation, and regression testing.
14
+ </objective>
15
+
16
+ <execution_context>
17
+ .claude/commands/mindforge/debug.md
18
+ </execution_context>
19
+
20
+ <context>
21
+ Persona: debug-specialist.md
22
+ Lifecycle: Triage -> Reproduce -> Hypothesis -> Fix -> Verify.
23
+ Artifact: .planning/phases/[N]/DEBUG-[timestamp].md
24
+ </context>
25
+
26
+ <process>
27
+ 1. **Intake**: Gather symptoms, reproduction steps, working history, and error logs.
28
+ 2. **Triage**: Classify as Regression, Never Worked, Environment, Data, or Integration issue.
29
+ 3. **Isolate**: Use git history and breadcrumb logging to identify the failure point.
30
+ 4. **Reproduce**: Write a failing test case that proves the bug.
31
+ 5. **Fix**: Implement the minimum necessary change to resolve the issue.
32
+ 6. **Verify**: Ensure the new test passes and run the full project test suite to detect regressions.
33
+ 7. **Document**: Write the `DEBUG-[timestamp].md` RCA report and log the event in `AUDIT.jsonl`.
34
+ </process>