opencode-multiagent 0.2.0 → 0.3.0-next.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (153)
  1. package/AGENTS.md +62 -0
  2. package/CHANGELOG.md +18 -0
  3. package/CONTRIBUTING.md +36 -0
  4. package/README.md +41 -165
  5. package/README.tr.md +84 -0
  6. package/RELEASE.md +68 -0
  7. package/agents/advisor.md +9 -6
  8. package/agents/auditor.md +8 -6
  9. package/agents/critic.md +19 -10
  10. package/agents/deep-worker.md +11 -7
  11. package/agents/devil.md +3 -1
  12. package/agents/executor.md +20 -19
  13. package/agents/heavy-worker.md +11 -7
  14. package/agents/lead.md +22 -30
  15. package/agents/librarian.md +6 -2
  16. package/agents/planner.md +18 -10
  17. package/agents/qa.md +9 -6
  18. package/agents/quick.md +12 -7
  19. package/agents/reviewer.md +9 -6
  20. package/agents/scout.md +9 -5
  21. package/agents/scribe.md +33 -28
  22. package/agents/strategist.md +10 -7
  23. package/agents/ui-heavy-worker.md +11 -7
  24. package/agents/ui-worker.md +12 -7
  25. package/agents/validator.md +8 -5
  26. package/agents/worker.md +12 -7
  27. package/commands/execute.md +1 -0
  28. package/commands/init-deep.md +1 -0
  29. package/commands/init.md +1 -0
  30. package/commands/inspect.md +1 -0
  31. package/commands/plan.md +1 -0
  32. package/commands/quality.md +1 -0
  33. package/commands/review.md +1 -0
  34. package/commands/status.md +1 -0
  35. package/defaults/opencode-multiagent.json +223 -0
  36. package/defaults/opencode-multiagent.schema.json +249 -0
  37. package/dist/control-plane.d.ts +4 -0
  38. package/dist/control-plane.d.ts.map +1 -0
  39. package/dist/index.d.ts +5 -0
  40. package/dist/index.d.ts.map +1 -0
  41. package/dist/index.js +1583 -0
  42. package/dist/opencode-multiagent/compiler.d.ts +19 -0
  43. package/dist/opencode-multiagent/compiler.d.ts.map +1 -0
  44. package/dist/opencode-multiagent/constants.d.ts +116 -0
  45. package/dist/opencode-multiagent/constants.d.ts.map +1 -0
  46. package/dist/opencode-multiagent/defaults.d.ts +10 -0
  47. package/dist/opencode-multiagent/defaults.d.ts.map +1 -0
  48. package/dist/opencode-multiagent/file-lock.d.ts +15 -0
  49. package/dist/opencode-multiagent/file-lock.d.ts.map +1 -0
  50. package/dist/opencode-multiagent/hooks.d.ts +62 -0
  51. package/dist/opencode-multiagent/hooks.d.ts.map +1 -0
  52. package/dist/opencode-multiagent/log.d.ts +2 -0
  53. package/dist/opencode-multiagent/log.d.ts.map +1 -0
  54. package/dist/opencode-multiagent/markdown.d.ts +8 -0
  55. package/dist/opencode-multiagent/markdown.d.ts.map +1 -0
  56. package/dist/opencode-multiagent/mcp.d.ts +3 -0
  57. package/dist/opencode-multiagent/mcp.d.ts.map +1 -0
  58. package/dist/opencode-multiagent/policy.d.ts +5 -0
  59. package/dist/opencode-multiagent/policy.d.ts.map +1 -0
  60. package/dist/opencode-multiagent/quality.d.ts +14 -0
  61. package/dist/opencode-multiagent/quality.d.ts.map +1 -0
  62. package/dist/opencode-multiagent/runtime.d.ts +7 -0
  63. package/dist/opencode-multiagent/runtime.d.ts.map +1 -0
  64. package/dist/opencode-multiagent/session-tracker.d.ts +32 -0
  65. package/dist/opencode-multiagent/session-tracker.d.ts.map +1 -0
  66. package/dist/opencode-multiagent/skills.d.ts +17 -0
  67. package/dist/opencode-multiagent/skills.d.ts.map +1 -0
  68. package/dist/opencode-multiagent/supervision.d.ts +12 -0
  69. package/dist/opencode-multiagent/supervision.d.ts.map +1 -0
  70. package/dist/opencode-multiagent/task-manager.d.ts +48 -0
  71. package/dist/opencode-multiagent/task-manager.d.ts.map +1 -0
  72. package/dist/opencode-multiagent/telemetry.d.ts +26 -0
  73. package/dist/opencode-multiagent/telemetry.d.ts.map +1 -0
  74. package/dist/opencode-multiagent/tools.d.ts +56 -0
  75. package/dist/opencode-multiagent/tools.d.ts.map +1 -0
  76. package/dist/opencode-multiagent/types.d.ts +36 -0
  77. package/dist/opencode-multiagent/types.d.ts.map +1 -0
  78. package/dist/opencode-multiagent/utils.d.ts +9 -0
  79. package/dist/opencode-multiagent/utils.d.ts.map +1 -0
  80. package/docs/agents.md +260 -0
  81. package/docs/agents.tr.md +260 -0
  82. package/docs/configuration.md +255 -0
  83. package/docs/configuration.tr.md +255 -0
  84. package/docs/usage-guide.md +226 -0
  85. package/docs/usage-guide.tr.md +227 -0
  86. package/examples/opencode.with-overrides.json +1 -5
  87. package/package.json +23 -13
  88. package/skills/advanced-evaluation/SKILL.md +37 -21
  89. package/skills/advanced-evaluation/manifest.json +2 -13
  90. package/skills/cek-context-engineering/SKILL.md +159 -87
  91. package/skills/cek-context-engineering/manifest.json +1 -3
  92. package/skills/cek-prompt-engineering/SKILL.md +13 -10
  93. package/skills/cek-prompt-engineering/manifest.json +1 -3
  94. package/skills/cek-test-prompt/SKILL.md +38 -28
  95. package/skills/cek-test-prompt/manifest.json +1 -3
  96. package/skills/cek-thought-based-reasoning/SKILL.md +75 -21
  97. package/skills/cek-thought-based-reasoning/manifest.json +1 -3
  98. package/skills/context-degradation/SKILL.md +14 -13
  99. package/skills/context-degradation/manifest.json +1 -3
  100. package/skills/debate/SKILL.md +23 -78
  101. package/skills/debate/manifest.json +2 -12
  102. package/skills/design-first/manifest.json +2 -13
  103. package/skills/dispatching-parallel-agents/SKILL.md +14 -3
  104. package/skills/dispatching-parallel-agents/manifest.json +1 -4
  105. package/skills/drift-analysis/SKILL.md +50 -29
  106. package/skills/drift-analysis/manifest.json +2 -12
  107. package/skills/evaluation/manifest.json +2 -12
  108. package/skills/executing-plans/SKILL.md +15 -8
  109. package/skills/executing-plans/manifest.json +1 -3
  110. package/skills/handoff-protocols/manifest.json +2 -12
  111. package/skills/parallel-investigation/SKILL.md +25 -12
  112. package/skills/parallel-investigation/manifest.json +1 -4
  113. package/skills/reflexion-critique/SKILL.md +21 -10
  114. package/skills/reflexion-critique/manifest.json +1 -3
  115. package/skills/reflexion-reflect/SKILL.md +36 -34
  116. package/skills/reflexion-reflect/manifest.json +2 -10
  117. package/skills/root-cause-analysis/manifest.json +2 -13
  118. package/skills/sadd-judge-with-debate/SKILL.md +50 -26
  119. package/skills/sadd-judge-with-debate/manifest.json +1 -3
  120. package/skills/structured-code-review/manifest.json +2 -11
  121. package/skills/task-decomposition/manifest.json +2 -13
  122. package/skills/verification-before-completion/manifest.json +2 -15
  123. package/skills/verification-gates/SKILL.md +27 -19
  124. package/skills/verification-gates/manifest.json +2 -12
  125. package/defaults/agent-settings.json +0 -102
  126. package/defaults/agent-settings.schema.json +0 -25
  127. package/defaults/flags.json +0 -35
  128. package/defaults/flags.schema.json +0 -119
  129. package/defaults/mcp-defaults.json +0 -47
  130. package/defaults/mcp-defaults.schema.json +0 -38
  131. package/defaults/profiles.json +0 -53
  132. package/defaults/profiles.schema.json +0 -60
  133. package/defaults/team-profiles.json +0 -83
  134. package/src/control-plane.ts +0 -21
  135. package/src/index.ts +0 -8
  136. package/src/opencode-multiagent/compiler.ts +0 -168
  137. package/src/opencode-multiagent/constants.ts +0 -178
  138. package/src/opencode-multiagent/file-lock.ts +0 -90
  139. package/src/opencode-multiagent/hooks.ts +0 -599
  140. package/src/opencode-multiagent/log.ts +0 -12
  141. package/src/opencode-multiagent/mailbox.ts +0 -287
  142. package/src/opencode-multiagent/markdown.ts +0 -99
  143. package/src/opencode-multiagent/mcp.ts +0 -35
  144. package/src/opencode-multiagent/policy.ts +0 -67
  145. package/src/opencode-multiagent/quality.ts +0 -140
  146. package/src/opencode-multiagent/runtime.ts +0 -55
  147. package/src/opencode-multiagent/skills.ts +0 -144
  148. package/src/opencode-multiagent/supervision.ts +0 -156
  149. package/src/opencode-multiagent/task-manager.ts +0 -148
  150. package/src/opencode-multiagent/team-manager.ts +0 -219
  151. package/src/opencode-multiagent/team-tools.ts +0 -359
  152. package/src/opencode-multiagent/telemetry.ts +0 -124
  153. package/src/opencode-multiagent/utils.ts +0 -54
@@ -2,18 +2,8 @@
2
2
  "name": "handoff-protocols",
3
3
  "version": "1.0.0",
4
4
  "description": "Guidance for safe multi-agent or multi-step handoffs",
5
- "triggers": [
6
- "handoff",
7
- "transfer",
8
- "transition",
9
- "pass to",
10
- "onboard"
11
- ],
12
- "applicable_agents": [
13
- "executor",
14
- "planner",
15
- "worker"
16
- ],
5
+ "triggers": ["handoff", "transfer", "transition", "pass to", "onboard"],
6
+ "applicable_agents": ["executor", "planner"],
17
7
  "max_context_tokens": 1500,
18
8
  "entry_file": "SKILL.md"
19
9
  }
@@ -16,8 +16,8 @@ tags:
16
16
  difficulty: advanced
17
17
  estimatedTime: 15
18
18
  relatedSkills:
19
- - debugging/root-cause-analysis
20
- - collaboration/handoff-protocols
19
+ - root-cause-analysis
20
+ - handoff-protocols
21
21
  ---
22
22
 
23
23
  # Parallel Investigation
@@ -58,13 +58,15 @@ Assign threads with clear ownership:
58
58
 
59
59
  ```markdown
60
60
  ## Thread A: Database Performance
61
+
61
62
  **Investigator:** [Name/Agent A]
62
63
  **Duration:** 30 minutes
63
64
  **Scope:**
65
+
64
66
  - Query execution times
65
67
  - Index utilization
66
68
  - Connection pool metrics
67
- **Report Format:** Summary + evidence
69
+ **Report Format:** Summary + evidence
68
70
  ```
69
71
 
70
72
  ### Phase 3: Parallel Execution
@@ -77,17 +79,22 @@ Each thread follows this pattern:
77
79
  4. Prepare summary for sync point
78
80
 
79
81
  **Thread Log Template:**
82
+
80
83
  ```markdown
81
84
  ## Thread: [Name]
85
+
82
86
  **Start:** [Time]
83
87
 
84
88
  ### Findings
89
+
85
90
  - [Timestamp] [Finding]
86
91
 
87
92
  ### Evidence
93
+
88
94
  - [Log/Metric/Screenshot]
89
95
 
90
96
  ### Preliminary Conclusion
97
+
91
98
  [What this thread suggests about the problem]
92
99
  ```
93
100
 
@@ -103,6 +110,7 @@ Sync Point Agenda:
103
110
  ```
104
111
 
105
112
  **Sync Point Decisions:**
113
+
106
114
  - **Continue**: Threads are progressing, maintain parallel execution
107
115
  - **Pivot**: Redirect threads based on new evidence
108
116
  - **Converge**: One thread found the answer, others join to validate
@@ -146,13 +154,13 @@ When a thread identifies the likely cause:
146
154
 
147
155
  ## Decision Framework
148
156
 
149
- | Thread Status | Action |
150
- |---------------|--------|
151
- | All exploring | Continue parallel |
152
- | One hot lead | Validate lead, others support |
153
- | Multiple leads | Prioritize by evidence strength |
154
- | All dead ends | Reframe problem, new threads |
155
- | Confirmed cause | Converge, begin fix |
157
+ | Thread Status | Action |
158
+ | --------------- | ------------------------------- |
159
+ | All exploring | Continue parallel |
160
+ | One hot lead | Validate lead, others support |
161
+ | Multiple leads | Prioritize by evidence strength |
162
+ | All dead ends | Reframe problem, new threads |
163
+ | Confirmed cause | Converge, begin fix |
156
164
 
157
165
  ## Time Management
158
166
 
@@ -176,31 +184,36 @@ Adjust sync point cadence based on incident severity — every 20 minutes for cr
176
184
  # Investigation: [Problem]
177
185
 
178
186
  ## Summary
187
+
179
188
  [Brief description and resolution]
180
189
 
181
190
  ## Threads Explored
182
191
 
183
192
  ### Thread A: [Area]
193
+
184
194
  - Investigator: [Name]
185
195
  - Findings: [Summary]
186
196
  - Outcome: [Lead / Dead End / Root Cause]
187
197
 
188
198
  ## Root Cause
199
+
189
200
  [Detailed explanation of what was found]
190
201
 
191
202
  ## Evidence
203
+
192
204
  - [Evidence 1]
193
205
  - [Evidence 2]
194
206
 
195
207
  ## Resolution
208
+
196
209
  [What was done to fix]
197
210
 
198
211
  ## Lessons Learned
212
+
199
213
  - [Learning 1]
200
214
  ```
201
215
 
202
216
  ## Integration with Other Skills
203
217
 
204
- - **debugging/root-cause-analysis**: Each thread follows RCA principles
205
- - **debugging/hypothesis-testing**: Threads test specific hypotheses
218
+ - **root-cause-analysis**: Each thread follows RCA principles
206
219
  - **handoff-protocols**: When passing a thread to another person
@@ -9,10 +9,7 @@
9
9
  "incident",
10
10
  "simultaneous debug"
11
11
  ],
12
- "applicable_agents": [
13
- "critic",
14
- "strategist"
15
- ],
12
+ "applicable_agents": ["critic", "strategist"],
16
13
  "max_context_tokens": 2200,
17
14
  "entry_file": "SKILL.md"
18
15
  }
@@ -187,7 +187,7 @@ Be objective and consider the context of the project (size, team, constraints).
187
187
 
188
188
  **Prompt for Agent:**
189
189
 
190
- ```
190
+ ````
191
191
  You are a Code Quality Reviewer assessing implementation quality and suggesting refactorings.
192
192
 
193
193
  ## Your Task
@@ -262,9 +262,9 @@ Project Conventions: {any known conventions from codebase}
262
262
  ...
263
263
 
264
264
  Provide specific, actionable feedback with code examples.
265
- ```
265
+ ````
266
266
 
267
- **Implementation Note**: Use the Task tool with subagent_type="general-purpose" to spawn these three agents in parallel, each with their respective prompt and context.
267
+ **Implementation Note**: Use the Task tool with subagent_type="general" to spawn these three agents in parallel, each with their respective prompt and context.
268
268
 
269
269
  ### Phase 3: Cross-Review & Debate
270
270
 
@@ -294,6 +294,7 @@ Compile all findings into a comprehensive, actionable report:
294
294
  # 🔍 Work Critique Report
295
295
 
296
296
  ## Executive Summary
297
+
297
298
  [2-3 sentences summarizing overall assessment]
298
299
 
299
300
  **Overall Quality Score**: X/10 (average of three judge scores)
@@ -302,11 +303,11 @@ Compile all findings into a comprehensive, actionable report:
302
303
 
303
304
  ## 📊 Judge Scores
304
305
 
305
- | Judge | Score | Key Finding |
306
- |-------|-------|-------------|
307
- | Requirements Validator | X/10 | [one-line summary] |
308
- | Solution Architect | X/10 | [one-line summary] |
309
- | Code Quality Reviewer | X/10 | [one-line summary] |
306
+ | Judge | Score | Key Finding |
307
+ | ---------------------- | ----- | ------------------ |
308
+ | Requirements Validator | X/10 | [one-line summary] |
309
+ | Solution Architect | X/10 | [one-line summary] |
310
+ | Code Quality Reviewer | X/10 | [one-line summary] |
310
311
 
311
312
  ---
312
313
 
@@ -323,6 +324,7 @@ Compile all findings into a comprehensive, actionable report:
323
324
  ## ⚠️ Issues & Gaps
324
325
 
325
326
  ### Critical Issues
327
+
326
328
  [Issues that need immediate attention]
327
329
 
328
330
  - **[Issue 1]**
@@ -332,12 +334,15 @@ Compile all findings into a comprehensive, actionable report:
332
334
  - Recommendation: [what to do]
333
335
 
334
336
  ### High Priority
337
+
335
338
  [Important but not blocking]
336
339
 
337
340
  ### Medium Priority
341
+
338
342
  [Nice to have improvements]
339
343
 
340
344
  ### Low Priority
345
+
341
346
  [Minor polish items]
342
347
 
343
348
  ---
@@ -360,6 +365,7 @@ Compile all findings into a comprehensive, actionable report:
360
365
  **Chosen Approach**: [brief description]
361
366
 
362
367
  **Alternative Approaches Considered**:
368
+
363
369
  1. [Alternative 1] - [Why chosen approach is better/worse]
364
370
  2. [Alternative 2] - [Why chosen approach is better/worse]
365
371
 
@@ -379,6 +385,7 @@ Compile all findings into a comprehensive, actionable report:
379
385
  - Before/After: [code examples]
380
386
 
381
387
  ### Medium Priority Refactorings
388
+
382
389
  [similar structure]
383
390
 
384
391
  ---
@@ -397,6 +404,7 @@ Compile all findings into a comprehensive, actionable report:
397
404
  [If applicable - where judges disagreed]
398
405
 
399
406
  **Debate 1: [Topic]**
407
+
400
408
  - Requirements Validator position: [summary]
401
409
  - Solution Architect position: [summary]
402
410
  - Resolution: [consensus reached or "reasonable disagreement"]
@@ -408,14 +416,17 @@ Compile all findings into a comprehensive, actionable report:
408
416
  Based on the critique, here are recommended next steps:
409
417
 
410
418
  **Must Do**:
419
+
411
420
  - [ ] [Critical action 1]
412
421
  - [ ] [Critical action 2]
413
422
 
414
423
  **Should Do**:
424
+
415
425
  - [ ] [High priority action 1]
416
426
  - [ ] [High priority action 2]
417
427
 
418
428
  **Could Do**:
429
+
419
430
  - [ ] [Medium priority action 1]
420
431
  - [ ] [Nice to have action 2]
421
432
 
@@ -438,8 +449,8 @@ Based on the critique, here are recommended next steps:
438
449
 
439
450
  ---
440
451
 
441
- *Generated using Multi-Agent Debate + LLM-as-a-Judge pattern*
442
- *Review Date: [timestamp]*
452
+ _Generated using Multi-Agent Debate + LLM-as-a-Judge pattern_
453
+ _Review Date: [timestamp]_
443
454
  ```
444
455
 
445
456
  ## Important Guidelines
@@ -9,9 +9,7 @@
9
9
  "judge with debate",
10
10
  "consensus"
11
11
  ],
12
- "applicable_agents": [
13
- "critic"
14
- ],
12
+ "applicable_agents": ["critic"],
15
13
  "max_context_tokens": 2400,
16
14
  "entry_file": "SKILL.md"
17
15
  }
@@ -1,12 +1,12 @@
1
1
  ---
2
2
  name: reflexion-reflect
3
- description: Reflect on previus response and output, based on Self-refinement framework for iterative improvement with complexity triage and verification
3
+ description: Reflect on previous response and output, based on Self-refinement framework for iterative improvement with complexity triage and verification
4
4
  argument-hint: Optional focus area or confidence threshold to use, for example "security" or "deep reflect if less than 90% confidence"
5
5
  ---
6
6
 
7
7
  # Self-Refinement and Iterative Improvement Framework
8
8
 
9
- Reflect on previus response and output.
9
+ Reflect on previous response and output.
10
10
 
11
11
  ## Your Identity (NON-NEGOTIABLE)
12
12
 
@@ -82,15 +82,13 @@ Before proceeding, evaluate your most recent output against these criteria:
82
82
  - [ ] Are there edge cases that haven't been considered?
83
83
  - [ ] Could there be unintended side effects?
84
84
 
85
- 4. **Dependency & Impact Verification**
85
+ 4. **Dependency & Impact Verification**
86
86
  - [ ] For ANY proposed addition/deletion/modification, have you checked for dependencies?
87
87
  - [ ] Have you searched for related decisions that may be superseded or supersede this?
88
88
  - [ ] Have you checked the configuration or docs (for example AUTHORITATIVE.yaml) for active evaluations or status?
89
89
  - [ ] Have you searched the ecosystem for files/processes that depend on items being changed?
90
90
  - [ ] If recommending removal of anything, have you verified nothing depends on it?
91
91
 
92
-
93
-
94
92
  **HARD RULE:** If ANY check reveals active dependencies, evaluations, or pending decisions, FLAG THIS IN THE EVALUATION. Do not approve work that recommends changes without dependency verification.
95
93
 
96
94
  5. **Fact-Checking Required**
@@ -202,7 +200,7 @@ When the output involves code, additionally evaluate:
202
200
  // utils/dateFormatter.js
203
201
  function formatDate(date) {
204
202
  const d = new Date(date);
205
- return `${d.getMonth()+1}/${d.getDate()}/${d.getFullYear()}`;
203
+ return `${d.getMonth() + 1}/${d.getDate()}/${d.getFullYear()}`;
206
204
  }
207
205
  ```
208
206
 
@@ -366,7 +364,7 @@ const formatted = format(new Date(), 'MM/dd/yyyy');
366
364
 
367
365
  1. Search for benchmark or documentation comparing both approaches
368
366
  2. Provide algorithmic analysis
369
- **Corrected Statement**: "Map performs better for large collections (10K+ items), while Object is more efficient for small sets (<100 items)"
367
+ **Corrected Statement**: "Map performs better for large collections (10K+ items), while Object is more efficient for small sets (<100 items)"
370
368
 
371
369
  ## NON-CODE OUTPUT REFLECTION
372
370
 
@@ -405,31 +403,35 @@ For documentation, explanations, and analysis outputs:
405
403
  ## Detailed Analysis
406
404
 
407
405
  ### [Criterion 1 Name] (Weight: 0.XX)
406
+
408
407
  **Practical Check**: [If applicable - what you verified with tools]
409
408
  **Analysis**: [Explain how evidence maps to rubric level]
410
409
  **Score**: X/5
411
410
  **Improvement**: [Specific suggestion if score < 5]
412
411
 
413
412
  #### Evidences
413
+
414
414
  [Specific quotes/references]
415
415
 
416
416
  ### [Criterion 2 Name] (Weight: 0.XX)
417
+
417
418
  [Repeat pattern...]
418
419
 
419
420
  ## Score Summary
420
421
 
421
- | Criterion | Score | Weight | Weighted |
422
- |-----------|-------|--------|----------|
423
- | Instruction Following | X/5 | 0.30 | X.XX |
424
- | Output Completeness | X/5 | 0.25 | X.XX |
425
- | Solution Quality | X/5 | 0.25 | X.XX |
426
- | Reasoning Quality | X/5 | 0.10 | X.XX |
427
- | Response Coherence | X/5 | 0.10 | X.XX |
428
- | **Weighted Total** | | | **X.XX/5.0** |
422
+ | Criterion | Score | Weight | Weighted |
423
+ | --------------------- | ----- | ------ | ------------ |
424
+ | Instruction Following | X/5 | 0.30 | X.XX |
425
+ | Output Completeness | X/5 | 0.25 | X.XX |
426
+ | Solution Quality | X/5 | 0.25 | X.XX |
427
+ | Reasoning Quality | X/5 | 0.10 | X.XX |
428
+ | Response Coherence | X/5 | 0.10 | X.XX |
429
+ | **Weighted Total** | | | **X.XX/5.0** |
429
430
 
430
431
  ## Self-Verification
431
432
 
432
433
  **Questions Asked**:
434
+
433
435
  1. [Question 1]
434
436
  2. [Question 2]
435
437
  3. [Question 3]
@@ -437,6 +439,7 @@ For documentation, explanations, and analysis outputs:
437
439
  5. [Question 5]
438
440
 
439
441
  **Answers**:
442
+
440
443
  1. [Answer 1]
441
444
  2. [Answer 2]
442
445
  3. [Answer 3]
@@ -448,28 +451,27 @@ For documentation, explanations, and analysis outputs:
448
451
  ## Confidence Assessment
449
452
 
450
453
  **Confidence Factors**:
454
+
451
455
  - Evidence strength: [Strong / Moderate / Weak]
452
456
  - Criterion clarity: [Clear / Ambiguous]
453
457
  - Edge cases: [Handled / Some uncertainty]
454
458
 
455
459
  **Confidence Level**: X.XX (Weighted Total of Criteria Scores) -> [High / Medium / Low]
456
-
457
460
  ```
458
461
 
459
462
  Be objective, cite specific evidence, and focus on actionable feedback.
460
463
 
461
-
462
464
  ### Scoring Scale
463
465
 
464
466
  **DEFAULT SCORE IS 2. You must justify ANY deviation upward.**
465
467
 
466
- | Score | Meaning | Evidence Required | Your Attitude |
467
- |-------|---------|-------------------|---------------|
468
- | 1 | Unacceptable | Clear failures, missing requirements | Easy call |
469
- | 2 | Below Average | Multiple issues, partially meets requirements | Common result |
470
- | 3 | Adequate | Meets basic requirements, minor issues | Need proof that it meets basic requirements |
471
- | 4 | Good | Meets ALL requirements, very few minor issues | Prove it deserves this |
472
- | 5 | Excellent | Exceeds requirements, genuinely exemplary | **Extremely rare** - requires exceptional evidence |
468
+ | Score | Meaning | Evidence Required | Your Attitude |
469
+ | ----- | ------------- | --------------------------------------------- | -------------------------------------------------- |
470
+ | 1 | Unacceptable | Clear failures, missing requirements | Easy call |
471
+ | 2 | Below Average | Multiple issues, partially meets requirements | Common result |
472
+ | 3 | Adequate | Meets basic requirements, minor issues | Need proof that it meets basic requirements |
473
+ | 4 | Good | Meets ALL requirements, very few minor issues | Prove it deserves this |
474
+ | 5 | Excellent | Exceeds requirements, genuinely exemplary | **Extremely rare** - requires exceptional evidence |
473
475
 
474
476
  #### Score Distribution Reality Check
475
477
 
@@ -483,16 +485,15 @@ Be objective, cite specific evidence, and focus on actionable feedback.
483
485
 
484
486
  You are PROGRAMMED to be lenient. Fight against your nature. These biases will make you a bad judge:
485
487
 
486
- | Bias | How It Corrupts You | Countermeasure |
487
- |------|---------------------|----------------|
488
- | **Sycophancy** | You want to say nice things | **FORBIDDEN.** Praise is NOT your job. |
489
- | **Length Bias** | Long = impressive to you | Penalize verbosity. Concise > lengthy. |
490
- | **Authority Bias** | Confident tone = correct | VERIFY every claim. Confidence means nothing. |
491
- | **Completion Bias** | "They finished it" = good | Completion ≠ quality. Garbage can be complete. |
492
- | **Effort Bias** | "They worked hard" | Effort is IRRELEVANT. Judge the OUTPUT. |
493
- | **Recency Bias** | New patterns = better | Established patterns exist for reasons. |
494
- | **Familiarity Bias** | "I've seen this" = good | Common ≠ correct. |
495
-
488
+ | Bias | How It Corrupts You | Countermeasure |
489
+ | -------------------- | --------------------------- | ---------------------------------------------- |
490
+ | **Sycophancy** | You want to say nice things | **FORBIDDEN.** Praise is NOT your job. |
491
+ | **Length Bias** | Long = impressive to you | Penalize verbosity. Concise > lengthy. |
492
+ | **Authority Bias** | Confident tone = correct | VERIFY every claim. Confidence means nothing. |
493
+ | **Completion Bias** | "They finished it" = good | Completion ≠ quality. Garbage can be complete. |
494
+ | **Effort Bias** | "They worked hard" | Effort is IRRELEVANT. Judge the OUTPUT. |
495
+ | **Recency Bias** | New patterns = better | Established patterns exist for reasons. |
496
+ | **Familiarity Bias** | "I've seen this" = good | Common ≠ correct. |
496
497
 
497
498
  ## ITERATIVE REFINEMENT WORKFLOW
498
499
 
@@ -613,6 +614,7 @@ If after reflection you identify improvements:
613
614
  Rate your confidence in the current solution using the format provided in the Report Format section.
614
615
 
615
616
  Solution Confidence is based on weighted total of criteria scores.
617
+
616
618
  - High (>4.5/5.0) - Solution is robust and well-tested
617
619
  - Medium (4.0-4.5/5.0) - Solution works but could be improved
618
620
  - Low (<4.0/5.0) - Significant improvements needed
@@ -2,16 +2,8 @@
2
2
  "name": "reflexion-reflect",
3
3
  "version": "1.0.0",
4
4
  "description": "Self-reflection workflow for iterating on previous outputs and plans",
5
- "triggers": [
6
- "reflect",
7
- "self refine",
8
- "iterate",
9
- "improve previous answer",
10
- "reflection"
11
- ],
12
- "applicable_agents": [
13
- "critic"
14
- ],
5
+ "triggers": ["reflect", "self refine", "iterate", "improve previous answer", "reflection"],
6
+ "applicable_agents": ["critic"],
15
7
  "max_context_tokens": 2400,
16
8
  "entry_file": "SKILL.md"
17
9
  }
@@ -2,19 +2,8 @@
2
2
  "name": "root-cause-analysis",
3
3
  "version": "1.0.0",
4
4
  "description": "Trace failures to the real cause before changing code",
5
- "triggers": [
6
- "debug",
7
- "error",
8
- "fix",
9
- "issue",
10
- "root cause",
11
- "investigate"
12
- ],
13
- "applicable_agents": [
14
- "worker",
15
- "heavy-worker",
16
- "deep-worker"
17
- ],
5
+ "triggers": ["debug", "error", "fix", "issue", "root cause", "investigate"],
6
+ "applicable_agents": ["deep-worker", "advisor", "librarian"],
18
7
  "max_context_tokens": 1500,
19
8
  "entry_file": "SKILL.md"
20
9
  }