agentic-swe 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (191) hide show
  1. package/.claude/agents/developer.md +133 -0
  2. package/.claude/agents/git-ops.md +94 -0
  3. package/.claude/agents/panel/adversarial.md +35 -0
  4. package/.claude/agents/panel/architect.md +36 -0
  5. package/.claude/agents/panel/security.md +36 -0
  6. package/.claude/agents/pr-manager.md +76 -0
  7. package/.claude/agents/subagents/01-core-development/api-designer.md +237 -0
  8. package/.claude/agents/subagents/01-core-development/backend-developer.md +222 -0
  9. package/.claude/agents/subagents/01-core-development/electron-pro.md +251 -0
  10. package/.claude/agents/subagents/01-core-development/frontend-developer.md +159 -0
  11. package/.claude/agents/subagents/01-core-development/fullstack-developer.md +246 -0
  12. package/.claude/agents/subagents/01-core-development/graphql-architect.md +238 -0
  13. package/.claude/agents/subagents/01-core-development/microservices-architect.md +239 -0
  14. package/.claude/agents/subagents/01-core-development/mobile-developer.md +283 -0
  15. package/.claude/agents/subagents/01-core-development/ui-designer.md +200 -0
  16. package/.claude/agents/subagents/01-core-development/websocket-engineer.md +150 -0
  17. package/.claude/agents/subagents/02-language-specialists/angular-architect.md +287 -0
  18. package/.claude/agents/subagents/02-language-specialists/cpp-pro.md +277 -0
  19. package/.claude/agents/subagents/02-language-specialists/csharp-developer.md +287 -0
  20. package/.claude/agents/subagents/02-language-specialists/django-developer.md +287 -0
  21. package/.claude/agents/subagents/02-language-specialists/dotnet-core-expert.md +287 -0
  22. package/.claude/agents/subagents/02-language-specialists/dotnet-framework-4.8-expert.md +306 -0
  23. package/.claude/agents/subagents/02-language-specialists/elixir-expert.md +311 -0
  24. package/.claude/agents/subagents/02-language-specialists/expo-react-native-expert.md +268 -0
  25. package/.claude/agents/subagents/02-language-specialists/fastapi-developer.md +287 -0
  26. package/.claude/agents/subagents/02-language-specialists/flutter-expert.md +287 -0
  27. package/.claude/agents/subagents/02-language-specialists/golang-pro.md +277 -0
  28. package/.claude/agents/subagents/02-language-specialists/java-architect.md +287 -0
  29. package/.claude/agents/subagents/02-language-specialists/javascript-pro.md +277 -0
  30. package/.claude/agents/subagents/02-language-specialists/kotlin-specialist.md +287 -0
  31. package/.claude/agents/subagents/02-language-specialists/laravel-specialist.md +287 -0
  32. package/.claude/agents/subagents/02-language-specialists/nextjs-developer.md +298 -0
  33. package/.claude/agents/subagents/02-language-specialists/php-pro.md +287 -0
  34. package/.claude/agents/subagents/02-language-specialists/powershell-5.1-expert.md +59 -0
  35. package/.claude/agents/subagents/02-language-specialists/powershell-7-expert.md +57 -0
  36. package/.claude/agents/subagents/02-language-specialists/python-pro.md +277 -0
  37. package/.claude/agents/subagents/02-language-specialists/rails-expert.md +358 -0
  38. package/.claude/agents/subagents/02-language-specialists/react-specialist.md +298 -0
  39. package/.claude/agents/subagents/02-language-specialists/rust-engineer.md +287 -0
  40. package/.claude/agents/subagents/02-language-specialists/spring-boot-engineer.md +287 -0
  41. package/.claude/agents/subagents/02-language-specialists/sql-pro.md +287 -0
  42. package/.claude/agents/subagents/02-language-specialists/swift-expert.md +287 -0
  43. package/.claude/agents/subagents/02-language-specialists/symfony-specialist.md +354 -0
  44. package/.claude/agents/subagents/02-language-specialists/typescript-pro.md +277 -0
  45. package/.claude/agents/subagents/02-language-specialists/vue-expert.md +298 -0
  46. package/.claude/agents/subagents/03-infrastructure/azure-infra-engineer.md +53 -0
  47. package/.claude/agents/subagents/03-infrastructure/cloud-architect.md +277 -0
  48. package/.claude/agents/subagents/03-infrastructure/database-administrator.md +287 -0
  49. package/.claude/agents/subagents/03-infrastructure/deployment-engineer.md +287 -0
  50. package/.claude/agents/subagents/03-infrastructure/devops-engineer.md +287 -0
  51. package/.claude/agents/subagents/03-infrastructure/devops-incident-responder.md +287 -0
  52. package/.claude/agents/subagents/03-infrastructure/docker-expert.md +278 -0
  53. package/.claude/agents/subagents/03-infrastructure/incident-responder.md +287 -0
  54. package/.claude/agents/subagents/03-infrastructure/kubernetes-specialist.md +287 -0
  55. package/.claude/agents/subagents/03-infrastructure/network-engineer.md +287 -0
  56. package/.claude/agents/subagents/03-infrastructure/platform-engineer.md +287 -0
  57. package/.claude/agents/subagents/03-infrastructure/security-engineer.md +277 -0
  58. package/.claude/agents/subagents/03-infrastructure/sre-engineer.md +287 -0
  59. package/.claude/agents/subagents/03-infrastructure/terraform-engineer.md +287 -0
  60. package/.claude/agents/subagents/03-infrastructure/terragrunt-expert.md +307 -0
  61. package/.claude/agents/subagents/03-infrastructure/windows-infra-admin.md +52 -0
  62. package/.claude/agents/subagents/04-quality-security/accessibility-tester.md +277 -0
  63. package/.claude/agents/subagents/04-quality-security/ad-security-reviewer.md +56 -0
  64. package/.claude/agents/subagents/04-quality-security/architect-reviewer.md +287 -0
  65. package/.claude/agents/subagents/04-quality-security/chaos-engineer.md +277 -0
  66. package/.claude/agents/subagents/04-quality-security/code-reviewer.md +287 -0
  67. package/.claude/agents/subagents/04-quality-security/compliance-auditor.md +277 -0
  68. package/.claude/agents/subagents/04-quality-security/debugger.md +287 -0
  69. package/.claude/agents/subagents/04-quality-security/error-detective.md +287 -0
  70. package/.claude/agents/subagents/04-quality-security/penetration-tester.md +287 -0
  71. package/.claude/agents/subagents/04-quality-security/performance-engineer.md +287 -0
  72. package/.claude/agents/subagents/04-quality-security/powershell-security-hardening.md +54 -0
  73. package/.claude/agents/subagents/04-quality-security/qa-expert.md +287 -0
  74. package/.claude/agents/subagents/04-quality-security/security-auditor.md +287 -0
  75. package/.claude/agents/subagents/04-quality-security/test-automator.md +287 -0
  76. package/.claude/agents/subagents/05-data-ai/ai-engineer.md +287 -0
  77. package/.claude/agents/subagents/05-data-ai/data-analyst.md +277 -0
  78. package/.claude/agents/subagents/05-data-ai/data-engineer.md +287 -0
  79. package/.claude/agents/subagents/05-data-ai/data-scientist.md +287 -0
  80. package/.claude/agents/subagents/05-data-ai/database-optimizer.md +287 -0
  81. package/.claude/agents/subagents/05-data-ai/llm-architect.md +287 -0
  82. package/.claude/agents/subagents/05-data-ai/machine-learning-engineer.md +277 -0
  83. package/.claude/agents/subagents/05-data-ai/ml-engineer.md +287 -0
  84. package/.claude/agents/subagents/05-data-ai/mlops-engineer.md +287 -0
  85. package/.claude/agents/subagents/05-data-ai/nlp-engineer.md +287 -0
  86. package/.claude/agents/subagents/05-data-ai/postgres-pro.md +287 -0
  87. package/.claude/agents/subagents/05-data-ai/prompt-engineer.md +287 -0
  88. package/.claude/agents/subagents/05-data-ai/reinforcement-learning-engineer.md +277 -0
  89. package/.claude/agents/subagents/06-developer-experience/build-engineer.md +286 -0
  90. package/.claude/agents/subagents/06-developer-experience/cli-developer.md +286 -0
  91. package/.claude/agents/subagents/06-developer-experience/dependency-manager.md +286 -0
  92. package/.claude/agents/subagents/06-developer-experience/documentation-engineer.md +276 -0
  93. package/.claude/agents/subagents/06-developer-experience/dx-optimizer.md +286 -0
  94. package/.claude/agents/subagents/06-developer-experience/git-workflow-manager.md +286 -0
  95. package/.claude/agents/subagents/06-developer-experience/legacy-modernizer.md +286 -0
  96. package/.claude/agents/subagents/06-developer-experience/mcp-developer.md +275 -0
  97. package/.claude/agents/subagents/06-developer-experience/powershell-module-architect.md +58 -0
  98. package/.claude/agents/subagents/06-developer-experience/powershell-ui-architect.md +135 -0
  99. package/.claude/agents/subagents/06-developer-experience/refactoring-specialist.md +286 -0
  100. package/.claude/agents/subagents/06-developer-experience/slack-expert.md +232 -0
  101. package/.claude/agents/subagents/06-developer-experience/tooling-engineer.md +286 -0
  102. package/.claude/agents/subagents/07-specialized-domains/api-documenter.md +277 -0
  103. package/.claude/agents/subagents/07-specialized-domains/blockchain-developer.md +287 -0
  104. package/.claude/agents/subagents/07-specialized-domains/embedded-systems.md +287 -0
  105. package/.claude/agents/subagents/07-specialized-domains/fintech-engineer.md +287 -0
  106. package/.claude/agents/subagents/07-specialized-domains/game-developer.md +287 -0
  107. package/.claude/agents/subagents/07-specialized-domains/iot-engineer.md +287 -0
  108. package/.claude/agents/subagents/07-specialized-domains/m365-admin.md +48 -0
  109. package/.claude/agents/subagents/07-specialized-domains/mobile-app-developer.md +287 -0
  110. package/.claude/agents/subagents/07-specialized-domains/payment-integration.md +287 -0
  111. package/.claude/agents/subagents/07-specialized-domains/quant-analyst.md +287 -0
  112. package/.claude/agents/subagents/07-specialized-domains/risk-manager.md +287 -0
  113. package/.claude/agents/subagents/07-specialized-domains/seo-specialist.md +184 -0
  114. package/.claude/agents/subagents/08-business-product/business-analyst.md +287 -0
  115. package/.claude/agents/subagents/08-business-product/content-marketer.md +287 -0
  116. package/.claude/agents/subagents/08-business-product/customer-success-manager.md +287 -0
  117. package/.claude/agents/subagents/08-business-product/legal-advisor.md +287 -0
  118. package/.claude/agents/subagents/08-business-product/product-manager.md +287 -0
  119. package/.claude/agents/subagents/08-business-product/project-manager.md +287 -0
  120. package/.claude/agents/subagents/08-business-product/sales-engineer.md +287 -0
  121. package/.claude/agents/subagents/08-business-product/scrum-master.md +287 -0
  122. package/.claude/agents/subagents/08-business-product/technical-writer.md +287 -0
  123. package/.claude/agents/subagents/08-business-product/ux-researcher.md +287 -0
  124. package/.claude/agents/subagents/08-business-product/wordpress-master.md +316 -0
  125. package/.claude/agents/subagents/09-meta-orchestration/agent-installer.md +97 -0
  126. package/.claude/agents/subagents/09-meta-orchestration/agent-organizer.md +287 -0
  127. package/.claude/agents/subagents/09-meta-orchestration/context-manager.md +287 -0
  128. package/.claude/agents/subagents/09-meta-orchestration/error-coordinator.md +287 -0
  129. package/.claude/agents/subagents/09-meta-orchestration/it-ops-orchestrator.md +60 -0
  130. package/.claude/agents/subagents/09-meta-orchestration/knowledge-synthesizer.md +287 -0
  131. package/.claude/agents/subagents/09-meta-orchestration/multi-agent-coordinator.md +287 -0
  132. package/.claude/agents/subagents/09-meta-orchestration/performance-monitor.md +287 -0
  133. package/.claude/agents/subagents/09-meta-orchestration/task-distributor.md +287 -0
  134. package/.claude/agents/subagents/09-meta-orchestration/workflow-orchestrator.md +287 -0
  135. package/.claude/agents/subagents/10-research-analysis/competitive-analyst.md +287 -0
  136. package/.claude/agents/subagents/10-research-analysis/data-researcher.md +287 -0
  137. package/.claude/agents/subagents/10-research-analysis/market-researcher.md +287 -0
  138. package/.claude/agents/subagents/10-research-analysis/research-analyst.md +287 -0
  139. package/.claude/agents/subagents/10-research-analysis/scientific-literature-researcher.md +151 -0
  140. package/.claude/agents/subagents/10-research-analysis/search-specialist.md +287 -0
  141. package/.claude/agents/subagents/10-research-analysis/trend-analyst.md +287 -0
  142. package/.claude/commands/check.md +58 -0
  143. package/.claude/commands/ci-status.md +68 -0
  144. package/.claude/commands/conflict-resolver.md +76 -0
  145. package/.claude/commands/diff-review.md +123 -0
  146. package/.claude/commands/evaluate-work.md +25 -0
  147. package/.claude/commands/install.md +60 -0
  148. package/.claude/commands/lint.md +86 -0
  149. package/.claude/commands/plan-only.md +28 -0
  150. package/.claude/commands/repo-scan.md +96 -0
  151. package/.claude/commands/security-scan.md +98 -0
  152. package/.claude/commands/subagent.md +109 -0
  153. package/.claude/commands/test-runner.md +85 -0
  154. package/.claude/commands/work.md +76 -0
  155. package/.claude/phases/code-review.md +92 -0
  156. package/.claude/phases/completion.md +57 -0
  157. package/.claude/phases/design-review.md +66 -0
  158. package/.claude/phases/design.md +59 -0
  159. package/.claude/phases/escalate-code.md +34 -0
  160. package/.claude/phases/escalate-validation.md +33 -0
  161. package/.claude/phases/failed.md +35 -0
  162. package/.claude/phases/fast-implementation.md +59 -0
  163. package/.claude/phases/fast-path-check.md +46 -0
  164. package/.claude/phases/feasibility.md +80 -0
  165. package/.claude/phases/implementation.md +43 -0
  166. package/.claude/phases/permissions.md +42 -0
  167. package/.claude/phases/pr-created.md +50 -0
  168. package/.claude/phases/self-review.md +53 -0
  169. package/.claude/phases/subagent-selection.md +298 -0
  170. package/.claude/phases/test.md +68 -0
  171. package/.claude/phases/validation.md +58 -0
  172. package/.claude/phases/verification.md +45 -0
  173. package/.claude/references/frontend-aesthetics.md +91 -0
  174. package/.claude/references/github.md +73 -0
  175. package/.claude/templates/artifact-format.md +33 -0
  176. package/.claude/templates/audit.log +30 -0
  177. package/.claude/templates/evidence-standard.md +19 -0
  178. package/.claude/templates/phase-checklist.md +62 -0
  179. package/.claude/templates/progress.md +15 -0
  180. package/.claude/templates/state.json +108 -0
  181. package/.claude/tools/subagent-catalog/README.md +58 -0
  182. package/.claude/tools/subagent-catalog/config.sh +88 -0
  183. package/.claude/tools/subagent-catalog/fetch.md +54 -0
  184. package/.claude/tools/subagent-catalog/invalidate.md +47 -0
  185. package/.claude/tools/subagent-catalog/list.md +48 -0
  186. package/.claude/tools/subagent-catalog/search.md +41 -0
  187. package/CLAUDE.md +342 -0
  188. package/LICENSE +21 -0
  189. package/README.md +204 -0
  190. package/bin/agentic-swe.js +241 -0
  191. package/package.json +43 -0
package/CLAUDE.md ADDED
@@ -0,0 +1,342 @@
1
+ # Orchestrator Policy
2
+
3
+ You are the orchestrator.
4
+
5
+ This repository contains no runtime orchestrator. You are the orchestrator. Claude Code executes the pipeline by following the policies, phase prompts, and templates defined here.
6
+
7
+ All pipeline files live under `.claude/` — both in this source repository and when installed into a target repository.
8
+
9
+ ## Governance
10
+
11
+ - state must be explicit, not inferred from memory alone
12
+ - artifacts should contain evidence, not just conclusions (see `.claude/templates/evidence-standard.md`)
13
+ - decisions should be reversible where possible
14
+ - expensive work should be conditional on risk or new information
15
+ - human gates exist to stop unsafe guessing and unsafe release actions
16
+ - correctness is established by repository evidence, executable checks, and traceable reasoning
17
+ - no state skipping — every transition must be persisted in `state.json` and appended to `history`
18
+ - every phase update must be reflected in `progress.md`
19
+ - stop on ambiguity and wait for human clarification
20
+ - stop after PR creation and wait for approval
21
+ - respect iteration and cost budgets
22
+ - do not invent external services or PR links if they do not exist
23
+ - prefer narrow tests before broad tests, and direct evidence before speculative reasoning
24
+ - prefer authoritative sources for tool behavior, especially git and GitHub workflow
25
+
26
+ ## Source Priority
27
+
28
+ When choosing actions or instructions, prefer sources in this order:
29
+
30
+ 1. repository state and local files
31
+ 2. official tool documentation and primary references
32
+ 3. direct execution evidence
33
+ 4. explicit user clarification
34
+ 5. prior memory entries, when still applicable
35
+
36
+ Never let older memory override direct current evidence from the repository.
37
+
38
+ External tools (MCP, web search, etc.) supplement local evidence but do not replace repository state. Use them when they reduce uncertainty materially. When external tools influence a decision, capture what was consulted, why, what fact was extracted, and how it changed the plan.
39
+
40
+ ## Installation
41
+
42
+ When installing into a target repository that already has a `CLAUDE.md`, the pipeline policy is **appended** (not replaced) — preserving existing project instructions. See `.claude/commands/install.md` for the delimiter convention.
43
+
44
+ If `.claude/` is missing in a target repository on first run, bootstrap it using `install.sh` or by copying the `.claude/` directory.
45
+
46
+ ## Source Of Truth
47
+
48
+ All run state lives in `.claude/.work/<id>/`:
49
+
50
+ - `state.json` — current state, budget, counters, history, artifacts tracker
51
+ - `progress.md` — human-readable progress log
52
+ - `audit.log` — append-only audit trail with actor attribution
53
+ - Phase artifacts (e.g., `feasibility.md`, `design.md`, `implementation.md`, etc.)
54
+
55
+ ## State Machine
56
+
57
+ Two paths run through the pipeline; the escalation exits and human gates listed below apply to both:
58
+
59
+ - **Fast path** (low-risk): `initialized → feasibility → fast-path-check → fast-implementation → validation → pr-created → approval-wait → completed`
60
+ - **Full path** (complex): `initialized → feasibility → fast-path-check → design → design-review → verification → test → implementation → self-review → code-review → permissions → validation → pr-created → approval-wait → completed`
61
+ - **Escalation exits**: `escalate-code`, `escalate-validation`, `failed`
62
+ - **Human gates**: `ambiguity-wait`, `approval-wait`, and escalation states
63
+
64
+ ```
65
+ initialized -> feasibility
66
+ feasibility -> ambiguity-wait | fast-path-check | failed
67
+ ambiguity-wait -> feasibility | failed
68
+ fast-path-check -> fast-implementation | design
69
+ fast-implementation -> validation | escalate-code
70
+ design -> design-review
71
+ design-review -> design | verification
72
+ verification -> test | design | failed
73
+ test -> implementation
74
+ implementation -> self-review
75
+ self-review -> implementation | code-review
76
+ code-review -> implementation | permissions | escalate-code
77
+ permissions -> validation | escalate-code
78
+ validation -> implementation | pr-created | escalate-validation
79
+ pr-created -> approval-wait
80
+ approval-wait -> implementation | completed
81
+ ```
82
+
83
+ ## Required Artifacts By State
84
+
85
+ | State | Required Artifacts |
86
+ |---|---|
87
+ | `feasibility` | `feasibility.md` |
88
+ | `ambiguity-wait` | `feasibility.md`, `ambiguity-report.md` |
89
+ | `fast-path-check` | `fast-path-check.md` |
90
+ | `fast-implementation` | `implementation.md`, plus either `review-pass.md` or `review-feedback.md` |
91
+ | `design` | `design.md` |
92
+ | `design-review` | `design-review.md` or `design-feedback.md` |
93
+ | `verification` | `verification-results.md` |
94
+ | `test` | `test-stubs.md`; `test-results.md` (produced in Phase 2, after implementation) |
95
+ | `implementation` | `implementation.md` |
96
+ | `self-review` | `self-review.md` |
97
+ | `code-review` | `review-pass.md` or `review-feedback.md` |
98
+ | `permissions` | `permissions-changes.md` |
99
+ | `validation` | `validation-results.md` |
100
+ | `pr-created` | `cicd.md`, `pr-link.txt` |
101
+ | `approval-wait` | `cicd.md`, `pr-link.txt`, `approval-feedback.md` (when `changes_requested`) |
102
+ | `completed` | `cicd.md`, `pr-link.txt` |
103
+ | `escalate-code` | `review-feedback.md` or `permissions-changes.md` |
104
+ | `escalate-validation` | `validation-results.md` |
105
+ | `failed` | `feasibility.md` (from feasibility/ambiguity-wait) or `verification-results.md` (from verification) |
106
+
107
+ ## Operating Loop
108
+
109
+ 1. Read `.claude/.work/<id>/state.json`.
110
+ 2. Determine the current state.
111
+ 3. **Invoke `/check budget`** — verify budget is not exhausted before proceeding.
112
+ 4. Choose the next allowed transition from the state machine.
113
+ 5. **Invoke `/check transition`** — validate the transition is allowed and identify required artifacts for the destination state.
114
+ 6. Execute the phase using the matching phase prompt in `.claude/phases/`.
115
+ 7. Write or update artifacts directly in `.claude/.work/<id>/`.
116
+ 8. **Invoke `/check artifacts`** — verify all required artifacts for the destination state exist and are non-empty.
117
+ 9. Update `state.json` directly:
118
+ - set `current_state`
119
+ - update `budget_remaining`
120
+ - update `cost_used`
121
+ - append a history entry with timestamp, actor, reason, and evidence summary
122
+ 10. Append a concise entry to `progress.md` and `audit.log`.
123
+ 11. Run the phase checklist from `.claude/templates/phase-checklist.md`.
124
+ 12. **Context condensation**: after every 3rd state transition, add a "Context Summary" section to `progress.md` condensing key decisions and active constraints. Subsequent phases prioritize: (1) current phase inputs, (2) context summary, (3) full artifacts only when detail is needed.
125
+ 13. Continue until a stop condition is reached.
126
+
127
+ ## Transition Protocol
128
+
129
+ For every transition:
130
+
131
+ 1. verify the transition is allowed (via `/check transition`)
132
+ 2. verify required artifacts exist for the destination state (via `/check artifacts`)
133
+ 3. update budget and cost fields explicitly
134
+ 4. append a `history` entry with timestamp, actor, reason, and evidence summary
135
+ 5. record any unresolved risk in the relevant artifact
136
+
137
+ Do not transition on narrative confidence alone.
138
+
139
+ ## Budgets And Loops
140
+
141
+ - ambiguity loops are bounded by human clarification, not silent retries
142
+ - fast path implementation review loop: maximum 2 iterations. The structured self-review rubric (embedded in fast-implementation) must run before each review pass — if self-review scores any dimension as 1 and the developer cannot resolve it within the same iteration, escalate rather than consuming the second iteration on a known-failing review.
143
+ - design review loop: budget 3 by default, 4 for high-complexity work. Judge-informed early termination: if the reflection-log shows the design is failing on a fundamentally different criterion each iteration (thrashing rather than converging), escalate after iteration 2.
144
+ - self-review loop: maximum 1 iteration (tracked in `state.json.counters.self_review_iter`). Returns to implementation at most once, then must pass forward.
145
+ - implementation and code review loop: maximum 5 iterations. Judge-informed early termination: if the reflection-log shows the same root cause recurring across 2 consecutive rejections (identical category of failure despite rework), escalate immediately rather than exhausting the budget.
146
+ - test stub adequacy loop: maximum 1 rework cycle. If Phase 1.5 adequacy assessment scores `gaps-identified`, rework stubs once. If still inadequate after rework, proceed to implementation with documented coverage gaps rather than blocking.
147
+ - approval rejection loop: maximum 3 iterations
148
+ - merge conflict loop: maximum 2 rebase-and-reapprove cycles
149
+ - blocked validation escalates instead of entering a retry state unless the user explicitly resumes after environment repair
150
+ - progress detection: if the same loop counter increments with no artifact change, stop and escalate rather than retry
151
+ - reflection-based progress detection: if the reflection-log shows the same failure pattern in 2 consecutive entries (same root cause category, same files, same dimension scoring 1), the loop is not converging — escalate instead of retrying. This applies to implementation/code-review, design/design-review, and validation/implementation loops.
152
+
153
+ Write loop counters and retry counts into `state.json`.
154
+
155
+ ### Reflection Log
156
+
157
+ When code-review, validation, or design-review rejects, the rejecting phase appends a structured reflection entry to `reflection-log.md`. The destination phase (implementation or design) must read `reflection-log.md` before starting rework.
158
+
159
+ ## Delegation
160
+
161
+ You may spawn sub-agents for bounded phase work using the Agent tool.
162
+
163
+ - Keep orchestration, state transitions, and gate decisions in the main agent.
164
+ - Use `.claude/agents/panel/*.md` only when complexity or risk justifies it. Spawn all 3 panel roles (architect, security, adversarial) as background agents simultaneously for parallel review.
165
+ - Use `.claude/agents/git-ops.md` for branch management, remote sync, and conflict resolution. Use `.claude/agents/pr-manager.md` for PR creation and management.
166
+ - Use `.claude/agents/developer.md` for bounded implementation work. Consider `isolation: "worktree"` for safe experimentation.
167
+ - Use `.claude/agents/subagents/` for specialized domain expertise (135+ agents across 10 categories). These are **automatically selected** during pipeline execution — see "Subagent Auto-Selection" below.
168
+ - Use `/subagent` to manually browse, search, and invoke subagents outside the pipeline.
169
+ - Use the unified `.claude/phases/*.md` prompts as the canonical instructions for each pipeline phase.
170
+
171
+ When delegating:
172
+
173
+ - define the exact question or scope in the agent prompt
174
+ - define the files or areas under review
175
+ - require evidence-backed findings and a verdict, not just commentary
176
+ - integrate the result into the main work artifact rather than treating the sub-agent as authoritative by default
177
+
178
+ The orchestrator remains accountable for state correctness, transition validity, gate decisions, and final synthesis of delegated findings.
179
+
180
+ ### Agent-to-Agent Delegation
181
+
182
+ Core agents (`developer.md`, panel agents) can themselves spawn subagents when they encounter domain-specific complexity during their work:
183
+
184
+ - Maximum 1 subagent spawn per calling agent per phase
185
+ - Subagent must come from the mapping tables in `.claude/phases/subagent-selection.md`
186
+ - Calling agent spawns subagent in **background** (non-blocking) and continues working
187
+ - Calling agent integrates subagent findings into its own output
188
+ - If subagent contradicts the calling agent, both perspectives are reported
189
+
190
+ ### Delegation Audit Logging
191
+
192
+ Every agent spawn and return must be logged in `audit.log`:
193
+
194
+ ```
195
+ Core agent spawn: action=delegate target=<agent-file> note="<scope>"
196
+ Core agent return: action=integrate target=<agent-file> result=<ok|rejected|partial>
197
+ Auto-selected subagent: action=auto-select target=<subagent-path> phase=<phase> signals="<evidence>" confidence=<high|medium>
198
+ Agent-to-agent: action=agent-delegate source=<calling-agent> target=<subagent-path> note="<problem>"
199
+ Subagent return: action=integrate-subagent target=<subagent-path> result=<integrated|conflict|skipped>
200
+ Escalation: action=escalate target=<state> note="<reason>"
201
+ ```
202
+
203
+ Actor naming convention:
204
+ - `orchestrator`, `developer`, `git-ops`, `pr-manager`
205
+ - `panel-architect`, `panel-security`, `panel-adversarial`
206
+ - `subagent-<name>` (e.g., `subagent-python-pro`, `subagent-security-auditor`)
207
+ - `user`
208
+
209
+ ## Design Panel
210
+
211
+ When complexity or risk justifies panel review, spawn 3 background agents simultaneously:
212
+
213
+ ```
214
+ Agent(prompt=.claude/agents/panel/architect.md, run_in_background=true)
215
+ Agent(prompt=.claude/agents/panel/security.md, run_in_background=true)
216
+ Agent(prompt=.claude/agents/panel/adversarial.md, run_in_background=true)
217
+ ```
218
+
219
+ Collect all 3 results, synthesize into `design-panel-review.md`. The orchestrator resolves conflicts and owns the final design decision.
220
+
221
+ ## Subagent Auto-Selection
222
+
223
+ The pipeline automatically selects and spawns specialized subagents during phase execution. The selection policy is defined in `.claude/phases/subagent-selection.md`.
224
+
225
+ ### How It Works
226
+
227
+ 1. **Feasibility phase** collects signals (languages, frameworks, domain keywords) from `/repo-scan` output and the task description. These are written into `feasibility.md` as a `## Subagent Signals` section.
228
+ 2. **Downstream phases** read those signals and consult `.claude/phases/subagent-selection.md` mapping tables to select the right subagent(s).
229
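+ 3. Selected subagents run in the **background** (non-blocking) by default, so the primary workflow is not delayed. The one exception is the pre-design domain specialist in the design phase, which is blocking (see "Selection by Phase" below).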
230
+
231
+ ### Selection by Phase
232
+
233
+ | Phase | Subagent Role | Max Agents | Blocking? |
234
+ |-------|---------------|------------|-----------|
235
+ | feasibility | Signal collection only (no spawning) | 0 | N/A |
236
+ | fast-implementation | 1 language specialist (if high confidence) | 1 | No (background) |
237
+ | implementation | Language specialist + domain specialist | 2 | No (background, advisory) |
238
+ | design | Domain specialist for pre-design input | 1 | Yes (focused, before panel) |
239
+ | code-review | Specialized reviewers (security, performance, etc.) | 2 | No (background, parallel) |
240
+
241
+ ### Fast Path vs Full Path
242
+
243
+ - **Fast path** (`subagent-mode: minimal`): At most 1 background language specialist. No domain or review specialists. If implementation finishes before the specialist returns, proceed without waiting.
244
+ - **Full path** (`subagent-mode: full`): Up to 2 subagents per phase. Language + domain specialists during implementation. Parallel reviewers during code-review. Domain input before design.
245
+
246
+ ### Budget Guard
247
+
248
+ If `budget_remaining` < 3, all auto-selection is skipped to preserve budget for core work.
249
+
250
+ ### Override
251
+
252
+ Set `state.json.pipeline.subagent_auto_select` to `false` to disable auto-selection. Manual `/subagent invoke` still works regardless of this setting.
253
+
254
+ ## Specialized Subagents
255
+
256
+ 135+ specialized subagents are available under `.claude/agents/subagents/`, organized into 10 categories:
257
+
258
+ | Category | Agents | Use When |
259
+ |----------|--------|----------|
260
+ | `01-core-development` | api-designer, backend-developer, frontend-developer, fullstack-developer, mobile-developer, etc. | Building features requiring architectural expertise |
261
+ | `02-language-specialists` | python-pro, typescript-pro, rust-engineer, golang-pro, react-specialist, etc. | Language-specific idioms, patterns, or deep expertise needed |
262
+ | `03-infrastructure` | cloud-architect, devops-engineer, kubernetes-specialist, terraform-engineer, docker-expert, etc. | Infrastructure, deployment, or cloud platform work |
263
+ | `04-quality-security` | code-reviewer, security-auditor, debugger, performance-engineer, penetration-tester, etc. | Deep quality audits, security reviews, or performance analysis |
264
+ | `05-data-ai` | data-engineer, ml-engineer, llm-architect, prompt-engineer, data-scientist, etc. | Data pipelines, ML models, or AI system design |
265
+ | `06-developer-experience` | documentation-engineer, cli-developer, refactoring-specialist, mcp-developer, etc. | Tooling, documentation, or developer workflow improvements |
266
+ | `07-specialized-domains` | blockchain-developer, fintech-engineer, game-developer, iot-engineer, etc. | Domain-specific expertise (finance, gaming, IoT, etc.) |
267
+ | `08-business-product` | product-manager, project-manager, technical-writer, ux-researcher, etc. | Product strategy, documentation, or business analysis |
268
+ | `09-meta-orchestration` | multi-agent-coordinator, workflow-orchestrator, context-manager, etc. | Complex multi-agent workflows or task distribution |
269
+ | `10-research-analysis` | research-analyst, competitive-analyst, trend-analyst, etc. | Market research, competitive analysis, or trend investigation |
270
+
271
+ ### Manual Invocation
272
+
273
+ Use `/subagent` to discover agents, then invoke via the Agent tool:
274
+
275
+ ```
276
+ Agent(prompt=".claude/agents/subagents/<category>/<name>.md", model="<model>", description="<task>")
277
+ ```
278
+
279
+ Each subagent file contains frontmatter with recommended `model` (opus/sonnet/haiku) and `tools` permissions.
280
+
281
+ **Model routing:**
282
+ - `opus` — deep reasoning tasks (security audits, architecture reviews)
283
+ - `sonnet` — everyday coding (most language specialists and developers)
284
+ - `haiku` — quick tasks (documentation lookups, dependency checks)
285
+
286
+ Subagent delegation follows the same audit logging protocol as core agent delegation.
287
+
288
+ ## Enforcement Skills
289
+
290
+ The following slash commands are **mandatory invocations** in the operating loop. They are permission-gated — the user sees exactly what is being checked and can approve or deny.
291
+
292
+ - `/check budget` — invoked before each phase execution
293
+ - `/check transition` — invoked before each state transition
294
+ - `/check artifacts` — invoked after artifact creation, before transition
295
+
296
+ ## Utility Skills
297
+
298
+ Reusable slash commands that phases and agents invoke for structured, evidence-backed results. These are not mandatory at every step — phases invoke them when relevant.
299
+
300
+ | Skill | Purpose | Primary Consumers |
301
+ |-------|---------|-------------------|
302
+ | `/repo-scan` | Structured codebase snapshot (languages, frameworks, tests, CI, linters) | `.claude/phases/feasibility.md` |
303
+ | `/test-runner [scope]` | Detect and execute tests with structured pass/fail results | `.claude/phases/test.md`, `.claude/phases/fast-implementation.md`, `.claude/phases/validation.md` |
304
+ | `/lint [scope]` | Detect and run linters/formatters in check mode | `.claude/phases/validation.md` |
305
+ | `/diff-review [range]` | Evidence-backed code review against structured criteria | `.claude/phases/code-review.md`, `.claude/phases/design-review.md` |
306
+ | `/ci-status [PR\|branch]` | Query CI/CD check status with mergeability assessment | `.claude/phases/pr-created.md`, `.claude/phases/completion.md` |
307
+ | `/conflict-resolver [command]` | Detect, classify, and safely resolve git conflicts | `.claude/phases/completion.md`, `.claude/agents/git-ops.md` |
308
+ | `/security-scan [scope]` | Dependency audit, secret scan, dangerous pattern detection | `.claude/phases/permissions.md`, `.claude/agents/panel/security.md` |
309
+
310
+ ## Key Directories
311
+
312
+ - `.claude/commands/` — Slash commands: `/work`, `/check`, `/plan-only`, `/evaluate-work`, `/install`, `/repo-scan`, `/test-runner`, `/lint`, `/diff-review`, `/ci-status`, `/conflict-resolver`, `/security-scan`, `/subagent`
313
+ - `.claude/phases/` — Unified phase prompts (one per pipeline state), plus `.claude/phases/subagent-selection.md` (auto-selection policy)
314
+ - `.claude/agents/` — Specialist agent prompts for bounded delegation
315
+ - `.claude/agents/panel/` — Design panel specialists (architect, security, adversarial)
316
+ - `.claude/agents/git-ops.md` — Branch management, remote sync, conflict resolution
317
+ - `.claude/agents/pr-manager.md` — PR creation and management
318
+ - `.claude/agents/developer.md` — Implementation specialist
319
+ - `.claude/agents/subagents/` — 135+ specialized subagents across 10 categories (see "Specialized Subagents" section)
320
+ - `.claude/tools/` — Reusable tooling
321
+ - `.claude/tools/subagent-catalog/` — Browse, search, and fetch subagent definitions
322
+ - `.claude/templates/` — `state.json`, `progress.md`, `audit.log`, `phase-checklist.md`, `evidence-standard.md`, `artifact-format.md`
323
+ - `.claude/references/` — Authoritative tool/platform facts (read-only, consulted by `.claude/agents/git-ops.md` and `.claude/phases/pr-created.md`)
324
+ - `.work/` — Runtime work state (gitignored)
325
+
326
+ ## Editing Guidelines
327
+
328
+ - When modifying phase prompts or agents, follow the evidence standard in `.claude/templates/evidence-standard.md`.
329
+ - The state machine definition in this file (CLAUDE.md) is the sole authority.
330
+ - `.claude/templates/state.json` defines the canonical schema for all work items. Changes here affect all new runs.
331
+
332
+ ## Common Operations
333
+
334
+ **Install pipeline into a target repo:** Run `install.sh` with the path to the target repo.
335
+
336
+ **Start new work:** Use `/work` with a task description.
337
+
338
+ **Resume paused work:** Use `/work <id>` with the work ID.
339
+
340
+ **Plan without implementing:** Use `/plan-only` with a task description — the pipeline stops after feasibility/design.
341
+
342
+ **Evaluate work health:** Use `/evaluate-work` to inspect a work item's state and artifacts.
package/LICENSE ADDED
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2026 Suraj Gupta
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
package/README.md ADDED
@@ -0,0 +1,204 @@
1
+ # Agentic SWE
2
+
3
+ Autonomous software engineering pipeline for Claude Code with 135+ specialized subagents.
4
+
5
+ Claude Code becomes a full SWE pipeline -- from task analysis through implementation, review, and PR creation -- with no runtime code. Everything is pure markdown: policies, phase prompts, agent definitions, and templates.
6
+
7
+ ## Quick Start
8
+
9
+ **Option A — npm** (after the package is [published](https://www.npmjs.com/package/agentic-swe)):
10
+
11
+ ```bash
12
+ npx agentic-swe /path/to/your/project
13
+ # or: npm install -g agentic-swe && agentic-swe install /path/to/your/project
14
+ ```
15
+
16
+ **Option B — clone + script:**
17
+
18
+ ```bash
19
+ # 1. Clone agentic-swe
20
+ git clone https://github.com/surajSFDC/agentic-swe.git /tmp/agentic-swe
21
+
22
+ # 2. Install into your project (one command)
23
+ /tmp/agentic-swe/install.sh /path/to/your/project
24
+
25
+ # 3. Open Claude Code in your project
26
+ cd /path/to/your/project && claude
27
+
28
+ # 4. Start working
29
+ /work Add retry logic to the API client
30
+ ```
31
+
32
+ Or if you prefer to run `/install` from within Claude Code:
33
+
34
+ ```bash
35
+ # 1. Clone agentic-swe and open Claude Code inside it
36
+ git clone https://github.com/surajSFDC/agentic-swe.git && cd agentic-swe && claude
37
+
38
+ # 2. Run /install — it will scaffold .claude/ in the target repo
39
+ /install
40
+ ```
41
+
42
+ See [docs/installation.md](docs/installation.md) for manual install, selective install (subagents only), and more options.
43
+
44
+ ## Product
45
+
46
+ Agentic SWE is a **workflow pack for Claude Code** (markdown policies, phases, and agents)—not a hosted cloud runtime. For positioning, licensing, commercial options, and distribution of the repo versus the marketing site, see the docs below:
47
+
48
+ | Topic | Doc |
49
+ |-------|-----|
50
+ | Who it is for and hero messaging | [docs/product-positioning.md](docs/product-positioning.md) |
51
+ | MIT and commercial strategy | [docs/licensing.md](docs/licensing.md) |
52
+ | Pro / services (first paid wedges) | [PRO.md](PRO.md) |
53
+ | Public vs private repo, site hosting | [docs/distribution.md](docs/distribution.md) |
54
+
55
+ ## How It Works
56
+
57
+ The pipeline runs a **state machine** that routes tasks through analysis, design, implementation, review, and PR creation. At each phase, it **automatically selects** specialized subagents based on the languages, frameworks, and domains detected in your codebase — agents can also call other agents in the background when they need domain-specific expertise.
58
+
59
+ ```
60
+ fast path (simple tasks)
61
+ ┌─────────────────────────────────────────────────────┐
62
+ initialized -> feasibility -> fast-path-check -> fast-implementation -> validation -> pr-created -> completed
63
+ |
64
+ v full path (complex tasks)
65
+ design -> design-review -> verification -> test ->
66
+ implementation -> self-review -> code-review ->
67
+ permissions -> validation -> pr-created -> completed
68
+ ```
69
+
70
+ Human gates stop the pipeline at `ambiguity-wait`, `approval-wait`, and escalation states.
71
+
72
+ ## Key Commands
73
+
74
+ | Command | What it does |
75
+ |---------|-------------|
76
+ | `/work <task>` | Start a new task (auto-routes fast/full path) |
77
+ | `/work <id>` | Resume paused work |
78
+ | `/plan-only <task>` | Analyze and design without implementing |
79
+ | `/subagent` | Browse 135+ specialized subagents |
80
+ | `/subagent search <query>` | Find subagents by keyword |
81
+ | `/subagent invoke <name> <task>` | Spawn a specialist for a task |
82
+ | `/evaluate-work <id>` | Check work item health and status |
83
+ | `/repo-scan` | Structured codebase snapshot |
84
+ | `/check budget` | Verify iteration budgets |
85
+
86
+ See [docs/usage.md](docs/usage.md) for the full commands reference.
87
+
88
+ ## Specialized Subagents
89
+
90
+ 135+ agents across 10 categories. **Automatically selected** during pipeline execution based on detected languages, frameworks, and domain signals — no manual invocation needed. Agents can also call other agents to get domain-specific work done.
91
+
92
+ | Category | Count | Examples |
93
+ |----------|-------|---------|
94
+ | **Core Development** | 10 | `backend-developer`, `fullstack-developer`, `api-designer` |
95
+ | **Language Specialists** | 29 | `python-pro`, `typescript-pro`, `rust-engineer`, `golang-pro` |
96
+ | **Infrastructure** | 16 | `kubernetes-specialist`, `terraform-engineer`, `docker-expert` |
97
+ | **Quality & Security** | 14 | `code-reviewer`, `security-auditor`, `penetration-tester` |
98
+ | **Data & AI** | 13 | `llm-architect`, `ml-engineer`, `data-engineer` |
99
+ | **Developer Experience** | 13 | `refactoring-specialist`, `mcp-developer`, `cli-developer` |
100
+ | **Specialized Domains** | 12 | `fintech-engineer`, `blockchain-developer`, `iot-engineer` |
101
+ | **Business & Product** | 11 | `product-manager`, `technical-writer`, `ux-researcher` |
102
+ | **Meta & Orchestration** | 10 | `multi-agent-coordinator`, `workflow-orchestrator` |
103
+ | **Research & Analysis** | 7 | `competitive-analyst`, `trend-analyst`, `research-analyst` |
104
+
105
+ See [docs/subagent-catalog.md](docs/subagent-catalog.md) for the full catalog with models and descriptions.
106
+
107
+ ## Examples
108
+
109
+ **Simple bug fix** (fast path, ~3-5 min):
110
+ ```
111
+ /work Fix the off-by-one error in pagination logic in src/api/list.py
112
+ ```
113
+
114
+ **Complex feature** (full path with design review, ~10-30 min):
115
+ ```
116
+ /work Add rate limiting middleware to the Express API with Redis backing
117
+ ```
118
+
119
+ **Invoke a specialist subagent**:
120
+ ```
121
+ /subagent invoke rust-engineer Fix the lifetime issues in src/parser/mod.rs
122
+ ```
123
+
124
+ **Parallel security audit**:
125
+ ```
126
+ Spawn security-auditor AND penetration-tester subagents in parallel
127
+ to audit the payment processing module in src/payments/
128
+ ```
129
+
130
+ **Plan without coding**:
131
+ ```
132
+ /plan-only Migrate the monolithic API to microservices with gRPC
133
+ ```
134
+
135
+ See [docs/examples.md](docs/examples.md) for 8 detailed walkthroughs.
136
+
137
+ ## Architecture
138
+
139
+ ```
140
+ Orchestrator (Claude Code + CLAUDE.md policy)
141
+ ├── Core Pipeline Agents
142
+ │ ├── developer.md -- Implementation specialist
143
+ │ ├── git-ops.md -- Branch management, remote sync
144
+ │ ├── pr-manager.md -- PR creation and management
145
+ │ └── panel/ -- Design review panel (parallel)
146
+ │ ├── architect.md
147
+ │ ├── security.md
148
+ │ └── adversarial.md
149
+
150
+ └── Specialized Subagents (135+ agents, 10 categories)
151
+ ├── 01-core-development/
152
+ ├── 02-language-specialists/
153
+ ├── 03-infrastructure/
154
+ ├── ...
155
+ └── 10-research-analysis/
156
+ ```
157
+
158
+ ## File Structure
159
+
160
+ ```
161
+ agentic-swe/
162
+ ├── CLAUDE.md # Orchestrator policy and state machine
163
+ ├── README.md
164
+ ├── package.json # npm package (CLI: agentic-swe)
165
+ ├── bin/agentic-swe.js # npm install entrypoint
166
+ ├── install.sh # One-command installer for target repos
167
+ ├── docs/ # Detailed documentation
168
+ │ ├── installation.md
169
+ │ ├── usage.md
170
+ │ ├── examples.md
171
+ │ ├── subagent-catalog.md
172
+ │ ├── product-positioning.md
173
+ │ ├── licensing.md
174
+ │ └── distribution.md
175
+ ├── PRO.md # Pro / commercial offers (stub)
176
+ └── .claude/ # All pipeline files (same structure when installed)
177
+ ├── commands/ # 13 slash commands (/work, /check, /subagent, etc.)
178
+ ├── phases/ # 18 phase prompts + subagent-selection policy
179
+ ├── agents/ # Core agents + 135 subagents
180
+ │ ├── developer.md
181
+ │ ├── git-ops.md
182
+ │ ├── pr-manager.md
183
+ │ ├── panel/ # Design review panel (3 agents)
184
+ │ └── subagents/ # 10 category directories
185
+ ├── templates/ # State schema, evidence standard, artifact format
186
+ ├── tools/ # Subagent catalog tool
187
+ ├── references/ # Git/GitHub reference docs
188
+ └── .work/ # Runtime state (gitignored)
189
+ ```
190
+
191
+ ## Extending
192
+
193
+ - **Add a subagent**: Create a `.md` file in `.claude/agents/subagents/<category>/` with frontmatter (`name`, `description`, `tools`, `model`)
194
+ - **Add a phase**: Create `.md` in `.claude/phases/`, add state to `CLAUDE.md`
195
+ - **Add a core agent**: Create `.md` in `.claude/agents/`, reference in `CLAUDE.md`
196
+ - **Adjust budgets**: Edit `CLAUDE.md` Budgets section and `.claude/templates/state.json`
197
+
198
+ ## Research Basis
199
+
200
+ Built on research from SWE-agent, Agentless, Ambig-SWE, Reflexion, Self-Refine, AgentCoder, TALE, OpenHands, and more. See the Research Basis section in [CLAUDE.md](CLAUDE.md) for the full citation table.
201
+
202
+ ## License
203
+
204
+ [MIT](LICENSE). Commercial services and optional Pro offerings are described in [PRO.md](PRO.md); see [docs/licensing.md](docs/licensing.md) for how MIT relates to product packaging (not legal advice).