agentic-dev 0.2.20 → 0.2.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (54)
  1. package/README.md +13 -10
  2. package/dist/lib/orchestration-assets.d.ts +1 -1
  3. package/dist/lib/orchestration-assets.d.ts.map +1 -1
  4. package/dist/lib/orchestration-assets.js +78 -21
  5. package/dist/lib/orchestration-assets.js.map +1 -1
  6. package/dist/lib/scaffold.d.ts +1 -0
  7. package/dist/lib/scaffold.d.ts.map +1 -1
  8. package/dist/lib/scaffold.js +175 -4
  9. package/dist/lib/scaffold.js.map +1 -1
  10. package/dist/lib/types.d.ts +2 -0
  11. package/dist/lib/types.d.ts.map +1 -1
  12. package/package.json +2 -5
  13. package/.agent/prd.json +0 -29
  14. package/.agent/progress.txt +0 -1
  15. package/.agent/prompt.md +0 -21
  16. package/.agent/ralph-loop-state.json +0 -13
  17. package/.agent/ralph-supervisor-state.json +0 -12
  18. package/.agent/ralph-supervisor.sh +0 -238
  19. package/.agent/ralph.sh +0 -305
  20. package/.agent/runs/README.md +0 -7
  21. package/.agent/sdd-build-ast-audit.json +0 -13
  22. package/.claude/CLAUDE.md +0 -44
  23. package/.claude/agentic-dev.json +0 -3
  24. package/.claude/agents/ai-dev.md +0 -27
  25. package/.claude/agents/backend-dev.md +0 -26
  26. package/.claude/agents/db-dev.md +0 -26
  27. package/.claude/agents/devops.md +0 -27
  28. package/.claude/agents/frontend-dev.md +0 -25
  29. package/.claude/agents/github-ops.md +0 -25
  30. package/.claude/agents/test-dev.md +0 -26
  31. package/.claude/agents/uiux-designer.md +0 -25
  32. package/.claude/settings.json +0 -49
  33. package/.claude/settings.local.json +0 -8
  34. package/.claude/skills/sdd/SKILL.md +0 -189
  35. package/.claude/skills/sdd/agents/openai.yaml +0 -4
  36. package/.claude/skills/sdd/references/section-map.md +0 -67
  37. package/.claude/workspace-config.json +0 -3
  38. package/.codex/agentic-dev.json +0 -3
  39. package/.codex/agents/README.md +0 -22
  40. package/.codex/agents/api.toml +0 -11
  41. package/.codex/agents/architecture.toml +0 -11
  42. package/.codex/agents/ci.toml +0 -11
  43. package/.codex/agents/gitops.toml +0 -11
  44. package/.codex/agents/orchestrator.toml +0 -11
  45. package/.codex/agents/quality.toml +0 -11
  46. package/.codex/agents/runtime.toml +0 -11
  47. package/.codex/agents/security.toml +0 -11
  48. package/.codex/agents/specs.toml +0 -11
  49. package/.codex/agents/ui.toml +0 -11
  50. package/.codex/config.toml +0 -46
  51. package/.codex/skills/SKILL.md +0 -13
  52. package/.codex/skills/sdd/SKILL.md +0 -189
  53. package/.codex/skills/sdd/agents/openai.yaml +0 -4
  54. package/.codex/skills/sdd/references/section-map.md +0 -67
@@ -1,11 +0,0 @@
1
- model = "gpt-5.3-codex"
2
- model_reasoning_effort = "medium"
3
- sandbox_mode = "workspace-write"
4
- developer_instructions = """
5
- You are the UI sub-agent.
6
-
7
- Mission:
8
- - Keep UI contracts aligned with backend APIs and design intent.
9
- - Prefer minimal, compatible changes.
10
- - Preserve reusable component surfaces.
11
- """
@@ -1,46 +0,0 @@
1
- [features]
2
- multi_agent = true
3
-
4
- [agents]
5
- max_threads = 10
6
- max_depth = 1
7
-
8
- [agents.architecture]
9
- description = "Drive high-level architecture, boundaries, and migration decisions."
10
- config_file = "agents/architecture.toml"
11
-
12
- [agents.runtime]
13
- description = "Refactor runtime and application wiring while preserving behavior."
14
- config_file = "agents/runtime.toml"
15
-
16
- [agents.gitops]
17
- description = "Own CI/CD, compose, and deployment wiring."
18
- config_file = "agents/gitops.toml"
19
-
20
- [agents.quality]
21
- description = "Run validation gates and identify regressions."
22
- config_file = "agents/quality.toml"
23
-
24
- [agents.api]
25
- description = "Own API boundary contracts and backward compatibility."
26
- config_file = "agents/api.toml"
27
-
28
- [agents.orchestrator]
29
- description = "Improve orchestration flows and operational safety."
30
- config_file = "agents/orchestrator.toml"
31
-
32
- [agents.ci]
33
- description = "Maintain pipeline policy and release path integrity."
34
- config_file = "agents/ci.toml"
35
-
36
- [agents.specs]
37
- description = "Validate SDD and specification consistency."
38
- config_file = "agents/specs.toml"
39
-
40
- [agents.ui]
41
- description = "Own UI contracts, hooks, and frontend integration surfaces."
42
- config_file = "agents/ui.toml"
43
-
44
- [agents.security]
45
- description = "Audit security and operational regression risk."
46
- config_file = "agents/security.toml"
@@ -1,13 +0,0 @@
1
- ---
2
- name: otro
3
- description: OTRO (Overlap-Tolerant Residual Orchestration) root alias for the canonical template skill surface.
4
- ---
5
-
6
- # OTRO Alias
7
-
8
- 이 파일은 root alias다. canonical OTRO skill body와 scripts/references/schemas는 [`otro/SKILL.md`](./otro/SKILL.md)를 기준으로 사용한다.
9
-
10
- ## Rule
11
-
12
- - OTRO 실행 시 root 중복 자산이 아니라 `otro/` 하위 canonical 자산만 사용한다.
13
- - `sdd-development`, `ralph-loop`, `planning-with-files`는 별도 skill surface로 유지한다.
@@ -1,189 +0,0 @@
1
- ---
2
- name: sdd
3
- description: "Use for any software development request in a repository that treats `sdd/` as the canonical delivery system. Trigger on requests like develop, implement, build, code, work on, modify, fix, patch, refactor, test, verify, deploy, monitor, or screen/UI-driven prompts such as 화면명세서, 화면설계서, 화면 설계, 화면, 화면 스펙, UI, 디자인, 디자인 가이드, screen spec, screen design, or design guide. The workflow is always SDD-first: inspect and update `sdd/01_planning`, create or update the task plan under `sdd/02_plan`, implement the change, record execution in `sdd/03_build`, capture validation in `sdd/03_verify`, and record deployment or monitoring in `sdd/05_operate` when rollout happens."
4
- ---
5
-
6
- # SDD Development
7
-
8
- ## Overview
9
-
10
- Use this skill for implementation work in repositories that treat `sdd/` as the canonical delivery record.
11
-
12
- This skill enforces one workflow:
13
- 1. inspect and fix relevant `sdd/01_planning` artifacts first,
14
- 2. create or update the task plan under `sdd/02_plan/<section>/`,
15
- 3. perform the code work,
16
- 4. record the current implementation summary in `sdd/03_build`,
17
- 5. record the current retained verification summary in `sdd/03_verify`,
18
- 6. record deployment and monitoring outcomes in `sdd/05_operate` when rollout happens.
19
-
20
- When rollout is explicitly in scope, and the repository has separate DEV and PROD environments, this skill enforces a staged release rule: deploy to DEV first, complete the retained full-layer validation surface there, promote to PROD only after DEV passes, then rerun the same retained validation surface in PROD. If PROD validation fails, rollback is required unless the user explicitly redirects and that risk is recorded.
21
- For persistence-affecting work, this skill also enforces schema-parity verification. Always compare migration or model intent against the real DEV and PROD schema state for the affected database objects instead of assuming deployed reality matches the code.
22
- Unless the user explicitly forbids it, durable work is not complete at code-edit state. Finish with a coherent git commit, push the retained result to the configured remote, and if the repository ships an installable package or CLI, publish the new version and verify the registry reflects it.
23
-
24
- Read [references/section-map.md](references/section-map.md) when you need the exact destination inside `sdd/`.
25
- For screen-spec-driven UI work, reusable static assets from the spec must be extracted through the repo's canonical asset builder before being used in code.
26
- For screen-spec-driven layout work, inspect the repo's canonical design guide builder first when one exists.
27
- For local screen exactness, treat the repo's Playwright exactness runner and suite registry as the canonical automation gate when they exist.
28
- For verification work, treat regression scope selection as a required retained artifact and carry it through `sdd/02_plan`, `sdd/03_build`, and `sdd/03_verify`.
29
- Do not infer rollout scope from the existence of `sdd/05_operate` alone; require rollout only when the user asks for deployment or the repo's current policy/plan makes rollout part of completion.
30
- When a repo or team treats DEV deployment from `main` as the completion bar, temporary branches or worktrees are only working space. Before calling the task deployed, land the final retained change on `main` and push `origin/main`.
31
-
32
- ## When To Use
33
-
34
- Use this skill when:
35
- - the repository has `sdd/01_planning`, `02_plan`, `03_build`, `03_verify`, `05_operate`,
36
- - the user gives a development instruction such as `개발해`, `작업해`, `구현해`, `수정해`, `고쳐`, `리팩토링해`, `테스트해`, `배포해`,
37
- - the user asks for screen/UI work with prompts such as `화면명세서`, `화면설계서`, `화면 설계`, `화면`, `화면 스펙`, `UI`, `디자인`, `디자인 가이드`, `screen spec`, `screen design`, or `design guide`,
38
- - the user wants work to be traceable through those folders,
39
- - the task includes both implementation and documentation/verification updates,
40
- - the task may end in deployment or operational follow-up.
41
-
42
- Do not use this skill for:
43
- - casual questions with no repo changes,
44
- - one-off local debugging where no durable SDD record is needed,
45
- - repositories that do not use `sdd/` as their primary document system.
46
-
47
- ## Workflow
48
-
49
- ### 1. Inspect Planning First
50
-
51
- - Identify the impacted planning area before editing code.
52
- - Open only the relevant artifacts in `sdd/01_planning`:
53
- - feature
54
- - screen
55
- - architecture
56
- - data
57
- - api
58
- - iac
59
- - integration
60
- - nonfunctional
61
- - security
62
- - test
63
- - If the implementation has already drifted from planning, update the planning artifact first or at least record the drift before coding.
64
-
65
- ### 2. Create Or Update The Plan
66
-
67
- - Create or reuse a durable plan file under `sdd/02_plan/<section>/`.
68
- - Prefer the repo's planning scaffold if available.
69
- - The plan must include:
70
- - scope
71
- - assumptions
72
- - acceptance criteria
73
- - execution checklist
74
- - current notes
75
- - validation
76
- - For any task that may end in deployment, acceptance criteria must explicitly include the DEV gate, the matching PROD gate, the retained full-layer test surface, and the rollback trigger/path.
77
- - For any task that touches persistence, models, repositories, migrations, SQL, ORM mappings, or runtime failures that may involve schema drift, acceptance criteria must explicitly include DEV/PROD schema verification.
78
- - Keep exactly one checklist item in progress.
79
-
80
- ### 3. Implement Against The Plan
81
-
82
- - Make code changes only after the impacted planning artifact and plan are aligned enough to proceed.
83
- - Update the plan current notes after meaningful edits or decisions.
84
- - When document generators or capture pipelines are involved, keep those tools under `sdd/99_toolchain`.
85
- - For local screen exactness, treat Playwright as the canonical automation gate unless the repo documents a stronger exact gate for that surface.
86
- - In repos created from this template, prefer `python3 sdd/99_toolchain/01_automation/run_playwright_exactness.py --suite <suite-id>` over ad-hoc `npx playwright test ...`.
87
- - Keep the suite registry in `sdd/99_toolchain/01_automation/playwright_exactness_manifest.py`.
88
- - Browser Use, manual screenshots, or semantic extraction can supplement diagnosis, but they do not replace the retained Playwright exactness gate when a suite exists.
89
- - If the needed suite does not exist yet, add or extend it in the same task and register it before calling the work complete.
90
- - When the task depends on icons, logos, illustrations, or other static assets visible in a screen spec, use the repo's canonical Asset Spec Builder first.
91
- - In repos created from this template, this is typically `sdd/99_toolchain/01_automation/spec_asset_builder.py` or a wrapper/manifest around it.
92
- - Reusable asset planning records belong under `sdd/01_planning/02_screen/assets/`.
93
- - Build the runtime asset from the approved PDF/image source instead of hand-tracing or screenshot-cropping it.
94
- - Use exact verification such as `--verify-exact` when the asset is expected to match the source crop exactly.
95
- - Record the source, manifest, generated asset path, and any exception in `sdd/03_build` and `sdd/03_verify`.
96
- - Only fall back to manual recreation when the builder cannot express the asset, and explicitly document that exception in the plan/build/verify trail.
97
- - When the task depends on spacing, layout density, typography, color rhythm, or component hierarchy derived from a screen spec, inspect the repo's canonical design guide builder first.
98
- - In repos created from this template, inspect `sdd/99_toolchain/01_automation/README.md` and use the actual builder, wrapper, or manifest that exists in the repo.
99
- - Use the generated guide as the working baseline before manual spacing or palette tweaks.
100
- - If the repo does not provide a design guide builder yet, document the manual interpretation source in plan/build/verify.
101
- - Define the regression surface before calling implementation complete.
102
- - Start from `sdd/02_plan/10_test/regression_verification.md`.
103
- - Identify the direct target plus any upstream, downstream, and shared surfaces affected by the change.
104
- - If the change touches shared routing, shell/auth, shared state, common components, contracts, generated assets, or builder output, widen the regression scope instead of validating only the edited module.
105
- - Record the selected regression scope and any justified exclusions in plan/build/verify.
106
- - When rollout is in scope, define one retained full-layer validation surface and reuse it in DEV and PROD.
107
- - Include the relevant app/runtime entrypoints, API/contracts, persistence/schema, jobs or workflow side effects, shared integrations, and health/monitoring checks affected by the change.
108
- - Do not promote to PROD with a narrower verification surface than the DEV gate unless the user explicitly approves that exception and it is recorded.
109
-
110
- ### 4. Record Build Summary
111
-
112
- - Record what you implemented in `sdd/03_build`.
113
- - Use:
114
- - `03_build/01_feature` for feature implementation summaries
115
- - `03_build/02_screen` for screen implementation summaries
116
- - `03_build/03_architecture`, `06_iac`, `10_test` for current-state cross-cutting summaries
117
- - Keep entries factual and current-state only: implemented scope, modules, assets, contracts, and current user-visible behavior.
118
-
119
- ### 5. Record Verification
120
-
121
- - Record retained verification status in `sdd/03_verify`.
122
- - Use:
123
- - `03_verify/01_feature` for feature verification summaries
124
- - `03_verify/02_screen` for screen verification summaries
125
- - `03_verify/03_architecture`, `06_iac`, `10_test` for current retained checks and residual risk
126
- - Never claim completion without command-level validation evidence.
127
- - For staged DEV -> PROD rollout, verification must use the same retained full-layer validation surface in both environments.
128
- - Run the full-layer validation in DEV after deployment and treat it as a hard gate before PROD promotion.
129
- - After PROD deployment, rerun the same retained validation surface in PROD.
130
- - If PROD validation fails, execute rollback or the approved recovery procedure immediately and record the failure and recovery outcome.
131
- - For persistence-affecting work, verification must include real schema evidence from both DEV and PROD when those environments exist.
132
- - Check migration state and actual runtime schema separately.
133
- - Validate the tables, columns, indexes, constraints, triggers, defaults, and any legacy compatibility objects touched by the change.
134
- - Record the commands or queries used, the environments checked, and the drift or parity result.
135
- - Regression verification is mandatory.
136
- - Verification must cover the direct surface and the retained upstream/downstream/shared surfaces selected from the regression baseline.
137
- - If no automation exists for a needed regression slice yet, run the best available manual or command checks and record that gap as current residual risk.
138
- - When a Playwright suite exists for the surface, record the canonical runner command, suite id, screenshot/json artifact paths, and any live-vs-local split explicitly.
139
-
140
- ### 6. Record Operate Outcomes
141
-
142
- - If deployment or runtime follow-up happens, update `sdd/05_operate`.
143
- - Use:
144
- - `05_operate/01_runbooks` for durable operating procedure changes
145
- - `05_operate/02_delivery_status` for the current live state and monitoring baseline
146
- - Record:
147
- - what was deployed
148
- - which live baseline is current
149
- - how it is monitored
150
- - any current residual risk
151
- - For staged DEV -> PROD rollout, record the DEV gate, PROD gate, and any rollback outcome explicitly.
152
- - When the DEV deployment baseline is tied to `main`, do not treat a side-branch push as sufficient. Merge, cherry-pick, or otherwise replay the final change onto `main`, push `origin/main`, then record the deployment evidence against that `main` baseline.
153
-
154
- ## Guardrails
155
-
156
- - Do not create or repopulate a parallel `docs/` tree when `sdd/` exists.
157
- - Do not skip planning review just because the code change looks small.
158
- - Do not leave build, verify, or operate evidence only in chat text when it should live in `sdd/`.
159
- - Do not stop after local edits when durable changes remain; commit and push are the default completion bar unless the user explicitly forbids them.
160
- - Do not leave a publishable package or CLI unpublished after changing shipped behavior or instructions unless the user explicitly forbids publish.
161
- - When PROD rollout is in scope, do not promote to PROD before the retained full-layer DEV validation surface has passed.
162
- - When PROD rollout is in scope, do not use a weaker PROD validation surface than the one that gated DEV unless the user explicitly approves and that risk is recorded.
163
- - When PROD rollout is in scope, do not stop at "PROD deployment succeeded"; post-deploy PROD validation is mandatory.
164
- - When PROD rollout is in scope, do not leave a failed PROD deployment unreconciled; rollback or the approved recovery procedure must be executed and recorded.
165
- - Do not assume local tests, migration heads, or current model code prove deployed schema parity.
166
- - Do not skip DEV/PROD schema inspection for persistence-affecting work when schema drift could influence behavior.
167
- - Do not manually redraw screen-spec static assets when a canonical Asset Spec Builder exists for the repo; extract them first and use the generated asset.
168
- - Do not skip a relevant screen automation builder just because the requested UI change looks like a small manual tweak.
169
- - Do not stop verification at the edited file, route, or screen when the change can affect shared or adjacent behavior.
170
- - Do not omit regression scope selection from the retained SDD trail.
171
- - Do not update `05_operate` for tasks that never reached deployment; explicitly note that rollout did not happen instead.
172
- - Do not call a DEV rollout complete from a temporary branch when the repo or team baseline expects the deployed change to be on `origin/main`.
173
-
174
- ## Output Standard
175
-
176
- By the end of an implementation task, the expected trail is:
177
- - planning artifact reviewed or corrected,
178
- - plan file updated,
179
- - build summary written,
180
- - verification summary written, including selected regression scope and residual risk,
181
- - operate status updated if rollout occurred,
182
- - coherent git commit created and pushed,
183
- - if the repository ships a publishable package or CLI, registry publish completed and the latest published version verified, unless the user explicitly forbade it.
184
-
185
- When PROD rollout is in scope, the retained completion state also requires:
186
- - DEV deployment happened first and the retained full-layer DEV validation surface passed,
187
- - the same retained full-layer validation surface was executed again in PROD,
188
- - DEV/PROD schema state was checked and recorded when schema could influence behavior,
189
- - any PROD validation failure produced rollback or recovery evidence in verify/operate.
@@ -1,4 +0,0 @@
1
- interface:
2
- display_name: "SDD Development"
3
- short_description: "Use SDD-first flow with schema parity, regression scope, and staged rollout gates"
4
- default_prompt: "Use $sdd to handle this development task through sdd planning, build, verify, and operate, including regression scope selection, schema parity checks for persistence-affecting work, and staged DEV-first validation when multiple environments exist."
@@ -1,67 +0,0 @@
1
- # SDD Section Map
2
-
3
- ## Planning
4
-
5
- - `sdd/01_planning/01_feature`
6
- - domain or service feature specifications
7
- - `sdd/01_planning/02_screen`
8
- - service-level screen specifications and PDFs
9
- - `sdd/01_planning/03_architecture`
10
- - bounded context, runtime, and structural design
11
- - `sdd/01_planning/04_data`
12
- - data model and relationship definitions
13
- - `sdd/01_planning/05_api`
14
- - transport contracts and API definitions
15
- - `sdd/01_planning/06_iac`
16
- - infrastructure planning and deployment design
17
- - `sdd/01_planning/07_integration`
18
- - integration contracts and external dependency planning
19
- - `sdd/01_planning/08_nonfunctional`
20
- - performance, reliability, scalability, and operational constraints
21
- - `sdd/01_planning/09_security`
22
- - security posture, threat model, and control planning
23
- - `sdd/01_planning/10_test`
24
- - test strategy and planned cases
25
-
26
- ## Plan
27
-
28
- - `sdd/02_plan/<section>`
29
- - executable plan files and migration backlogs
30
-
31
- ## Build
32
-
33
- - `sdd/03_build/01_feature`
34
- - feature implementation summaries
35
- - `sdd/03_build/02_screen`
36
- - screen implementation summaries
37
- - `sdd/03_build/03_architecture`
38
- - structural and governance implementation summaries
39
- - `sdd/03_build/06_iac`
40
- - current delivery/runtime implementation summaries
41
- - `sdd/03_build/10_test`
42
- - current harness and validation implementation summaries
43
-
44
- ## Verify
45
-
46
- - `sdd/03_verify/01_feature`
47
- - feature verification summaries
48
- - `sdd/03_verify/02_screen`
49
- - screen verification summaries
50
- - `sdd/03_verify/03_architecture`
51
- - governance and structure verification summaries
52
- - `sdd/03_verify/06_iac`
53
- - delivery/runtime verification summaries
54
- - `sdd/03_verify/10_test`
55
- - current harness outputs and retained validation references
56
-
57
- ## Operate
58
-
59
- - `sdd/05_operate/01_runbooks`
60
- - durable operating procedures
61
- - `sdd/05_operate/02_delivery_status`
62
- - current live state, monitoring baseline, and residual risk
63
-
64
- ## Tooling
65
-
66
- - `sdd/99_toolchain`
67
- - generators, capture tooling, manifests, and other SDD automation