waypoint-codex 1.0.14 → 1.0.16

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (39) hide show
  1. package/package.json +1 -1
  2. package/templates/.agents/skills/collapse-fragmented-modules/SKILL.md +31 -52
  3. package/templates/.agents/skills/collapse-fragmented-modules/agents/openai.yaml +4 -0
  4. package/templates/.agents/skills/edit-at-the-right-layer/SKILL.md +24 -17
  5. package/templates/.agents/skills/edit-at-the-right-layer/agents/openai.yaml +2 -2
  6. package/templates/.agents/skills/execution-reset/SKILL.md +68 -31
  7. package/templates/.agents/skills/execution-reset/agents/openai.yaml +2 -2
  8. package/templates/.agents/skills/find-duplicate-ownership/SKILL.md +120 -0
  9. package/templates/.agents/skills/find-duplicate-ownership/agents/openai.yaml +0 -0
  10. package/templates/.agents/skills/find-duplicate-ownership/references/audit-prompts.md +89 -0
  11. package/templates/.agents/skills/foundational-redesign/SKILL.md +18 -13
  12. package/templates/.agents/skills/foundational-redesign/agents/openai.yaml +2 -2
  13. package/templates/.agents/skills/hard-cut/SKILL.md +78 -0
  14. package/templates/.agents/skills/hard-cut/agents/openai.yaml +4 -0
  15. package/templates/.agents/skills/legibility-pass/SKILL.md +30 -26
  16. package/templates/.agents/skills/legibility-pass/agents/openai.yaml +2 -2
  17. package/templates/.agents/skills/make-invariants-explicit/SKILL.md +57 -26
  18. package/templates/.agents/skills/make-invariants-explicit/agents/openai.yaml +2 -2
  19. package/templates/.agents/skills/plan-start/SKILL.md +65 -28
  20. package/templates/.agents/skills/plan-start/agents/openai.yaml +4 -0
  21. package/templates/.agents/skills/plan-swarm-audit/SKILL.md +50 -6
  22. package/templates/.agents/skills/plan-swarm-audit/agents/openai.yaml +2 -2
  23. package/templates/.agents/skills/planning/SKILL.md +115 -62
  24. package/templates/.agents/skills/planning/agents/openai.yaml +2 -2
  25. package/templates/.agents/skills/replace-dont-layer/SKILL.md +68 -22
  26. package/templates/.agents/skills/replace-dont-layer/agents/openai.yaml +4 -0
  27. package/templates/.agents/skills/root-cause-finder/SKILL.md +70 -0
  28. package/templates/.agents/skills/root-cause-finder/agents/openai.yaml +0 -0
  29. package/templates/.agents/skills/test-writing/SKILL.md +53 -39
  30. package/templates/.agents/skills/test-writing/agents/openai.yaml +2 -2
  31. package/templates/.agents/skills/verify-codebase-coherence/SKILL.md +26 -27
  32. package/templates/.agents/skills/verify-codebase-coherence/agents/openai.yaml +3 -3
  33. package/templates/.agents/skills/verify-completeness/SKILL.md +38 -27
  34. package/templates/.agents/skills/verify-completeness/agents/openai.yaml +2 -2
  35. package/templates/.codex/agents/duplicate_ownership_explorer.toml +17 -0
  36. package/templates/.codex/agents/ownership_taxonomy_mapper.toml +16 -0
  37. package/templates/.codex/agents/ssot_judge.toml +17 -0
  38. package/templates/.codex/config.toml +12 -0
  39. package/templates/managed-agents-block.md +1 -0
@@ -1,36 +1,35 @@
1
1
  ---
2
2
  name: verify-codebase-coherence
3
- description: Verify that completed work fits the existing codebase instead of introducing unnecessary parallel patterns. Use after implementation within a defined scope to detect avoidable new components, utilities, abstractions, state paths, design patterns, or conventions that should have reused or extended existing ones. Correct the work so it integrates coherently with the repo's existing architecture, components, naming, contracts, and design language.
3
+ description: Audit completed work in a defined scope for codebase coherence before handoff. Use after implementation to verify the change reuses existing components, utilities, abstractions, state paths, naming, contracts, and design language instead of introducing avoidable parallel patterns. Do not use for redesign, replacement, collapse, or other implementation tasks that belong to foundational/edit-layer skills.
4
4
  ---
5
5
 
6
- Review the completed work in the requested scope and check whether it fits the existing codebase.
6
+ # Verify Codebase Coherence
7
7
 
8
- Look for unnecessary parallel patterns such as:
9
- - new frontend components where an existing component should have been reused or extended
10
- - new helpers, hooks, utilities, or adapters that duplicate an existing pattern
11
- - new state paths or data flows that bypass the established architecture
12
- - new naming, file structure, or API shapes that do not match nearby conventions
13
- - one-off design, styling, or interaction patterns that do not fit the app
14
- - local abstractions that solve a problem the codebase already has a standard way to solve
8
+ ## Mission
9
+ Audit the finished change for coherence with the existing codebase and report whether it is ready for closeout.
15
10
 
16
- Before keeping a new construct, check whether the repo already has:
17
- - a reusable component or composition pattern
18
- - an established state or data-fetching pattern
19
- - a standard boundary for validation, formatting, permissions, or persistence
20
- - an existing utility or shared contract
21
- - a nearby feature that should be extended instead of bypassed
11
+ ## Ordered Workflow
12
+ 1. Confirm the requested scope and the files actually changed by the implementation.
13
+ 2. Inspect the changed code in context of nearby code, shared helpers, and adjacent conventions.
14
+ 3. Check for avoidable parallel patterns: duplicate components, helpers, hooks, adapters, state paths, naming, API shapes, styling, or local abstractions.
15
+ 4. Check whether the change should have reused an existing component, utility, boundary, or composition pattern instead of introducing a new one.
16
+ 5. Classify each issue as either a coherence finding, a deliberate divergence, or out of scope.
17
+ 6. Decide closeout status: pass only if no unresolved coherence findings remain.
18
+ 7. Report findings with enough detail for the owner to act on them.
22
19
 
23
- If the work introduced a parallel pattern without a clear reason, fix it. Do not just report it.
20
+ ## Rules
21
+ - Do not edit files.
22
+ - Do not recommend a redesign, replacement, collapse, or refactor as a substitute for this audit.
23
+ - Do not accept a new component, utility, hook, adapter, state path, or API shape if an existing one already covers the same job.
24
+ - Do not treat faster implementation as a valid reason to fork the architecture, data flow, or design language.
25
+ - Do not expand the review beyond the requested scope unless a change in that scope creates a direct coherence issue outside it.
26
+ - Do not mark a deliberate divergence as a finding when the repo already documents or consistently uses that variant.
24
27
 
25
- When correcting violations:
26
- - reuse or extend existing components, utilities, and patterns where appropriate
27
- - remove unnecessary one-off abstractions or duplicate paths
28
- - align naming, structure, and interfaces with nearby code
29
- - preserve intended behavior unless the user asked for a behavioral change
28
+ ## Exception Rule
29
+ If the codebase already has a sanctioned local variant, feature flag boundary, or documented exception that justifies the divergence, classify it as accepted and do not report it as a coherence defect.
30
30
 
31
- Rules:
32
- - Do not create a new component, utility, hook, adapter, or pattern if the repo already has one that should be reused or extended.
33
- - Do not fork the design language or architecture for a local feature without a clear reason.
34
- - Do not bypass established patterns just because creating a new path is faster.
35
- - Prefer extending the existing system over creating a parallel mini-system.
36
- - If divergence is necessary, it must be justified by a real requirement, not convenience.
31
+ ## Output Contract
32
+ - Start with `PASS` or `FAIL`.
33
+ - If `FAIL`, list each finding with file path, concise reason, and the specific reuse or alignment that should have happened.
34
+ - If `PASS`, state that the audited scope is coherent and closeout-ready.
35
+ - Include no code changes, no patch plan, and no redesign proposal.
@@ -1,4 +1,4 @@
1
1
  interface:
2
- display_name: "Verify Codebase Coherence"
3
- short_description: "Check architectural and structural coherence"
4
- default_prompt: "Use $verify-codebase-coherence to audit the current scope for architectural coherence, boundary consistency, duplication, and drift before final handoff."
2
+ display_name: "Verify Codebase Coherence Audit"
3
+ short_description: "Audit completed work for coherence and drift"
4
+ default_prompt: "Use $verify-codebase-coherence to audit the completed scope for codebase coherence, duplication, boundary consistency, and convention drift. Report findings only and do not change files."
@@ -1,52 +1,63 @@
1
1
  ---
2
2
  name: verify-completeness
3
- description: Use when implementation appears done and before reporting completion. Re-read the original plan and agreed scope, re-read files that were supposed to be created or changed, verify no approved scope was reduced or skipped, and continue working until the scope is truly complete.
3
+ description: Use when implementation appears done and before reporting completion. Re-read the approved plan and final scope, verify every in-scope file and checkpoint, and only then decide whether work can be reported complete.
4
4
  ---
5
5
 
6
6
  # Verify Completeness
7
7
 
8
- Use this skill at final closeout, right before you would report the work complete.
8
+ Use this skill at final closeout, right before you would report work complete. Its job is to gate completion, not to re-open the whole project.
9
9
 
10
- ## Required verification loop
10
+ ## Rules
11
11
 
12
- 1. Re-read the original plan and the latest agreed scope before deciding status.
13
- 2. Re-read `ACTIVE_PLANS.md` and `WORKSPACE.md` for current checklist, phase, blockers, and verification state.
14
- 3. Build the expected file set from plan/scope: files that were supposed to be created, modified, or deleted.
15
- 4. Re-read those files directly. This final re-read is mandatory even if they were read earlier in the session.
16
- 5. Compare expected scope vs actual outcome and list any missing or partially completed items.
17
- 6. Run a scope-discipline pass: identify additions that were not requested or approved. Remove/simplify them before completion, or explicitly ask the user to approve keeping them.
18
- 7. Run a cleanup pass on changed files: remove duplicated logic, unnecessary abstractions/files, and low-value comments that create maintenance bloat.
19
- 8. If changed code is still hard to read or reason about, run `legibility-pass` before completion and apply the resulting readability cleanup.
20
- 9. Run a file-footprint sanity pass: collapse avoidable tiny-file fragmentation and keep code that changes together in the same place when boundary/reuse/size reasons are weak.
21
- 10. Run a test-signal sanity pass: remove redundant or brittle tests and keep the smallest high-signal set that still protects the contract.
22
- 11. Before commit/final handoff, run the full checks required by the plan (for example full typecheck/test/build sweep) once, unless explicitly blocked or the user asks for a different cadence.
23
- 12. If any approved item is missing, incomplete, or silently deferred, do not report completion. Continue working until the agreed scope is fully satisfied or discuss a scope change explicitly.
12
+ 1. Re-read the approved plan and the latest agreed scope before deciding status.
13
+ 2. Re-read `ACTIVE_PLANS.md` and `WORKSPACE.md` for the current checklist, phase, blockers, and verification state.
14
+ 3. Build the expected file set from the approved scope only: files that were supposed to be created, modified, or deleted.
15
+ 4. Re-read every file in the expected set directly. This final re-read is mandatory even if the file was read earlier in the session.
16
+ 5. Compare expected scope vs actual outcome and identify any missing, partial, or silently deferred items.
17
+ 6. Run required plan checkpoints at the required cadence, including the full pre-commit checks when the plan requires them, unless a bounded exception applies.
18
+ 7. Do not report completion if any approved item is missing, incomplete, or deferred without explicit approval.
19
+ 8. Do not keep unapproved additions, cleanup work, refactors, abstractions, file splits, or test pruning in this skill's core scope; treat them as separate decisions that require explicit approval unless they are needed to finish the approved scope.
20
+ 9. If changed code is still hard to read or reason about, run `legibility-pass` and apply only the readability cleanup required to finish the approved scope.
21
+ 10. Keep adjacent skills conditional and narrow: use them only when the verification pass exposes that specific need, not as part of the default completion gate.
24
22
 
25
- ## Completion gate
23
+ ## Exception Rule
24
+
25
+ You may relax the normal verification loop only when one of these is true:
26
+
27
+ - required plan artifacts are missing or stale, and you need to reconstruct the approved scope before continuing
28
+ - the task is read-only or review-only, so no code or files are expected to change
29
+ - required checks cannot run because the environment, dependencies, permissions, or upstream blockers make them impossible right now
30
+
31
+ In these cases, continue only far enough to identify the gap, record the blocker, and report the exact missing verification step or artifact. Do not use the exception to absorb cleanup, refactor, or scope expansion work.
32
+
33
+ ## Completion Gate
26
34
 
27
35
  You can report complete only when all are true:
28
36
 
29
37
  - approved scope items are done
30
38
  - planned file changes match reality
31
- - verification/checkpoints required by the plan were run at the required cadence, including full pre-commit checks when required (or explicitly called out as blocked)
39
+ - required verification/checkpoints were run, or each skipped check has a specific blocked reason
32
40
  - no hidden scope reduction occurred
33
41
  - no unapproved scope expansion remains
34
42
  - no obvious duplication or avoidable bloat remains in touched files
35
43
  - no avoidable file fragmentation remains in touched feature areas
36
44
  - test set remains high-signal and non-redundant for the risk level
37
45
 
38
- ## Output contract
46
+ ## Output Contract
47
+
48
+ Before final status, report these items explicitly:
39
49
 
40
- Before final status, summarize briefly:
50
+ - `status`: `complete`, `blocked`, or `incomplete`
51
+ - `scope reviewed`: the plan/scope sources you re-read
52
+ - `files re-read`: the files you re-opened for final verification
53
+ - `missing scope items`: any approved items still absent, or `none`
54
+ - `checks run`: each verification step actually executed
55
+ - `checks skipped`: each omitted check with a reason, or `none`
56
+ - `removed extras`: any unapproved extras, cleanup, or bloat you removed, or `none`
57
+ - `adjacent skill escalation`: any conditional skill you invoked and why, or `none`
58
+ - `next action`: continue execution, request scope approval, or complete
41
59
 
42
- - scope reviewed
43
- - files re-read for final verification
44
- - completed items
45
- - removed unapproved extras or bloat cleanup applied
46
- - legibility cleanup applied (if run)
47
- - file-collapsing or test-pruning done during sanity passes
48
- - remaining gaps (if any)
49
- - next action (continue execution or complete)
60
+ Do not say the work is complete unless the `status` is `complete` and the completion gate is satisfied.
50
61
 
51
62
  ## Gotchas
52
63
 
@@ -1,4 +1,4 @@
1
1
  interface:
2
2
  display_name: "Verify Completeness"
3
- short_description: "Run a strict final scope and file verification pass"
4
- default_prompt: "Use $verify-completeness now: re-read the approved plan and scope, re-read all files that were supposed to change, remove unapproved extras and obvious bloat, verify nothing was dropped, and keep working if any approved scope item is still incomplete."
3
+ short_description: "Gate completion by re-reading scope, files, and required checks before closeout"
4
+ default_prompt: "Use $verify-completeness now: re-read the approved plan and final scope, re-read every file that was supposed to change, confirm missing scope items and skipped checks with reasons, and only report completion if the approved scope is fully finished."
@@ -0,0 +1,17 @@
1
+ name = "duplicate_ownership_explorer"
2
+ description = "Read-only explorer for one bounded slice of duplicate ownership. Use one agent per feature or contract slice."
3
+ model = "gpt-5.3-codex"
4
+ model_reasoning_effort = "medium"
5
+ sandbox_mode = "read-only"
6
+ nickname_candidates = ["Slice", "Scout", "Trace"]
7
+ developer_instructions = """
8
+ Own one narrow slice only.
9
+ Look for duplicate ownership of rules such as validation, defaults, canonicalization, mapping, repair, persistence policy, and helper semantics.
10
+ For each candidate, decide whether it is:
11
+ - architecture / SSOT bug
12
+ - local dedupe cleanup
13
+ - legitimate boundary adapter
14
+ - legitimate domain constraint
15
+ Return exact files and symbols.
16
+ Do not recommend wrappers, shims, or fallback paths.
17
+ """
@@ -0,0 +1,16 @@
1
+ name = "ownership_taxonomy_mapper"
2
+ description = "Read-only mapper for duplicate-ownership audits. Use first to identify likely SSOT conflicts, ownership boundaries, and exploration slices before deeper review."
3
+ model = "gpt-5.3-codex"
4
+ model_reasoning_effort = "medium"
5
+ sandbox_mode = "read-only"
6
+ nickname_candidates = ["Mapper", "Topo", "Surveyor"]
7
+ developer_instructions = """
8
+ Stay in exploration mode.
9
+ Map ownership boundaries, not fixes.
10
+ Find likely places where the same rule is owned twice.
11
+ Return:
12
+ - candidate taxonomy
13
+ - likely hot spots
14
+ - recommended slice boundaries for parallel follow-up
15
+ Do not propose compatibility shims or code changes unless the parent asks.
16
+ """
@@ -0,0 +1,17 @@
1
+ name = "ssot_judge"
2
+ description = "Strict read-only judge for duplicate-ownership findings. Use after exploration to decide the winning owner and hard-cut cleanup."
3
+ model = "gpt-5.3-codex"
4
+ model_reasoning_effort = "high"
5
+ sandbox_mode = "read-only"
6
+ nickname_candidates = ["Judge", "Owner", "Verdict"]
7
+ developer_instructions = """
8
+ Act like an architecture owner.
9
+ Given candidate duplicate-ownership findings, decide:
10
+ - is this real duplicate ownership or legitimate boundary work
11
+ - who should be the single owner
12
+ - what should be deleted
13
+ - what should remain
14
+ - what should be renamed for honest semantics
15
+ Bias toward hard-cut cleanup.
16
+ Reject mediator layers, wrappers, compatibility paths, and dual ownership.
17
+ """
@@ -16,3 +16,15 @@ config_file = "agents/code-reviewer.toml"
16
16
  [agents."plan-reviewer"]
17
17
  description = "Read-only plan validator that checks whether a proposed implementation plan is complete, feasible, and safe to execute."
18
18
  config_file = "agents/plan-reviewer.toml"
19
+
20
+ [agents."ssot_judge"]
21
+ description = "Strict read-only judge for duplicate-ownership findings that selects the canonical owner and hard-cut cleanup."
22
+ config_file = "agents/ssot_judge.toml"
23
+
24
+ [agents."ownership_taxonomy_mapper"]
25
+ description = "Read-only mapper that identifies ownership boundaries and high-risk SSOT duplicate-ownership slices before deeper audits."
26
+ config_file = "agents/ownership_taxonomy_mapper.toml"
27
+
28
+ [agents."duplicate_ownership_explorer"]
29
+ description = "Read-only slice explorer that audits one bounded area for duplicate ownership and classifies findings with file-level evidence."
30
+ config_file = "agents/duplicate_ownership_explorer.toml"
@@ -37,6 +37,7 @@ Once the user approves a plan or tells you to proceed, that approved scope is th
37
37
 
38
38
  `WORKSPACE.md` is the live state file. `ACTIVE_PLANS.md` is the active execution checklist. Keep them current when state, blockers, or verification materially change.
39
39
  When durable behavior changes, update the relevant docs during the work. When live execution state changes, update `WORKSPACE.md` or `ACTIVE_PLANS.md` during the work, not only at the end.
40
+ When creating or updating routable docs in `.waypoint/docs/` or `.waypoint/plans/`, include valid YAML frontmatter (`summary`, `last_updated`, `read_when`) so `.waypoint/DOCS_INDEX.md` can parse and route them.
40
41
 
41
42
  When changing code, do not hesitate to aggressively delete legacy code and rebuild the system when that is the clearest path to accomplishing the goal. Prefer clean replacement over compatibility scaffolding unless the user or project docs explicitly require coexistence.
42
43
  Do not widen a local change into a broader rewrite unless the current structure directly blocks the approved change or the user approves the expansion.