npm - @bastani/atomic - Versions diffs - 0.8.28 → 0.8.29-alpha.3 - Mend

@bastani/atomic 0.8.28 → 0.8.29-alpha.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (145)

package/CHANGELOG.md +37 -0
package/dist/builtin/cursor/CHANGELOG.md +27 -0
package/dist/builtin/cursor/LICENSE +26 -0
package/dist/builtin/cursor/README.md +22 -0
package/dist/builtin/cursor/index.ts +9 -0
package/dist/builtin/cursor/package.json +46 -0
package/dist/builtin/cursor/src/auth.ts +352 -0
package/dist/builtin/cursor/src/catalog-cache.ts +155 -0
package/dist/builtin/cursor/src/config.ts +123 -0
package/dist/builtin/cursor/src/conversation-state.ts +135 -0
package/dist/builtin/cursor/src/cursor-models-raw.json +583 -0
package/dist/builtin/cursor/src/model-mapper.ts +270 -0
package/dist/builtin/cursor/src/models.ts +54 -0
package/dist/builtin/cursor/src/native-loader.ts +71 -0
package/dist/builtin/cursor/src/proto/README.md +34 -0
package/dist/builtin/cursor/src/proto/agent_pb.ts +15294 -0
package/dist/builtin/cursor/src/proto/protobuf-codec.ts +717 -0
package/dist/builtin/cursor/src/provider.ts +301 -0
package/dist/builtin/cursor/src/stream.ts +564 -0
package/dist/builtin/cursor/src/transport.ts +791 -0
package/dist/builtin/intercom/CHANGELOG.md +4 -0
package/dist/builtin/intercom/package.json +2 -2
package/dist/builtin/intercom/skills/intercom/SKILL.md +5 -5
package/dist/builtin/mcp/CHANGELOG.md +4 -0
package/dist/builtin/mcp/package.json +3 -3
package/dist/builtin/subagents/CHANGELOG.md +13 -0
package/dist/builtin/subagents/README.md +7 -3
package/dist/builtin/subagents/agents/codebase-online-researcher.md +9 -24
package/dist/builtin/subagents/agents/debugger.md +3 -5
package/dist/builtin/subagents/package.json +4 -4
package/dist/builtin/subagents/src/runs/background/subagent-runner.ts +2 -1
package/dist/builtin/subagents/src/runs/foreground/execution.ts +2 -1
package/dist/builtin/subagents/src/runs/shared/parallel-utils.ts +1 -0
package/dist/builtin/subagents/src/runs/shared/pi-args.ts +19 -2
package/dist/builtin/subagents/src/runs/shared/structured-output.ts +271 -10
package/dist/builtin/subagents/src/runs/shared/subagent-prompt-runtime.ts +12 -39
package/dist/builtin/subagents/src/shared/types.ts +5 -3
package/dist/builtin/subagents/src/shared/utils.ts +50 -10
package/dist/builtin/subagents/src/slash/saved-chain-mapping.ts +77 -0
package/dist/builtin/subagents/src/slash/slash-commands.ts +1 -55
package/dist/builtin/web-access/CHANGELOG.md +5 -1
package/dist/builtin/web-access/README.md +1 -1
package/dist/builtin/web-access/github-extract.ts +1 -1
package/dist/builtin/web-access/package.json +3 -3
package/dist/builtin/workflows/CHANGELOG.md +26 -0
package/dist/builtin/workflows/README.md +28 -8
package/dist/builtin/workflows/builtin/deep-research-codebase.ts +9 -49
package/dist/builtin/workflows/builtin/goal.ts +63 -106
package/dist/builtin/workflows/builtin/index.d.ts +2 -0
package/dist/builtin/workflows/builtin/open-claude-design.ts +31 -76
package/dist/builtin/workflows/builtin/ralph.d.ts +2 -0
package/dist/builtin/workflows/builtin/ralph.ts +227 -518
package/dist/builtin/workflows/builtin/shared-prompts.ts +7 -0
package/dist/builtin/workflows/package.json +2 -2
package/dist/builtin/workflows/skills/research-codebase/SKILL.md +17 -3
package/dist/builtin/workflows/src/extension/wiring.ts +72 -9
package/dist/builtin/workflows/src/extension/workflow-schema.ts +34 -0
package/dist/builtin/workflows/src/runs/foreground/executor.ts +13 -2
package/dist/builtin/workflows/src/runs/foreground/stage-runner.ts +86 -14
package/dist/builtin/workflows/src/shared/authoring-contract.d.ts +11 -3
package/dist/builtin/workflows/src/shared/types.ts +8 -4
package/dist/builtin/workflows/src/tui/overlay-adapter.ts +64 -2
package/dist/builtin/workflows/src/tui/workflow-attach-pane.ts +8 -8
package/dist/builtin/workflows/src/tui/workflow-status.ts +2 -0
package/dist/core/atomic-guide-command.d.ts.map +1 -1
package/dist/core/atomic-guide-command.js +7 -7
package/dist/core/atomic-guide-command.js.map +1 -1
package/dist/core/builtin-packages.d.ts.map +1 -1
package/dist/core/builtin-packages.js +6 -0
package/dist/core/builtin-packages.js.map +1 -1
package/dist/core/extensions/index.d.ts +1 -1
package/dist/core/extensions/index.d.ts.map +1 -1
package/dist/core/extensions/index.js.map +1 -1
package/dist/core/extensions/types.d.ts +20 -0
package/dist/core/extensions/types.d.ts.map +1 -1
package/dist/core/extensions/types.js.map +1 -1
package/dist/core/model-resolver.d.ts +1 -0
package/dist/core/model-resolver.d.ts.map +1 -1
package/dist/core/model-resolver.js +17 -8
package/dist/core/model-resolver.js.map +1 -1
package/dist/core/package-manager.d.ts +11 -9
package/dist/core/package-manager.d.ts.map +1 -1
package/dist/core/package-manager.js +55 -10
package/dist/core/package-manager.js.map +1 -1
package/dist/core/project-trust.d.ts +1 -0
package/dist/core/project-trust.d.ts.map +1 -1
package/dist/core/project-trust.js +3 -3
package/dist/core/project-trust.js.map +1 -1
package/dist/core/resource-loader.d.ts +11 -2
package/dist/core/resource-loader.d.ts.map +1 -1
package/dist/core/resource-loader.js +72 -9
package/dist/core/resource-loader.js.map +1 -1
package/dist/core/sdk.d.ts +3 -3
package/dist/core/sdk.d.ts.map +1 -1
package/dist/core/sdk.js +5 -5
package/dist/core/sdk.js.map +1 -1
package/dist/core/tools/index.d.ts +1 -0
package/dist/core/tools/index.d.ts.map +1 -1
package/dist/core/tools/index.js +1 -0
package/dist/core/tools/index.js.map +1 -1
package/dist/core/tools/structured-output.d.ts +39 -0
package/dist/core/tools/structured-output.d.ts.map +1 -0
package/dist/core/tools/structured-output.js +141 -0
package/dist/core/tools/structured-output.js.map +1 -0
package/dist/index.d.ts +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +1 -1
package/dist/index.js.map +1 -1
package/dist/main.d.ts.map +1 -1
package/dist/main.js +36 -14
package/dist/main.js.map +1 -1
package/dist/modes/interactive/components/login-dialog.d.ts +3 -0
package/dist/modes/interactive/components/login-dialog.d.ts.map +1 -1
package/dist/modes/interactive/components/login-dialog.js +16 -0
package/dist/modes/interactive/components/login-dialog.js.map +1 -1
package/dist/modes/interactive/interactive-mode.d.ts +11 -0
package/dist/modes/interactive/interactive-mode.d.ts.map +1 -1
package/dist/modes/interactive/interactive-mode.js +158 -11
package/dist/modes/interactive/interactive-mode.js.map +1 -1
package/dist/modes/print-mode.d.ts.map +1 -1
package/dist/modes/print-mode.js +39 -0
package/dist/modes/print-mode.js.map +1 -1
package/docs/custom-provider.md +1 -0
package/docs/extensions.md +2 -2
package/docs/models.md +2 -0
package/docs/packages.md +3 -1
package/docs/providers.md +15 -0
package/docs/quickstart.md +3 -3
package/docs/sdk.md +61 -0
package/docs/security.md +1 -1
package/docs/subagents.md +21 -0
package/docs/usage.md +2 -0
package/docs/workflows.md +28 -21
package/examples/extensions/README.md +1 -1
package/examples/extensions/custom-provider-anthropic/package-lock.json +2 -2
package/examples/extensions/custom-provider-anthropic/package.json +1 -1
package/examples/extensions/custom-provider-gitlab-duo/package.json +1 -1
package/examples/extensions/gondolin/package-lock.json +2 -2
package/examples/extensions/gondolin/package.json +1 -1
package/examples/extensions/sandbox/package-lock.json +2 -2
package/examples/extensions/sandbox/package.json +1 -1
package/examples/extensions/structured-output.ts +22 -53
package/examples/extensions/with-deps/package-lock.json +2 -2
package/examples/extensions/with-deps/package.json +1 -1
package/package.json +12 -9

package/docs/workflows.md CHANGED

@@ -9,7 +9,7 @@ Use a workflow when a task should be repeatable, inspectable, resumable, or spli
 **Key capabilities:**
 - **Tracked stages** - Name each step and inspect it in workflow status and graph views
 - **Parallel branches** - Run independent research, review, or implementation branches concurrently
-- **Context handoffs** - Pass summaries, artifacts, files, and structured outputs between stages
+- **Context handoffs** - Pass summaries, artifacts, files, and schema-backed structured results between stages
 - **Human input** - Pause for `ctx.ui.input`, `confirm`, `select`, `editor`, or custom TUI widget decisions during a run
 - **Resumable control** - Interrupt, pause, resume, attach to, or kill workflow runs
 - **Artifacts** - Save large outputs to files instead of pushing everything through model context
@@ -153,7 +153,7 @@ For the builtin result tables below, `deep-research-codebase`, `goal`, and `ralp
 |---|---|---|
 | `deep-research-codebase` | Scout + research-history chain → parallel specialist waves → aggregator. Indexes the whole repo and synthesizes findings. | Broad or cross-cutting research before you decide what to change. Prefer `/skill:research-codebase` for one subsystem. |
 | `goal` | Persisted goal ledger → bounded worker turns → receipts → three-reviewer gate → deterministic reducer → final report. | Small-to-medium scope changes when you can identify the work surface, state the exact outcome, and name the validation that proves it is done — for example tests, lint/typecheck, docs builds, or observable behavior. |
-| `ralph` | RFC planning → sub-agent orchestration → simplification → parallel review → optional final-stage PR handoff. | Larger migrations, broad refactors, multi-package changes, and spec-to-reviewed-change work where you want Atomic to plan the approach, delegate implementation through sub-agents, simplify, review, iterate, and optionally allow only the final `pull-request` stage to attempt PR creation with `create_pr=true`. |
+| `ralph` | Prompt-engineering → codebase/online research → sub-agent orchestration → parallel review → optional final-stage PR handoff. | Larger migrations, broad refactors, and multi-package changes where you want Atomic to transform the prompt into a research question, research the codebase before implementing, delegate through sub-agents, review, iterate, and optionally allow only the final `pull-request` stage to attempt PR creation with `create_pr=true`. |
 | `open-claude-design` | Design-system onboarding → reference import → HTML generation → impeccable-driven refinement → quality gate → rich HTML handoff. Renders a live `preview.html` you can iterate against (opens through `browser` when available). | UI, page, component, theme, or design-token work that benefits from generation + critique loops. |
 ### `deep-research-codebase`
@@ -224,7 +224,7 @@ Run examples:
 Write the `objective` like a compact acceptance spec. Say what should exist when the run is done, how you want testing handled, which command(s) or manual checks matter, and what outcome proves completion. The workflow is intentionally lean: it does not first generate an RFC or migration plan, so the developer-supplied objective is where scope, validation, and completion criteria belong.
-The worker may claim readiness, but it cannot finalize completion. Three reviewers independently inspect the ledger, worker receipt, repository state, and diff against `base_branch`; each returns structured JSON with findings, evidence, verification still remaining, and an optional blocker. A TypeScript reducer marks the goal complete only when reviewer quorum approves, marks blocked only when the same dependency/tool blocker repeats for the blocker threshold, continues when evidence is missing, and returns `needs_human` when `max_turns` is exhausted or worker execution fails.
+The worker may claim readiness, but it cannot finalize completion. Workers and reviewers are prompted to verify user-visible behavior end-to-end when practical, using browser-skilled subagents for web/frontend flows that may depend on backend/API behavior and tmux-skilled subagents for TUI or terminal-app scenarios. Three reviewers independently inspect the ledger, worker receipt, repository state, and diff against `base_branch`; each returns structured JSON with findings, evidence, verification still remaining, and an optional blocker. A TypeScript reducer marks the goal complete only when reviewer quorum approves, marks blocked only when the same dependency/tool blocker repeats for the blocker threshold, continues when evidence is missing, and returns `needs_human` when `max_turns` is exhausted or worker execution fails.
 Result fields:
@@ -248,8 +248,8 @@ Inputs:
 | Input | Type | Required | Default | Description |
 |---|---|---|---|---|
-| `prompt` | text | yes | — | Task, feature request, issue summary, or spec path to plan, execute, refine, and review. |
-| `max_loops` | number | no | `10` | Maximum plan/orchestrate/review iterations before the workflow completes or, when enabled, proceeds to final handoff without reviewer approval. |
+| `prompt` | text | yes | — | Task, feature request, issue summary, or spec path to research, execute, refine, and review. |
+| `max_loops` | number | no | `10` | Maximum research/orchestrate/review iterations before the workflow completes or, when enabled, proceeds to final handoff without reviewer approval. |
 | `base_branch` | string | no | `origin/main` | Branch reviewers and the optional final stage compare the current code delta against; also used to create a missing worktree. |
 | `git_worktree_dir` | string | no | `""` | Optional reusable Git worktree root. Empty runs in the invoking checkout; non-empty values run Ralph stages in the created/reused worktree. |
 | `create_pr` | boolean | no | `false` | Safe-by-default PR creation flag. Omitted or `false` skips the final `pull-request` stage and omits `pr_report`; prompt text alone does not opt in, and only strict `true` authorizes the final `pull-request` stage to attempt provider-appropriate PR/MR/review creation. |
@@ -257,12 +257,12 @@ Inputs:
 Run examples:
 ```text
-/workflow ralph prompt="Plan and migrate the database layer to Drizzle" max_loops=3 base_branch=develop
+/workflow ralph prompt="Migrate the database layer to Drizzle" max_loops=3 base_branch=develop
 /workflow ralph prompt="Refactor authentication across the API, CLI, and web UI" create_pr=true
 /workflow ralph prompt="Safely implement the API refactor" git_worktree_dir=../atomic-ralph-api-wt base_branch=main
 ```
-Each `ralph` iteration writes an RFC-style technical design document under `specs/`, initializes an OS-temp implementation notes file, delegates implementation through sub-agents, runs a behavior-preserving code simplifier, and asks two reviewers to inspect the patch directly against `base_branch`. Reviewers discover any needed repository infrastructure themselves while inspecting the actual diff; Ralph no longer runs separate `infra-*` discovery stages. The loop stops when every reviewer approves or `max_loops` is reached. By default Ralph does not start the final `pull-request` stage, and `pr_report` is omitted. Prompt text alone does not opt in. Pass `create_pr=true` only when you explicitly want the final `pull-request` stage to inspect provider credentials and attempt provider-appropriate PR/MR/review creation, such as GitHub `gh`, Azure Repos `az repos pr create`, or Sapling/Phabricator tooling; Ralph's own PR-creation instructions live in that final stage.
+Each `ralph` iteration starts by prompt-engineering the user prompt with `/skill:prompt-engineer Transform the following user prompt to a codebase and online research question which can be thoroughly explored: ...`, then researches that transformed question with `/skill:research-codebase ...` and writes the findings under `research/`. The orchestrator treats that research artifact as its primary implementation context, initializes/updates an OS-temp implementation notes file, delegates implementation through sub-agents, and asks two reviewers to inspect the patch directly against `base_branch`. Ralph's orchestrator and reviewers are prompted to verify user-visible behavior end-to-end when practical, using browser-skilled subagents for web/frontend flows that may depend on backend/API behavior and tmux-skilled subagents for TUI or terminal-app scenarios. If reviewers find issues, the next prompt-engineering and research stages receive the review artifact path so follow-up research can address unresolved findings, and research stages fork from prior research session data when available. The loop stops when every reviewer approves or `max_loops` is reached. By default Ralph does not start the final `pull-request` stage, and `pr_report` is omitted. Prompt text alone does not opt in. Pass `create_pr=true` only when you explicitly want the final `pull-request` stage to inspect provider credentials and attempt provider-appropriate PR/MR/review creation, such as GitHub `gh`, Azure Repos `az repos pr create`, or Sapling/Phabricator tooling; Ralph's own PR-creation instructions live in that final stage.
 Set `git_worktree_dir` when you want Ralph's worker stages isolated in a reusable Git worktree. Relative paths resolve from the invoking repository root, existing same-repository worktree roots are reused, and missing paths are created from `base_branch`. Ralph preserves the invoking repo-relative cwd inside the worktree, so launching from `repo/packages/api` with `git_worktree_dir=../repo-wt` runs stages from `../repo-wt/packages/api`.
@@ -271,16 +271,18 @@ Result fields:
 | Field | Meaning |
 |---|---|
 | `result` | Final implementation report from the orchestrator stage. |
-| `plan` | Latest RFC-style plan text. |
-| `plan_path` | Path to the latest generated spec under `specs/`. |
+| `plan` | Latest transformed research question, retained for compatibility. |
+| `plan_path` | Backward-compatible alias for `research_path`. |
+| `research` | Latest research report text or artifact reference. |
+| `research_path` | Path to the latest generated research artifact under `research/`. |
 | `implementation_notes_path` | OS-temp notes file containing decisions, deviations, blockers, and validation notes. |
 | `pr_report` | Pull-request report emitted only when `create_pr=true` and the final `pull-request` stage runs. |
 | `approved` | Whether the reviewer loop approved before completion or optional final handoff. |
-| `iterations_completed` | Number of plan/orchestrate/review loops completed. |
+| `iterations_completed` | Number of research/orchestrate/review loops completed. |
 | `review_report` | Compact reference to the latest reviewer payload artifact. |
 | `review_report_path` | JSON artifact path for the latest Ralph review round. |
-A typical end-to-end flow is `/skill:research-codebase` → `/skill:create-spec` → `/workflow goal objective="Implement the researched rate-limit behavior, run the focused tests, and finish when the documented burst behavior is validated"` when you can identify the work surface, state the exact outcome, and name the validation that proves it is done. Keep using `/workflow ralph` for larger migrations, broad refactors, multi-package changes, and spec-to-reviewed-change work where you want Atomic to plan, delegate through sub-agents, simplify, review, iterate, and optionally allow only the final `pull-request` stage to attempt PR creation with `create_pr=true`.
+A typical end-to-end flow is `/skill:research-codebase` → `/skill:create-spec` → `/workflow goal objective="Implement the researched rate-limit behavior, run the focused tests, and finish when the documented burst behavior is validated"` when you can identify the work surface, state the exact outcome, and name the validation that proves it is done. Keep using `/workflow ralph` for larger migrations, broad refactors, and multi-package changes where you want Atomic to research first, delegate through sub-agents, review, iterate, and optionally allow only the final `pull-request` stage to attempt PR creation with `create_pr=true`.
 ### `open-claude-design`
@@ -335,7 +337,7 @@ Use the goal workflow to implement specs/2026-03-rate-limit.md, run the focused
 ```
 ```text
-Use the ralph workflow to plan a database-layer migration, implement it, review it, and set `create_pr=true` for final-stage PR handoff.
+Use the ralph workflow to research a database-layer migration, implement it, review it, and set `create_pr=true` for final-stage PR handoff.
 ```
 ```text
@@ -381,7 +383,7 @@ If the task is only deterministic TypeScript with no LLM/session stage, use a sc
 |-----------|-----|
 | Run, inspect, attach to, pause, interrupt, resume, or check status for an existing workflow | `/workflow ...` or `workflow({ action: ... })` |
 | Implement a small-to-medium scope change with an identifiable work surface, exact outcome, and named validation | `/workflow goal objective="..."` so Atomic keeps the run bounded, captures receipts in a goal ledger, gates completion through reviewers, and stops as `complete`, `blocked`, or `needs_human` |
-| Plan and execute a larger migration, broad refactor, multi-package change, or spec-to-reviewed-change effort | `/workflow ralph prompt="..."` so Atomic can plan the approach, delegate implementation through sub-agents, simplify, review, and iterate; prompt text alone does not opt in to PR creation, so add `create_pr=true` only when you want the final `pull-request` stage and `pr_report` |
+| Research and execute a larger migration, broad refactor, or multi-package change | `/workflow ralph prompt="..."` so Atomic can transform the prompt into a research question, research the codebase first, delegate implementation through sub-agents, review, and iterate; prompt text alone does not opt in to PR creation, so add `create_pr=true` only when you want the final `pull-request` stage and `pr_report` |
 | Create or edit reusable automation | a TypeScript workflow definition exported from `defineWorkflow(...).compile()` |
 | Track one-off work without saving a workflow file | direct `workflow({ task })`, `workflow({ tasks })`, or `workflow({ chain })` calls |
 | Make a workflow robust | design the stage graph, context handoffs, artifacts, validation gates, model fallbacks, and human approval points before coding |
@@ -1100,7 +1102,7 @@ Control-signal probing is fail-closed. When the executor inspects an arbitrary t
 - Avoid workflow-specific or stage-specific vocabulary that is not explained inside the current prompt.
 - Use clear software engineering terminology in self-described prompts.
 - Avoid hard-coded regular expressions for condition matching when gating reviews or model outputs.
-- Prefer structured output schemas for review/gate decisions whenever model output needs to be evaluated.
+- Prefer schema-backed workflow items (`ctx.stage(..., { schema })`, `ctx.task` calls, `ctx.chain` items, or `ctx.parallel` items) for review/gate decisions whenever model output needs to be evaluated; Atomic injects the canonical `structured_output` tool only for those schema-enabled items.
 - Treat atomic workflow units as language model stages, not deterministic tools.
 - When deterministic gates are needed, create small dedicated stages that instruct a model to run a specific tool or perform a specific check. This keeps gates adaptive to the current codebase while preserving explicit workflow structure.
@@ -1315,7 +1317,7 @@ Common builtin import targets:
 |---|---|---|---|
 | `deep-research-codebase` | `deepResearchCodebase` | `@bastani/workflows/builtin/deep-research-codebase` | Gather broad repo research before planning, synthesis, or implementation. |
 | `goal` | `goal` | `@bastani/workflows/builtin/goal` | Run a bounded implementation/check loop with receipts and reviewer-gated completion. |
-| `ralph` | `ralph` | `@bastani/workflows/builtin/ralph` | Delegate a larger migration/refactor/spec-to-reviewed-change effort to Ralph's plan/orchestrate/review loop; pass `create_pr=true` to authorize only the final PR-creation stage. |
+| `ralph` | `ralph` | `@bastani/workflows/builtin/ralph` | Delegate a larger migration/refactor effort to Ralph's research/orchestrate/review loop; pass `create_pr=true` to authorize only the final PR-creation stage. |
 | `open-claude-design` | `openClaudeDesign` | `@bastani/workflows/builtin/open-claude-design` | Generate and refine a UI/design artifact and handoff spec. |
 Example parent workflow that runs builtin deep research, then chooses either `goal` or `ralph` as the nested implementation runner:
@@ -1330,7 +1332,7 @@ export default defineWorkflow("research-then-implement")
     "runner",
     Type.Union([Type.Literal("goal"), Type.Literal("ralph")], {
       default: "goal",
-      description: "Use goal for bounded changes or Ralph for broad spec-to-reviewed-change work.",
+      description: "Use goal for bounded changes or Ralph for broad research-first implementation work.",
     }),
   )
   .output("research_doc_path", Type.Optional(Type.String({ description: "Path to the deep-research document used for implementation." })))
@@ -1473,9 +1475,14 @@ Common task/stage options include:
 - `context: "fresh" | "fork"`, `forkFromSessionFile`
 - `model`, `fallbackModels`, `thinkingLevel`, `scopedModels`, `modelRegistry` — `model` and each `fallbackModels` entry accept a `model_name:thinking_effort` reasoning suffix; the standalone `thinkingLevel` is deprecated (see [Reasoning levels](#reasoning-levels))
 - `tools`, `noTools`, `customTools`, `mcp: { allow?: string[], deny?: string[] }`, `bashPolicy`
+- `schema` for a structured final answer from this workflow item
 - `output`, `outputMode`, `reads`, `worktree`, `gitWorktreeDir`, `baseBranch`, `maxOutput`, `artifacts`, `sessionDir`, `cwd`, `agentDir`
 - advanced host-supplied SDK seams: `authStorage`, `resourceLoader`, `sessionManager`, `settingsManager`, `sessionStartEvent`
+`schema` is opt-in. When a `ctx.stage` call, `ctx.task` call, `ctx.chain` item, or `ctx.parallel` item includes a top-level object TypeBox/JSON Schema, Atomic registers a schema-specific `structured_output` tool for that item only, appends final-answer instructions, and requires the stage to finish by calling the tool exactly once. The prompt result is the parsed structured value for `ctx.stage(..., { schema }).prompt(...)`; task/chain/parallel results also include `result.structured` and keep `result.text` as formatted JSON for handoffs. Because the result contract is single-use, a schema-backed `StageContext` supports one `prompt()` call; create a new `ctx.stage(..., { schema })` for each additional structured prompt. If the item also uses an explicit `tools` allowlist, Atomic automatically adds `structured_output` to that allowlist. Items without `schema` do not receive `structured_output` from the normal tool registry.
+`subagent` is available as a default workflow-stage tool, with the same default two-hop nesting budget as main chat: a workflow stage can launch a subagent, and that subagent can launch one nested subagent before the guard blocks further delegation. `tools` remains an allowlist across built-in tools and bundled extension tools; if you set `tools`, list every tool the stage should see. Explicitly listing tools such as `subagent`, `web_search`, `fetch_content`, or `intercom` exposes those tools to the stage, while `excludedTools` and `noTools: "all"` still win. The bundled subagent definitions from `@bastani/subagents` are available to the `subagent` tool in workflow stages; when a workflow is itself running inside a subagent child process, Atomic isolates stage resource discovery from the parent child-process flags so `subagent` remains available while workflow-stage nested-depth guards remain in force.
 `bashPolicy` scopes the built-in `bash` tool for one stage or task. `tools` must still include `"bash"` (or leave it available by default); the policy only narrows command text after the shell tool is exposed. It supports exact strings, `{ prefix }`, command-string `{ glob }`, and `{ regex, flags? }` rules, `default: "allow" | "deny"` (default `"allow"`), `deny` precedence, and `match: "segments" | "whole"` (default `"segments"`). Omitting `bashPolicy`, passing `{}`, or passing a default-allow policy with no `allow`/`deny` rules (including empty arrays or match-only default-allow policies) preserves legacy behavior and does not parse commands; malformed policy shapes such as unknown top-level keys (`denny`, `extra`), non-array `allow`/`deny`, invalid rule objects, invalid regexes, invalid glob bracket ranges, or stateful `g`/`y` regex flags fail closed as `invalid-policy`. Segment mode checks each command in pipelines/chains/substitutions before execution, treats unquoted LF, CRLF, and bare CR as command separators, keeps non-leading Bash `>|` noclobber redirections inside the current command segment, and rejects reserved/compound shell heads, leading redirections, attached command-head redirections, and command heads that are not literal words.
 ```ts
@@ -1619,7 +1626,7 @@ Stage prompts should be local contracts, not miniature descriptions of the entir
 - the stage's current objective and what is out of scope for this stage
 - the exact files, artifacts, child outputs, or user inputs it may use
-- the expected output format or structured-output tool/schema it must return
+- the expected output format, or the schema it must return when the workflow item is schema-enabled
 - the checks, tools, or deterministic commands it should run when relevant
 - the success criteria that let this stage stop
@@ -1735,9 +1742,9 @@ Build validation into the workflow instead of waiting for a final manual check.
 - reviewer stages: fresh-context reviewers that inspect artifacts and current files
 - LLM-as-judge stages: direct scoring, pairwise comparison, or rubric-based grading for subjective outputs
-Prefer structured output schemas or structured-output tools for model review and gate decisions. Do not make correctness depend on brittle regular-expression matching against free-form prose such as “looks good”, “approved”, or “PASS”. A schema with explicit booleans/enums, findings arrays, confidence, evidence fields, and error reporting is easier to validate, replay, and safely default to “not approved” when malformed.
+Prefer schema-enabled workflow items for model review and gate decisions. `structured_output` is not available to workflow stages through the normal Atomic tool registry; it is injected only when a `ctx.stage`, `ctx.task`, `ctx.chain` item, or `ctx.parallel` item includes `schema`. Structured-output schemas must be top-level object tool-argument schemas, so wrap array or primitive decisions in object fields such as `{ items: [...] }` or `{ value: ... }`; direct JSON invocations of the `workflow` tool must use a schema with `type: "object"` so invalid array/primitive contracts fail at argument validation instead of later in the stage. Terminating `structured_output` JSON is preserved inline even when it exceeds the normal oversized-tool-result threshold, so workflow code can consume the parsed value instead of a `<persisted-output>` pointer. Do not add the old synthetic `{ value: ... }` wrapper around an object payload unless your schema defines that field, and do not make correctness depend on brittle regular-expression matching against free-form prose such as “looks good”, “approved”, or “PASS”. A schema with explicit booleans/enums, findings arrays, confidence, evidence fields, and error reporting is easier to validate, replay, and safely default to “not approved” when malformed.
-Use small dedicated model stages for adaptive gates when deterministic code alone cannot decide what to check. For example, a stage can read an artifact, inspect the repo, run a named tool or command, and then emit a structured decision. Keep that stage's prompt narrow: tell it the specific check to perform, the files/tools it may use, and the structured decision it must return.
+Use small dedicated model stages for adaptive gates when deterministic code alone cannot decide what to check. For example, a stage can read an artifact, inspect the repo, run a named tool or command, and then emit a structured decision by configuring `schema` on that workflow item. Keep that stage's prompt narrow: tell it the specific check to perform, the files/tools it may use, and the structured decision it must return.
 When using LLM judges, mitigate bias by defining score anchors, asking for evidence, calibrating against examples, and keeping length/order effects in mind. Track pass rates and failures over time for reusable workflows.
@@ -1794,5 +1801,5 @@ Good workflows are information-flow systems, not just prompt sequences. Keep sta
 - Do not call `kill` when the user asks to interrupt or pause resumably.
 - Keep stage names readable because they appear in workflow status and UI.
 - Do not write stage prompts that depend on hidden workflow-wide awareness; make each model stage locally scoped and self-described.
-- Do not parse model gate decisions from ad-hoc prose with regular expressions; use structured output schemas/tools or a focused checking stage that returns a structured decision.
-- Return compact structured output and save large artifacts to files.
+- Do not parse model gate decisions from ad-hoc prose with regular expressions; configure `schema` on a focused workflow item so Atomic injects the canonical `structured_output` tool for that item.
+- Return compact structured output for decisions and save large artifacts to files; schema-enabled workflow items preserve final JSON inline, but artifact handoffs should still use files when the next stage does not need the whole payload in context.

package/examples/extensions/README.md CHANGED Viewed

@@ -36,7 +36,7 @@ cp permission-gate.ts ~/.atomic/agent/extensions/
 | `questionnaire.ts` | Multi-question input with tab bar navigation between questions |
 | `tool-override.ts` | Override built-in tools (e.g., add logging/access control to `read`) |
 | `dynamic-tools.ts` | Register tools after startup (`session_start`) and at runtime via command, with prompt snippets and tool-specific prompt guidelines |
-| `structured-output.ts` | Final structured-output tool that returns `terminate: true` so the agent can end on the tool call |
+| `structured-output.ts` | Opt-in schema-specific `structured_output` tool using Atomic's canonical terminating output factory |
 | `built-in-tool-renderer.ts` | Custom compact rendering for built-in tools (read, bash, edit, write) while keeping original behavior |
 | `minimal-mode.ts` | Override built-in tool rendering for minimal display (only tool calls, no output in collapsed mode) |
 | `truncated-tool.ts` | Wraps ripgrep with proper output truncation (50KB/2000 lines) |

package/examples/extensions/custom-provider-anthropic/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "atomic-extension-custom-provider-anthropic",
-  "version": "0.79.1",
+  "version": "0.79.3",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "atomic-extension-custom-provider-anthropic",
-      "version": "0.79.1",
+      "version": "0.79.3",
       "dependencies": {
         "@anthropic-ai/sdk": "^0.52.0"
       }

package/examples/extensions/custom-provider-anthropic/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "atomic-extension-custom-provider-anthropic",
   "private": true,
-  "version": "0.79.1",
+  "version": "0.79.3",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/examples/extensions/custom-provider-gitlab-duo/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "atomic-extension-custom-provider-gitlab-duo",
   "private": true,
-  "version": "0.79.1",
+  "version": "0.79.3",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/examples/extensions/gondolin/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "atomic-extension-gondolin",
-  "version": "0.79.1",
+  "version": "0.79.3",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "atomic-extension-gondolin",
-      "version": "0.79.1",
+      "version": "0.79.3",
       "dependencies": {
         "@earendil-works/gondolin": "0.12.0"
       }

package/examples/extensions/gondolin/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
 	"name": "atomic-extension-gondolin",
 	"private": true,
-	"version": "0.79.1",
+	"version": "0.79.3",
 	"type": "module",
 	"scripts": {
 		"clean": "echo 'nothing to clean'",

package/examples/extensions/sandbox/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "atomic-extension-sandbox",
-  "version": "1.9.1",
+  "version": "1.9.3",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "atomic-extension-sandbox",
-      "version": "1.9.1",
+      "version": "1.9.3",
       "dependencies": {
         "@anthropic-ai/sandbox-runtime": "^0.0.26"
       }

package/examples/extensions/sandbox/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "atomic-extension-sandbox",
   "private": true,
-  "version": "1.9.1",
+  "version": "1.9.3",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/examples/extensions/structured-output.ts CHANGED Viewed

@@ -1,65 +1,34 @@
 /**
- * Structured Output Tool
+ * Schema-specific structured_output tool
  *
- * Demonstrates `terminate: true` so the agent can end on a tool call
- * without paying for an extra follow-up LLM turn.
+ * Atomic does not register `structured_output` in normal agent sessions by
+ * default. This extension demonstrates the canonical factory for adding a
+ * schema-backed terminating final-answer tool only when this extension is
+ * enabled.
+ *
+ * Custom factory names are opt-in tools too: `createStructuredOutputTool({ name:
+ * "final_decision", ... })` registers `final_decision`; include that name in any
+ * explicit `tools` allowlist. The default factory name registers
+ * `structured_output` for this extension/runtime only.
  */
-import { defineTool, type ExtensionAPI } from "@bastani/atomic";
-import { Text } from "@earendil-works/pi-tui";
+import {
+	createStructuredOutputTool,
+	type ExtensionAPI,
+} from "@bastani/atomic";
 import { Type } from "typebox";
-interface StructuredOutputDetails {
-	headline: string;
-	summary: string;
-	actionItems: string[];
-}
-const structuredOutputTool = defineTool({
-	name: "structured_output",
-	label: "Structured Output",
-	description:
-		"Return a final structured answer. Use this as your last action when the user asks for structured output or a machine-readable summary.",
-	promptSnippet: "Emit a final structured answer as a terminating tool result",
-	promptGuidelines: [
-		"Use structured_output as your final action when the user asks for structured output, JSON-like output, or a machine-readable summary.",
-		"After calling structured_output, do not emit another assistant response in the same turn.",
-	],
-	parameters: Type.Object({
-		headline: Type.String({ description: "Short title for the result" }),
-		summary: Type.String({ description: "One-paragraph summary" }),
-		actionItems: Type.Array(Type.String(), { description: "Concrete next steps or key bullets" }),
-	}),
-	async execute(_toolCallId, params) {
-		return {
-			content: [{ type: "text", text: `Saved structured output: ${params.headline}` }],
-			details: {
-				headline: params.headline,
-				summary: params.summary,
-				actionItems: params.actionItems,
-			} satisfies StructuredOutputDetails,
-			terminate: true,
-		};
-	},
-	renderResult(result, _options, theme) {
-		const details = result.details as StructuredOutputDetails | undefined;
-		if (!details) {
-			const text = result.content[0];
-			return new Text(text?.type === "text" ? text.text : "", 0, 0);
-		}
+const SummarySchema = Type.Object({
+	headline: Type.String({ description: "Short title for the result" }),
+	summary: Type.String({ description: "One-paragraph summary" }),
+	actionItems: Type.Array(Type.String(), { description: "Concrete next steps or key bullets" }),
+}, { additionalProperties: false });
-		const lines = [
-			theme.fg("toolTitle", theme.bold(details.headline)),
-			theme.fg("text", details.summary),
-			"",
-			...details.actionItems.map((item, index) => theme.fg("muted", `${index + 1}. ${item}`)),
-		];
-		return new Text(lines.join("\n"), 0, 0);
-	},
+const structuredOutputTool = createStructuredOutputTool({
+	schema: SummarySchema,
 });
 export default function (pi: ExtensionAPI) {
+	// Register structured_output for sessions that load this extension.
 	pi.registerTool(structuredOutputTool);
 }

package/examples/extensions/with-deps/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "atomic-extension-with-deps",
-  "version": "0.79.1",
+  "version": "0.79.3",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "atomic-extension-with-deps",
-      "version": "0.79.1",
+      "version": "0.79.3",
       "dependencies": {
         "ms": "^2.1.3"
       },

package/examples/extensions/with-deps/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "atomic-extension-with-deps",
   "private": true,
-  "version": "0.79.1",
+  "version": "0.79.3",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@bastani/atomic",
-  "version": "0.8.28",
+  "version": "0.8.29-alpha.3",
   "description": "Atomic coding agent CLI with read, bash, edit, write tools and session management",
   "type": "module",
   "atomicConfig": {
@@ -21,7 +21,8 @@
   "exports": {
     ".": {
       "types": "./dist/index.d.ts",
-      "import": "./dist/index.js"
+      "import": "./dist/index.js",
+      "default": "./dist/index.js"
     },
     "./hooks": {
       "types": "./dist/core/hooks/index.d.ts",
@@ -67,9 +68,11 @@
     "prepublishOnly": "bun run clean && bun run build"
   },
   "dependencies": {
-    "@earendil-works/pi-agent-core": "^0.79.1",
-    "@earendil-works/pi-ai": "^0.79.1",
-    "@earendil-works/pi-tui": "^0.79.1",
+    "@bastani/atomic-natives": "0.8.29-alpha.3",
+    "@bufbuild/protobuf": "^2.0.0",
+    "@earendil-works/pi-agent-core": "^0.79.3",
+    "@earendil-works/pi-ai": "^0.79.3",
+    "@earendil-works/pi-tui": "^0.79.3",
     "@modelcontextprotocol/ext-apps": "^1.7.2",
     "@modelcontextprotocol/sdk": "^1.25.1",
     "@mozilla/readability": "^0.6.0",
@@ -85,7 +88,7 @@
     "linkedom": "^0.18.12",
     "minimatch": "^10.2.3",
     "open": "^11.0.0",
-    "p-limit": "^6.1.0",
+    "p-limit": "^7.3.0",
     "proper-lockfile": "^4.1.2",
     "turndown": "^7.2.0",
     "typebox": "^1.1.24",
@@ -101,14 +104,14 @@
     }
   },
   "optionalDependencies": {
-    "@mariozechner/clipboard": "^0.3.6"
+    "@mariozechner/clipboard": "^0.3.9"
   },
   "devDependencies": {
     "@types/cross-spawn": "6.0.6",
-    "@types/diff": "^7.0.2",
+    "@types/diff": "^8.0.0",
     "@types/hosted-git-info": "^3.0.5",
     "@types/ms": "^2.1.0",
-    "@types/node": "^25.9.1",
+    "@types/node": "^25.9.3",
     "@types/proper-lockfile": "^4.1.4",
     "@typescript/native-preview": "7.0.0-dev.20260511.1",
     "shx": "^0.4.0",