npm - @bastani/atomic - Versions diffs - 0.8.30-alpha.3 → 0.8.31-alpha.1 - Mend

@bastani/atomic 0.8.30-alpha.3 → 0.8.31-alpha.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (123)

package/CHANGELOG.md +20 -0
package/dist/builtin/cursor/CHANGELOG.md +7 -1
package/dist/builtin/cursor/package.json +2 -2
package/dist/builtin/intercom/CHANGELOG.md +6 -0
package/dist/builtin/intercom/package.json +2 -2
package/dist/builtin/mcp/CHANGELOG.md +6 -0
package/dist/builtin/mcp/package.json +3 -3
package/dist/builtin/subagents/CHANGELOG.md +6 -0
package/dist/builtin/subagents/package.json +4 -4
package/dist/builtin/web-access/CHANGELOG.md +6 -0
package/dist/builtin/web-access/package.json +2 -2
package/dist/builtin/workflows/CHANGELOG.md +12 -0
package/dist/builtin/workflows/builtin/deep-research-codebase.ts +1 -1
package/dist/builtin/workflows/builtin/goal.ts +2 -2
package/dist/builtin/workflows/builtin/open-claude-design.ts +1 -1
package/dist/builtin/workflows/builtin/ralph.ts +61 -11
package/dist/builtin/workflows/package.json +2 -2
package/dist/builtin/workflows/src/extension/workflow-schema.ts +3 -1
package/dist/builtin/workflows/src/runs/foreground/stage-runner.ts +5 -0
package/dist/builtin/workflows/src/runs/shared/model-fallback.ts +95 -8
package/dist/builtin/workflows/src/shared/authoring-contract.d.ts +11 -0
package/dist/cli/args.d.ts +1 -0
package/dist/cli/args.d.ts.map +1 -1
package/dist/cli/args.js +20 -0
package/dist/cli/args.js.map +1 -1
package/dist/cli/list-models.d.ts.map +1 -1
package/dist/cli/list-models.js +2 -1
package/dist/cli/list-models.js.map +1 -1
package/dist/core/agent-session-services.d.ts +2 -0
package/dist/core/agent-session-services.d.ts.map +1 -1
package/dist/core/agent-session-services.js +2 -0
package/dist/core/agent-session-services.js.map +1 -1
package/dist/core/agent-session.d.ts +17 -0
package/dist/core/agent-session.d.ts.map +1 -1
package/dist/core/agent-session.js +161 -18
package/dist/core/agent-session.js.map +1 -1
package/dist/core/compaction/branch-summarization.d.ts.map +1 -1
package/dist/core/compaction/branch-summarization.js +20 -5
package/dist/core/compaction/branch-summarization.js.map +1 -1
package/dist/core/compaction/context-compaction.d.ts.map +1 -1
package/dist/core/compaction/context-compaction.js +14 -3
package/dist/core/compaction/context-compaction.js.map +1 -1
package/dist/core/context-window.d.ts +29 -0
package/dist/core/context-window.d.ts.map +1 -0
package/dist/core/context-window.js +86 -0
package/dist/core/context-window.js.map +1 -0
package/dist/core/copilot-errors.d.ts +9 -0
package/dist/core/copilot-errors.d.ts.map +1 -0
package/dist/core/copilot-errors.js +32 -0
package/dist/core/copilot-errors.js.map +1 -0
package/dist/core/copilot-model-catalog.d.ts +132 -0
package/dist/core/copilot-model-catalog.d.ts.map +1 -0
package/dist/core/copilot-model-catalog.js +254 -0
package/dist/core/copilot-model-catalog.js.map +1 -0
package/dist/core/export-html/template.js +10 -1
package/dist/core/extensions/types.d.ts +3 -1
package/dist/core/extensions/types.d.ts.map +1 -1
package/dist/core/extensions/types.js.map +1 -1
package/dist/core/model-registry.d.ts +10 -0
package/dist/core/model-registry.d.ts.map +1 -1
package/dist/core/model-registry.js +107 -4
package/dist/core/model-registry.js.map +1 -1
package/dist/core/model-resolver.d.ts.map +1 -1
package/dist/core/model-resolver.js +4 -0
package/dist/core/model-resolver.js.map +1 -1
package/dist/core/provider-attribution.d.ts.map +1 -1
package/dist/core/provider-attribution.js +17 -7
package/dist/core/provider-attribution.js.map +1 -1
package/dist/core/sdk.d.ts +8 -0
package/dist/core/sdk.d.ts.map +1 -1
package/dist/core/sdk.js +47 -0
package/dist/core/sdk.js.map +1 -1
package/dist/core/session-manager.d.ts +8 -1
package/dist/core/session-manager.d.ts.map +1 -1
package/dist/core/session-manager.js +19 -3
package/dist/core/session-manager.js.map +1 -1
package/dist/core/settings-manager.d.ts +6 -0
package/dist/core/settings-manager.d.ts.map +1 -1
package/dist/core/settings-manager.js +69 -0
package/dist/core/settings-manager.js.map +1 -1
package/dist/index.d.ts +2 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +1 -0
package/dist/index.js.map +1 -1
package/dist/main.d.ts.map +1 -1
package/dist/main.js +24 -1
package/dist/main.js.map +1 -1
package/dist/modes/index.d.ts +1 -1
package/dist/modes/index.d.ts.map +1 -1
package/dist/modes/index.js.map +1 -1
package/dist/modes/interactive/components/context-window-selector.d.ts +53 -0
package/dist/modes/interactive/components/context-window-selector.d.ts.map +1 -0
package/dist/modes/interactive/components/context-window-selector.js +136 -0
package/dist/modes/interactive/components/context-window-selector.js.map +1 -0
package/dist/modes/interactive/components/tree-selector.d.ts.map +1 -1
package/dist/modes/interactive/components/tree-selector.js +7 -0
package/dist/modes/interactive/components/tree-selector.js.map +1 -1
package/dist/modes/interactive/interactive-mode.d.ts +5 -0
package/dist/modes/interactive/interactive-mode.d.ts.map +1 -1
package/dist/modes/interactive/interactive-mode.js +91 -1
package/dist/modes/interactive/interactive-mode.js.map +1 -1
package/dist/modes/rpc/rpc-client.d.ts +14 -2
package/dist/modes/rpc/rpc-client.d.ts.map +1 -1
package/dist/modes/rpc/rpc-client.js +23 -3
package/dist/modes/rpc/rpc-client.js.map +1 -1
package/dist/modes/rpc/rpc-mode.d.ts +1 -1
package/dist/modes/rpc/rpc-mode.d.ts.map +1 -1
package/dist/modes/rpc/rpc-mode.js +30 -1
package/dist/modes/rpc/rpc-mode.js.map +1 -1
package/dist/modes/rpc/rpc-types.d.ts +23 -0
package/dist/modes/rpc/rpc-types.d.ts.map +1 -1
package/dist/modes/rpc/rpc-types.js.map +1 -1
package/docs/custom-provider.md +4 -1
package/docs/json.md +3 -1
package/docs/models.md +78 -2
package/docs/providers.md +3 -0
package/docs/rpc.md +80 -1
package/docs/sdk.md +23 -3
package/docs/session-format.md +15 -1
package/docs/sessions.md +1 -1
package/docs/settings.md +7 -2
package/docs/workflows.md +26 -4
package/package.json +5 -5

package/CHANGELOG.md CHANGED Viewed

@@ -2,6 +2,26 @@
 ## [Unreleased]
+### Added
+- Added configurable context-window support for models that declare `contextWindowOptions`, including explicit `--context-window` CLI/settings control, a GitHub Copilot CLI-style `/model`-flow picker (numbered `Default`/`Long context` tiers with token counts), session replay, SDK/runtime/RPC APIs, and docs while preserving each model's scalar default context window. For GitHub Copilot, context windows are measured in **input (prompt) tokens** (consistent with every other provider) and derived **dynamically from GitHub's live CAPI model catalog** (`GET /models`) instead of a hardcoded model list: Atomic resolves each model's input budget as `max_prompt_tokens || max_context_window_tokens || 128_000` and, for tiered models, exposes the per-tier input budgets (`token_prices.<tier>.context_max`) as a selectable default/long window — gated on the user actually having the GitHub Copilot provider and cached on disk for 30 minutes (for example `github-copilot/gpt-5.5` resolves to `272k` default / `922k` long, and the Claude/Gemini long-context models to `200k` default / `936k` long). Atomic raises the local budget and sends `X-GitHub-Api-Version: 2026-06-01`, while GitHub applies the long-context billing tier server-side by prompt token count. Long-context Copilot requests consume more AI credits and require Copilot long-context/usage-based billing entitlement; offline, unauthenticated, or non-Copilot sessions leave the built-in window untouched and show no picker; custom providers and explicit model overrides can still expose their own selectable windows ([#1409](https://github.com/bastani-inc/atomic/issues/1409)).
+- Exported context-window helper functions and types from the package root, including parser/formatter/normalizer/selection utilities and the `Model<Api>` augmentation for `contextWindowOptions`/`defaultContextWindow`, so SDK consumers can use the public API without importing internal source paths ([#1409](https://github.com/bastani-inc/atomic/issues/1409)).
+- Added RPC mode runtime context-window commands so headless clients can read supported token budgets with `get_available_context_windows` and select the active runtime budget with `set_context_window` without persisting `defaultContextWindow` settings ([#1409](https://github.com/bastani-inc/atomic/issues/1409)).
+### Changed
+- Changed built-in GitHub Copilot context windows to be measured in **input (prompt) tokens** (matching every other provider) and derived from GitHub's live CAPI model catalog (`GET /models`, cached 30 minutes, gated on the Copilot provider) instead of a hardcoded long-context model list, so newly added/removed Copilot models and retiered windows are reflected automatically without shipping a stale snapshot. Each model's window now resolves to `max_prompt_tokens || max_context_window_tokens || 128_000`, and tiered models expose their per-tier input budgets (`token_prices.<tier>.context_max`) as the selectable default/long windows (e.g. `gpt-5.5` 272k/922k, Claude/Gemini 200k/936k) — replacing the previous input+output totals — while preserving custom provider entries and explicit `models.json` overrides and relying on GitHub's API-version header and server-side tier selection rather than payload fields or model-id variants ([#1409](https://github.com/bastani-inc/atomic/issues/1409)).
+- Bumped the bundled upstream pi runtime libraries `@earendil-works/pi-agent-core`, `@earendil-works/pi-ai`, and `@earendil-works/pi-tui` from `^0.79.4` to `^0.79.6` so Atomic's installed pi runtime packages pick up upstream v0.79.5/v0.79.6 provider, model, thinking-payload, and shared TUI compatibility fixes; no Atomic coding-agent source changes were made for upstream coding-agent-only marked export or fetch-override behavior in this dependency sync ([#1413](https://github.com/bastani-inc/atomic/issues/1413)).
+### Fixed
+- Fixed a GitHub Copilot context-window warning on restart: after selecting a long-context window (e.g. `claude-opus-4.8` → `936k`) and reopening Atomic, startup validated the persisted selection before the (async, auth-gated) Copilot catalog loaded, so the model still looked limited to its default window and Atomic warned “Context window 936k is not supported… Supported values: 200k” and reset the choice. The model registry now seeds the Copilot context-window catalog synchronously from its on-disk cache at construction (ignoring the refresh TTL, gated on a `github-copilot` credential), so a returning user's selection is recognized immediately while the live refresh still runs in the background ([#1409](https://github.com/bastani-inc/atomic/issues/1409)).
+- Fixed context-window startup, session-switch, settings, and RPC edge cases: unknown provider fallback models no longer inherit selectable context-window options from provider defaults, fatal startup diagnostics no longer persist `defaultContextWindow`, `AgentSession.setModel()` preserves an incoming target model's explicit selected context window, model-switch paths that change effective context windows now notify listeners via `context_window_changed`, the interactive context-window picker keys selection on raw token counts so colliding formatted labels never change which window is selected, RPC `set_model` returns the effective post-switch session model, and explicit startup `contextWindow` selections are journaled even when they equal the model scalar default ([#1409](https://github.com/bastani-inc/atomic/issues/1409)).
+- Fixed `AgentSession.setContextWindow()` so bare SDK/runtime calls update the active session, append `context_window_change`, and emit `context_window_changed` without persisting `defaultContextWindow`; callers must pass `{ persistDefault: true }` to update settings ([#1409](https://github.com/bastani-inc/atomic/issues/1409)).
+- Fixed `packages/coding-agent` source-CLI subprocess tests (`session-id-readonly`, `startup-session-name`, `stdout-cleanliness`) crashing with `ERR_MODULE_NOT_FOUND` (for example `src/core/tools/oversized-tool-result.js`) when the Vitest worker pool runs under Node. They now launch the TypeScript source CLI with Bun explicitly via a `bunExecutable()` helper (matching `context-window-cli`/`rpc-context-window`) instead of assuming `process.execPath` is Bun, so the package test suite is portable across environments. The repo-wide `.js`->`.ts` source-import convention and shipped `dist/` are unchanged ([#1419](https://github.com/bastani-inc/atomic/issues/1419)).
+## [0.8.30] - 2026-06-17
 ### Changed
 - Bumped the bundled upstream pi runtime libraries `@earendil-works/pi-agent-core`, `@earendil-works/pi-ai`, and `@earendil-works/pi-tui` from `^0.79.3` to `^0.79.4`, added `semver` as an explicit runtime dependency for package/version checks, and aligned companion extension peer ranges so Atomic inherits upstream provider/model metadata updates, agent-core fixes, the new terminal background-color query used by first-run theme detection, and shared TUI wrapping/keyboard compatibility fixes.

package/dist/builtin/cursor/CHANGELOG.md CHANGED Viewed

@@ -4,7 +4,13 @@
 ### Changed
-- Published a synchronized Atomic 0.8.30-alpha.1 prerelease; no functional Cursor provider changes were made after 0.8.29.
+- Published a synchronized Atomic 0.8.31-alpha.1 prerelease; no functional Cursor provider changes were made after 0.8.30.
+## [0.8.30] - 2026-06-17
+### Changed
+- Published a synchronized Atomic 0.8.30 stable release; no functional Cursor provider changes were made after 0.8.29.
 ## [0.8.29] - 2026-06-15

package/dist/builtin/cursor/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@bastani/cursor",
-  "version": "0.8.30-alpha.3",
+  "version": "0.8.31-alpha.1",
   "private": true,
   "description": "Experimental first-party Atomic extension for Cursor OAuth, model discovery, and streaming provider registration.",
   "contributors": [
@@ -40,7 +40,7 @@
     }
   },
   "dependencies": {
-    "@bastani/atomic-natives": "0.8.30-alpha.3",
+    "@bastani/atomic-natives": "0.8.31-alpha.1",
     "@bufbuild/protobuf": "^2.0.0"
   }
 }

package/dist/builtin/intercom/CHANGELOG.md CHANGED Viewed

@@ -6,6 +6,12 @@ All notable changes to the `pi-intercom` extension will be documented in this fi
 ### Changed
+- Aligned the intercom extension peer dependency with upstream pi TUI `^0.79.6` so coordination UI surfaces consume the latest shared TUI compatibility fixes; no intercom extension code changes were made for this metadata sync ([#1413](https://github.com/bastani-inc/atomic/issues/1413)).
+## [0.8.30] - 2026-06-17
+### Changed
 - Aligned the intercom extension peer dependency with upstream pi TUI `^0.79.4`; no intercom extension code changes were made.
 ## [0.8.29] - 2026-06-15

package/dist/builtin/intercom/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@bastani/intercom",
-  "version": "0.8.30-alpha.3",
+  "version": "0.8.31-alpha.1",
   "private": true,
   "description": "Atomic extension providing a private coordination channel between parent and child agent sessions. Fork of: https://github.com/nicobailon/pi-intercom",
   "contributors": [
@@ -39,7 +39,7 @@
   },
   "peerDependencies": {
     "@bastani/atomic": "*",
-    "@earendil-works/pi-tui": "^0.79.4"
+    "@earendil-works/pi-tui": "^0.79.6"
   },
   "peerDependenciesMeta": {
     "@bastani/atomic": {

package/dist/builtin/mcp/CHANGELOG.md CHANGED Viewed

@@ -9,6 +9,12 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ### Changed
+- Aligned the MCP extension peer dependencies with upstream pi AI/TUI `^0.79.6` so MCP-backed sessions can use the host's latest provider, model, thinking-payload, and shared TUI compatibility fixes; no MCP extension code changes were made for this metadata sync ([#1413](https://github.com/bastani-inc/atomic/issues/1413)).
+## [0.8.30] - 2026-06-17
+### Changed
 - Aligned the MCP extension peer dependencies with upstream pi AI/TUI `^0.79.4`; no MCP extension code changes were made.
 ## [0.8.29] - 2026-06-15

package/dist/builtin/mcp/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@bastani/mcp",
-  "version": "0.8.30-alpha.3",
+  "version": "0.8.31-alpha.1",
   "private": true,
   "description": "Atomic extension that adapts MCP (Model Context Protocol) servers into the coding agent. Fork of: https://github.com/nicobailon/pi-mcp-adapter",
   "contributors": [
@@ -32,8 +32,8 @@
   },
   "peerDependencies": {
     "@bastani/atomic": "*",
-    "@earendil-works/pi-ai": "^0.79.4",
-    "@earendil-works/pi-tui": "^0.79.4",
+    "@earendil-works/pi-ai": "^0.79.6",
+    "@earendil-works/pi-tui": "^0.79.6",
     "zod": "^3.25.0 || ^4.0.0"
   },
   "peerDependenciesMeta": {

package/dist/builtin/subagents/CHANGELOG.md CHANGED Viewed

@@ -4,6 +4,12 @@
 ### Changed
+- Aligned the subagents extension peer dependencies with upstream pi `^0.79.6` runtime packages (`@earendil-works/pi-agent-core`, `@earendil-works/pi-ai`, and `@earendil-works/pi-tui`) so child sessions can use the host's latest provider, model, thinking-payload, and shared TUI compatibility fixes; no subagents extension code changes were made for this metadata sync ([#1413](https://github.com/bastani-inc/atomic/issues/1413)).
+## [0.8.30] - 2026-06-17
+### Changed
 - Aligned the subagents extension peer dependencies with upstream pi `^0.79.4` runtime packages (`@earendil-works/pi-agent-core`, `@earendil-works/pi-ai`, and `@earendil-works/pi-tui`); no subagents extension code changes were made for this metadata sync.
 - Removed subagent acceptance gates, deterministic task-text acceptance inference, the remaining no-mutation completion guard, acceptance-report prompt injection/parsing, acceptance/completion-guard status metadata, and related tool/schema/config fields; completed child output is now preserved without acceptance or mutation-intent evaluation. Migration guidance now directs users to remove stale acceptance fields from subagent calls/chains/parallel items and move validation requirements into task text; JSON chain rewrites drop legacy acceptance entries ([#1398](https://github.com/bastani-inc/atomic/issues/1398)).

package/dist/builtin/subagents/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@bastani/subagents",
-  "version": "0.8.30-alpha.3",
+  "version": "0.8.31-alpha.1",
   "private": true,
   "description": "Atomic extension for delegating tasks to subagents with chains, parallel execution, and TUI clarification. Fork of: https://github.com/nicobailon/pi-subagents",
   "contributors": [
@@ -38,9 +38,9 @@
   },
   "peerDependencies": {
     "@bastani/atomic": "*",
-    "@earendil-works/pi-agent-core": "^0.79.4",
-    "@earendil-works/pi-ai": "^0.79.4",
-    "@earendil-works/pi-tui": "^0.79.4"
+    "@earendil-works/pi-agent-core": "^0.79.6",
+    "@earendil-works/pi-ai": "^0.79.6",
+    "@earendil-works/pi-tui": "^0.79.6"
   },
   "peerDependenciesMeta": {
     "@bastani/atomic": {

package/dist/builtin/web-access/CHANGELOG.md CHANGED Viewed

@@ -6,6 +6,12 @@ All notable changes to this project will be documented in this file.
 ### Changed
+- Aligned the web-access extension peer dependency with upstream pi TUI `^0.79.6` so web-access curator and summary UI surfaces consume the latest shared TUI compatibility fixes; no web-access extension code changes were made for this metadata sync ([#1413](https://github.com/bastani-inc/atomic/issues/1413)).
+## [0.8.30] - 2026-06-17
+### Changed
 - Aligned the web-access extension peer dependency with upstream pi TUI `^0.79.4`; no web-access extension code changes were made.
 ## [0.8.29] - 2026-06-15

package/dist/builtin/web-access/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@bastani/web-access",
-  "version": "0.8.30-alpha.3",
+  "version": "0.8.31-alpha.1",
   "private": true,
   "description": "Atomic extension for web search, URL fetching, GitHub repo cloning, PDF/video extraction. Fork of: https://github.com/nicobailon/pi-web-access",
   "contributors": [
@@ -30,7 +30,7 @@
   },
   "peerDependencies": {
     "@bastani/atomic": "*",
-    "@earendil-works/pi-tui": "^0.79.4"
+    "@earendil-works/pi-tui": "^0.79.6"
   },
   "peerDependenciesMeta": {
     "@bastani/atomic": {

package/dist/builtin/workflows/CHANGELOG.md CHANGED Viewed

@@ -6,6 +6,18 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 ## [Unreleased]
+### Added
+- Added a per-model context-window authoring token to workflow model strings: a parenthesized size token placed in the model-name portion, *before* the optional `:reasoning` suffix, e.g. `github-copilot/claude-opus-4.8 (1m):xhigh`. Adopting GitHub Copilot's `Claude Opus 4.8 (1M context)` naming convention keeps the window separate from the reasoning level so the two never collide. The token is resolved against the candidate model's advertised windows — an exact match wins, otherwise the largest supported window not exceeding the request (so `(1m)` selects a model's ~936K long-context tier), and it falls back to the model's default (short) window when no larger tier is available. It applies only to the candidate that carries the token, leaving primary and other fallback models untouched. Also surfaced `contextWindow`/`contextWindowStrict` on `StageOptions` and the workflow tool's direct-task schema for stage-level selection.
+### Changed
+- Changed the builtin `ralph` workflow review fan-out from two reviewers to three independent reviewers, each running on a different primary model family (Claude Fable 5, GPT-5.5 Codex, and Gemini 3.1 Pro) with shared fallbacks, so the adversarial review gets cross-model coverage instead of repeated passes from one model. The review loop stops only when all three reviewers independently approve (find no issues), so a P0–P3 finding from any single reviewer keeps Ralph iterating instead of being out-voted by a majority quorum. Also strengthened the orchestrator's implementation-notes contract to require verifiable evidence for any claims recorded in the notes and reviewer artifacts.
+- Changed the builtin `deep-research-codebase`, `goal`, `ralph`, and `open-claude-design` workflows to run their GitHub Copilot `claude-opus-4.8` fallbacks at the model's largest advertised long-context (~1M/936K) window via the new `(1m)` token, automatically degrading to the 200K short window when Copilot's long-context tier is unavailable. Other models in each fallback chain are unaffected.
+- Aligned the workflows extension peer dependency with upstream pi TUI `^0.79.6` so workflow graph, custom UI, and prompt-broker integrations consume the latest shared TUI compatibility fixes; no workflows extension code changes were made for this metadata sync ([#1413](https://github.com/bastani-inc/atomic/issues/1413)).
+## [0.8.30] - 2026-06-17
 ### Changed
 - Aligned the workflows extension peer dependency with upstream pi TUI `^0.79.4` so workflow graph, custom UI, and prompt-broker integrations consume the latest shared TUI fixes; no workflows extension code changes were made for this metadata sync.

package/dist/builtin/workflows/builtin/deep-research-codebase.ts CHANGED Viewed

@@ -399,7 +399,7 @@ export default defineWorkflow("deep-research-codebase")
         "openai-codex/gpt-5.5:xhigh",
         "github-copilot/gpt-5.5:xhigh",
         "openai/gpt-5.5:xhigh",
-        "github-copilot/claude-opus-4.8:xhigh",
+        "github-copilot/claude-opus-4.8 (1m):xhigh",
         "anthropic/claude-opus-4-8:xhigh"
       ],
       excludedTools: ["ask_user_question"],

package/dist/builtin/workflows/builtin/goal.ts CHANGED Viewed

@@ -976,7 +976,7 @@ export default defineWorkflow("goal")
       fallbackModels: [
           "github-copilot/gpt-5.5:medium",
           "openai/gpt-5.5:medium",
-          "github-copilot/claude-opus-4.8:medium",
+          "github-copilot/claude-opus-4.8 (1m):medium",
           "anthropic/claude-opus-4-8:medium",
       ],
       tools: goalRunnerTools,
@@ -988,7 +988,7 @@ export default defineWorkflow("goal")
           "openai-codex/gpt-5.5:xhigh",
           "github-copilot/gpt-5.5:xhigh",
           "openai/gpt-5.5:xhigh",
-          "github-copilot/claude-opus-4.8:xhigh",
+          "github-copilot/claude-opus-4.8 (1m):xhigh",
           "anthropic/claude-opus-4-8:xhigh"
       ],
       tools: goalRunnerTools,

package/dist/builtin/workflows/builtin/open-claude-design.ts CHANGED Viewed

@@ -407,7 +407,7 @@ export default defineWorkflow("open-claude-design")
     const designModelConfig = {
       model: "anthropic/claude-fable-5:xhigh",
       fallbackModels: [
-          "github-copilot/claude-opus-4.8:xhigh",
+          "github-copilot/claude-opus-4.8 (1m):xhigh",
           "anthropic/claude-opus-4-8:xhigh",
           "github-copilot/claude-sonnet-4.6:high",
           "anthropic/claude-sonnet-4-6:high",

package/dist/builtin/workflows/builtin/ralph.ts CHANGED Viewed

@@ -22,6 +22,11 @@ const DEFAULT_MAX_LOOPS = 10;
 const DEFAULT_RESEARCH_DIR = "research";
 const IMPLEMENTATION_NOTES_FILENAME = "implementation-notes.md";
 const MAX_RESEARCH_SLUG_LENGTH = 80;
+// Reviewer fan-out launches three independent reviewers; the loop stops only when
+// all three reviewers independently approve (find no issues). Requiring unanimous
+// approval means a P0–P3 finding from any single reviewer keeps the loop iterating
+// instead of being out-voted by a majority, so lower-severity issues stay surfaced.
+const REVIEWER_COUNT = 3;
 type ReviewFinding = {
   readonly title: string;
@@ -376,7 +381,7 @@ function renderForkedOrchestratorPrompt(args: {
       "implementation_notes",
       [
         `Keep updating the running Markdown implementation notes file at: ${args.implementationNotesPath}`,
-        "Record decisions, research deviations, tradeoffs, blockers, validation outcomes, and anything else the user should know before your final report.",
+        "Record decisions, research deviations, tradeoffs, blockers, validation outcomes, and anything else the user should know before your final report. Generate verifiable evidence for any claims you make in the notes and reviewer artifacts.",
       ].join("\n"),
     ],
     ["e2e_verification", E2E_VERIFICATION_GUIDANCE],
@@ -464,7 +469,7 @@ async function runRalphWorkflow(
       "openai-codex/gpt-5.5:xhigh",
       "github-copilot/gpt-5.5:xhigh",
       "openai/gpt-5.5:xhigh",
-      "github-copilot/claude-opus-4.8:xhigh",
+      "github-copilot/claude-opus-4.8 (1m):xhigh",
       "anthropic/claude-opus-4-8:xhigh"
     ],
     noTools: "all" as const,
@@ -475,7 +480,7 @@ async function runRalphWorkflow(
     fallbackModels: [
         "github-copilot/gpt-5.5:medium",
         "openai/gpt-5.5:medium",
-        "github-copilot/claude-opus-4.8:medium",
+        "github-copilot/claude-opus-4.8 (1m):medium",
         "anthropic/claude-opus-4-8:medium",
     ],
     excludedTools: ["ask_user_question"],
@@ -486,19 +491,47 @@ async function runRalphWorkflow(
     fallbackModels: [
         "github-copilot/gpt-5.5:medium",
         "openai/gpt-5.5:medium",
-        "github-copilot/claude-opus-4.8:medium",
+        "github-copilot/claude-opus-4.8 (1m):medium",
         "anthropic/claude-opus-4-8:medium",
     ],
     excludedTools: ["ask_user_question"],
   };
-  const reviewerModelConfig = {
+  const reviewerAModelConfig = {
     model: "anthropic/claude-fable-5:xhigh",
     fallbackModels: [
+      "github-copilot/claude-opus-4.8 (1m):xhigh",
+      "anthropic/claude-opus-4-8:xhigh",
       "openai-codex/gpt-5.5:xhigh",
+      "github-copilot/gpt-5.5:xhigh",
+      "openai/gpt-5.5:xhigh"
+    ],
+    excludedTools: ["ask_user_question"],
+    schema: reviewDecisionSchema,
+  };
+  const reviewerBModelConfig = {
+    model: "openai-codex/gpt-5.5:xhigh",
+    fallbackModels: [
       "github-copilot/gpt-5.5:xhigh",
       "openai/gpt-5.5:xhigh",
-      "github-copilot/claude-opus-4.8:xhigh",
+      "anthropic/claude-fable-5:xhigh",
+      "github-copilot/claude-opus-4.8 (1m):xhigh",
+      "anthropic/claude-opus-4-8:xhigh"
+    ],
+    excludedTools: ["ask_user_question"],
+    schema: reviewDecisionSchema,
+  };
+  const reviewerCModelConfig = {
+    model: "github-copilot/gemini-3.1-pro-preview (1m):high",
+    fallbackModels: [
+      "google/gemini-3.1-pro-preview:high",
+      "openai-codex/gpt-5.5:xhigh",
+      "github-copilot/gpt-5.5:xhigh",
+      "openai/gpt-5.5:xhigh",
+      "anthropic/claude-fable-5:xhigh",
+      "github-copilot/claude-opus-4.8 (1m):xhigh",
       "anthropic/claude-opus-4-8:xhigh"
     ],
     excludedTools: ["ask_user_question"],
@@ -789,7 +822,7 @@ async function runRalphWorkflow(
               implementationNotesPath,
               orchestratorReportPath,
             ],
-            ...reviewerModelConfig,
+            ...reviewerAModelConfig,
           },
           {
             name: "reviewer-b",
@@ -799,7 +832,17 @@ async function runRalphWorkflow(
               implementationNotesPath,
               orchestratorReportPath,
             ],
-            ...reviewerModelConfig,
+            ...reviewerBModelConfig,
+          },
+          {
+            name: "reviewer-c",
+            task: reviewPrompt,
+            reads: [
+              researchPath,
+              implementationNotesPath,
+              orchestratorReportPath,
+            ],
+            ...reviewerCModelConfig,
           },
         ],
         {
@@ -828,9 +871,16 @@ async function runRalphWorkflow(
       });
       return { reviewer, artifact_path: artifactPath, decision };
     }));
+    const approvalCount = reviewEntries.filter((review) =>
+      reviewDecisionApproved(review.decision),
+    ).length;
+    // Require unanimous approval: every reviewer must have run and independently
+    // approved. A fan-out error that collapses to a single error entry (fewer than
+    // REVIEWER_COUNT reviews) or any reviewer surfacing a finding keeps the loop
+    // iterating rather than letting a majority paper over outstanding issues.
     approved =
-      reviewEntries.length > 0 &&
-      reviewEntries.every((review) => reviewDecisionApproved(review.decision));
+      reviewEntries.length === REVIEWER_COUNT &&
+      approvalCount === REVIEWER_COUNT;
     latestReviewReportPath = await writeJsonArtifact(
       join(artifactDir, `review-round-${iteration}.json`),
       { iteration, reviews: reviewEntries },
@@ -916,7 +966,7 @@ async function runRalphWorkflow(
 export default defineWorkflow("ralph")
   .description(
-    "Prompt-engineer → research → orchestrate → parallel review loop with bounded iteration.",
+    "Prompt-engineer → research → orchestrate → multi-model parallel review loop with bounded iteration.",
   )
   .input("prompt", Type.String({ description: "The task or goal to research, execute, and refine." }))
   .input("max_loops", Type.Number({

package/dist/builtin/workflows/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@bastani/workflows",
-  "version": "0.8.30-alpha.3",
+  "version": "0.8.31-alpha.1",
   "private": true,
   "description": "Atomic extension for multi-stage workflow authoring and execution.",
   "contributors": [
@@ -83,7 +83,7 @@
   },
   "peerDependencies": {
     "@bastani/atomic": "*",
-    "@earendil-works/pi-tui": "^0.79.4"
+    "@earendil-works/pi-tui": "^0.79.6"
   },
   "peerDependenciesMeta": {
     "@bastani/atomic": {

package/dist/builtin/workflows/src/extension/workflow-schema.ts CHANGED Viewed

@@ -66,7 +66,9 @@ const StageSessionOptionProperties = {
   agentDir: Type.Optional(Type.String()),
   authStorage: Type.Optional(SdkSessionOptionSchema("authStorage")),
   modelRegistry: Type.Optional(SdkSessionOptionSchema("modelRegistry")),
-  model: Type.Optional(Type.Unsafe<WorkflowModelValue>({ description: "Primary model id or SDK model object. String ids may include a reasoning suffix, e.g. openai/gpt-5:high; valid levels: off|minimal|low|medium|high|xhigh." })),
+  model: Type.Optional(Type.Unsafe<WorkflowModelValue>({ description: "Primary model id or SDK model object. String ids may include a reasoning suffix, e.g. openai/gpt-5:high; valid levels: off|minimal|low|medium|high|xhigh. A parenthesized context-window token may precede the suffix, e.g. github-copilot/claude-opus-4.8 (1m):high." })),
+  contextWindow: Type.Optional(Type.Number({ description: "Context-window token budget for the stage session (e.g. 1000000). Non-strict by default: an unsupported value keeps the model's default window. Prefer the per-model `(1m)` token in a model/fallbackModels entry when only specific models should use a larger window." })),
+  contextWindowStrict: Type.Optional(Type.Boolean({ description: "Treat an unsupported contextWindow as an error instead of falling back to the model's default window." })),
   thinkingLevel: Type.Optional(SdkSessionOptionSchema("thinkingLevel")),
   scopedModels: Type.Optional(Type.Array(SdkSessionOptionArrayElementSchema("scopedModels"))),
   noTools: Type.Optional(Type.Unsafe<NonNullable<CreateAgentSessionOptions["noTools"]>>({

package/dist/builtin/workflows/src/runs/foreground/stage-runner.ts CHANGED Viewed

@@ -755,6 +755,11 @@ export function createStageContext(opts: StageRunnerOpts): InternalStageContext
           ...(effectiveStageOptions ?? {}),
           model: candidate.value,
           ...(candidate.reasoningLevel !== undefined ? { thinkingLevel: candidate.reasoningLevel } : {}),
+          // A per-candidate context window (parsed from a parenthesized token in
+          // the model string) overrides any stage-level contextWindow so only
+          // that specific model — e.g. a github-copilot opus fallback — requests
+          // its larger window; other candidates keep the stage default.
+          ...(candidate.contextWindow !== undefined ? { contextWindow: candidate.contextWindow } : {}),
           fallbackModels: undefined,
           fallbackThinkingLevels: undefined,
         };

package/dist/builtin/workflows/src/runs/shared/model-fallback.ts CHANGED Viewed

@@ -1,3 +1,4 @@
+import { getModelDefaultContextWindow, getSupportedContextWindows, parseContextWindowValue } from "@bastani/atomic";
 import type { CreateAgentSessionOptions } from "@bastani/atomic";
 import type {
   WorkflowModelCatalogPort,
@@ -10,14 +11,91 @@ export interface WorkflowResolvedModelCandidate {
   readonly id: string;
   readonly value: WorkflowModelValue;
   readonly reasoningLevel?: WorkflowThinkingLevel;
+  /**
+   * Resolved context-window token budget for this candidate's session, parsed
+   * from a parenthesized authoring token in the model string (e.g.
+   * `github-copilot/claude-opus-4.8 (1m):xhigh`). Resolved against the
+   * candidate model's advertised windows: an exact match wins, otherwise the
+   * largest supported window <= the request (so `(1m)` selects a model's ~936K
+   * long-context tier). Left `undefined` when the model exposes no matching
+   * window, so the session keeps the model's default (short) window.
+   */
+  readonly contextWindow?: number;
 }
 function makeCandidate(
   id: string,
   value: WorkflowModelValue,
   level: WorkflowThinkingLevel | undefined,
+  contextWindow?: number,
 ): WorkflowResolvedModelCandidate {
-  return level !== undefined ? { id, value, reasoningLevel: level } : { id, value };
+  return {
+    id,
+    value,
+    ...(level !== undefined ? { reasoningLevel: level } : {}),
+    ...(contextWindow !== undefined ? { contextWindow } : {}),
+  };
+}
+/**
+ * Extract a trailing parenthesized context-window authoring token, e.g. the
+ * `(1m)` in `github-copilot/claude-opus-4.8 (1m)`. Mirrors GitHub Copilot's
+ * model-name convention (`Claude Opus 4.8 (1M context)`) and intentionally
+ * lives in the model-name portion — *not* a `:` suffix — so it never collides
+ * with the `:off|minimal|low|medium|high|xhigh` reasoning-level suffix.
+ *
+ * Parsed with plain string scanning rather than a regular expression so that
+ * adversarial model strings (e.g. `(` followed by long whitespace runs) cannot
+ * trigger super-linear backtracking (CodeQL js/polynomial-redos).
+ *
+ * @param model - Model string to inspect. Trailing whitespace is ignored when
+ *   looking for the closing `)`. The token is only recognized at the very end
+ *   of the string, so any `:level` reasoning suffix must be split off first.
+ * @returns When a token is found and parses as a context size: the model id
+ *   with the token removed and surrounding whitespace trimmed, plus the parsed
+ *   `requestedContextWindow`. In every other case: `{ baseModel: model }` with
+ *   the input returned exactly as given (not trimmed) and no
+ *   `requestedContextWindow` property.
+ */
+function extractContextWindowToken(
+  model: string,
+): { readonly baseModel: string; readonly requestedContextWindow?: number } {
+  const trimmedEnd = model.trimEnd();
+  if (!trimmedEnd.endsWith(")")) return { baseModel: model };
+  const open = trimmedEnd.lastIndexOf("(");
+  // Reject a missing `(` (-1) and a leading `(` (0): a bare `(1m)` is not a model.
+  if (open <= 0) return { baseModel: model };
+  const inner = trimmedEnd.slice(open + 1, -1);
+  // The token must be a single flat `(...)` group with no nested parentheses.
+  if (inner.includes("(") || inner.includes(")")) return { baseModel: model }; // `open` is the last `(`, so in practice this catches a stray `)`
+  const token = inner.trim();
+  const baseModel = trimmedEnd.slice(0, open).trim();
+  if (token.length === 0 || baseModel.length === 0) return { baseModel: model };
+  const parsed = parseContextWindowValue(token);
+  // A parenthesized token that does not parse as a context size (e.g. an
+  // accidental `(preview)`) is left attached to the model id so the normal
+  // "not available" lookup surfaces the typo instead of being silently dropped.
+  if (parsed.value === undefined) return { baseModel: model };
+  return { baseModel, requestedContextWindow: parsed.value };
+}
+/**
+ * Resolve a requested context-window budget against a candidate model's
+ * advertised windows. Picks the exact value when supported, otherwise the
+ * largest supported window that does not exceed the request (so `(1m)` lands on
+ * a ~936K long-context tier), or `undefined` when nothing fits — in which case
+ * the session keeps the model's default window. Model values that are plain
+ * strings (not resolved against the live catalog) cannot be introspected and
+ * yield `undefined`.
+ *
+ * `undefined` is also returned when the picked window is exactly the model's
+ * default window, because no override is needed in that case.
+ *
+ * @param value - Candidate model value; only non-string values are inspected.
+ * @param requested - Requested context-window size in tokens.
+ * @returns The window to request for this candidate, or `undefined` to leave
+ *   the session on the model's default window.
+ */
+function resolveRequestedContextWindow(
+  value: WorkflowModelValue,
+  requested: number,
+): number | undefined {
+  if (typeof value === "string") return undefined;
+  const supported = getSupportedContextWindows(value);
+  if (supported.length === 0) return undefined;
+  const chosen = supported.includes(requested)
+    ? requested
+    : (() => {
+        const atOrBelow = supported.filter((window) => window <= requested);
+        return atOrBelow.length > 0 ? Math.max(...atOrBelow) : undefined;
+      })();
+  if (chosen === undefined) return undefined;
+  // Leave the window unset when the resolved value equals the model's default so
+  // the session keeps its default; any other resolved value is returned as-is.
+  return chosen === getModelDefaultContextWindow(value) ? undefined : chosen;
 }
 const WORKFLOW_THINKING_LEVELS = ["off", "minimal", "low", "medium", "high", "xhigh"] as const satisfies readonly WorkflowThinkingLevel[];
@@ -34,7 +112,7 @@ export function splitReasoningSuffix(model: string): { readonly baseModel: strin
 }
 function candidateKey(candidate: WorkflowResolvedModelCandidate): string {
-  return `${candidate.id}::${candidate.reasoningLevel ?? ""}`;
+  return `${candidate.id}::${candidate.reasoningLevel ?? ""}::${candidate.contextWindow ?? ""}`;
 }
 interface ModelResolutionFailure {
@@ -99,16 +177,25 @@ function resolveStringModel(
 ): WorkflowResolvedModelCandidate | ModelResolutionFailure {
   const input = rawInput.trim();
   if (!input) return { input: rawInput, reason: "empty model id" };
-  const { baseModel, level } = splitReasoningSuffix(input);
+  const { baseModel: afterReasoning, level } = splitReasoningSuffix(input);
+  const { baseModel, requestedContextWindow } = extractContextWindowToken(afterReasoning);
+  const candidate = (id: string, value: WorkflowModelValue): WorkflowResolvedModelCandidate =>
+    makeCandidate(
+      id,
+      value,
+      level,
+      requestedContextWindow === undefined ? undefined : resolveRequestedContextWindow(value, requestedContextWindow),
+    );
   if (availableModels === undefined) {
-    return makeCandidate(baseModel, baseModel, level);
+    return candidate(baseModel, baseModel);
   }
   const models = uniqueByFullId(availableModels);
   const explicit = models.find((model) => model.fullId === baseModel);
   if (explicit !== undefined) {
-    return makeCandidate(explicit.fullId, explicit.model ?? explicit.fullId, level);
+    return candidate(explicit.fullId, explicit.model ?? explicit.fullId);
   }
   if (baseModel.includes("/")) {
@@ -122,7 +209,7 @@ function resolveStringModel(
     // currentModel — discarding the workflow's defined primary and fallbacks.
     // Pass it through with the reasoning suffix split off; the runtime fallback
     // loop skips it only if the SDK genuinely cannot create a session for it.
-    return makeCandidate(baseModel, baseModel, level);
+    return candidate(baseModel, baseModel);
   }
   const byBareId = models.filter((model) => model.id === baseModel);
@@ -131,14 +218,14 @@ function resolveStringModel(
   }
   if (byBareId.length === 1) {
     const only = byBareId[0]!;
-    return makeCandidate(only.fullId, only.model ?? only.fullId, level);
+    return candidate(only.fullId, only.model ?? only.fullId);
   }
   const preferred = preferredProvider === undefined
     ? undefined
     : byBareId.find((model) => model.provider === preferredProvider);
   if (preferred !== undefined) {
-    return makeCandidate(preferred.fullId, preferred.model ?? preferred.fullId, level);
+    return candidate(preferred.fullId, preferred.model ?? preferred.fullId);
   }
   return {

package/dist/builtin/workflows/src/shared/authoring-contract.d.ts CHANGED Viewed

@@ -116,6 +116,17 @@ export interface StageOptions<TSchemaDef extends TSchema | undefined = TSchema |
     /** Optional structured final-answer schema. When set, the stage receives a schema-specific final-answer tool. */
     readonly schema?: TSchemaDef;
     readonly model?: WorkflowModelValue;
+    /**
+     * Context-window token budget for the stage session. May also be expressed
+     * per-model via a parenthesized token in a `model`/`fallbackModels` entry
+     * (e.g. `github-copilot/claude-opus-4.8 (1m):xhigh`), which is preferred when
+     * only specific fallbacks should use a larger window. Non-strict by default:
+     * an unsupported value keeps the model's default window (see
+     * `contextWindowStrict`).
+     */
+    readonly contextWindow?: number;
+    /** Treat an unsupported `contextWindow` as an error instead of falling back to the model default. */
+    readonly contextWindowStrict?: boolean;
     readonly mcp?: StageMcpOptions;
     readonly tools?: readonly string[];
     readonly noTools?: "all" | "builtin";

package/dist/cli/args.d.ts CHANGED Viewed

@@ -11,6 +11,7 @@ export interface Args {
     systemPrompt?: string;
     appendSystemPrompt?: string[];
     thinking?: ThinkingLevel;
+    contextWindow?: number;
     continue?: boolean;
     resume?: boolean;
     help?: boolean;