npm - @bastani/atomic - Versions diffs - 0.8.30 → 0.8.31-alpha.2 - Mend

@bastani/atomic 0.8.30 → 0.8.31-alpha.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (205) hide show

package/CHANGELOG.md +29 -0
package/README.md +12 -10
package/dist/builtin/cursor/CHANGELOG.md +4 -0
package/dist/builtin/cursor/package.json +2 -2
package/dist/builtin/intercom/CHANGELOG.md +4 -0
package/dist/builtin/intercom/package.json +2 -2
package/dist/builtin/mcp/CHANGELOG.md +4 -0
package/dist/builtin/mcp/package.json +3 -3
package/dist/builtin/subagents/CHANGELOG.md +13 -0
package/dist/builtin/subagents/agents/codebase-online-researcher.md +8 -8
package/dist/builtin/subagents/agents/debugger.md +6 -6
package/dist/builtin/subagents/package.json +4 -4
package/dist/builtin/subagents/skills/effective-liteparse/SKILL.md +118 -0
package/dist/builtin/subagents/skills/effective-liteparse/scripts/search.py +128 -0
package/dist/builtin/subagents/skills/playwright-cli/SKILL.md +404 -0
package/dist/builtin/subagents/skills/playwright-cli/references/element-attributes.md +23 -0
package/dist/builtin/subagents/skills/playwright-cli/references/playwright-tests.md +39 -0
package/dist/builtin/subagents/skills/playwright-cli/references/request-mocking.md +87 -0
package/dist/builtin/subagents/skills/playwright-cli/references/running-code.md +241 -0
package/dist/builtin/subagents/skills/playwright-cli/references/session-management.md +225 -0
package/dist/builtin/subagents/skills/playwright-cli/references/spec-driven-testing.md +305 -0
package/dist/builtin/subagents/skills/playwright-cli/references/storage-state.md +275 -0
package/dist/builtin/subagents/skills/playwright-cli/references/test-generation.md +134 -0
package/dist/builtin/subagents/skills/playwright-cli/references/tracing.md +139 -0
package/dist/builtin/subagents/skills/playwright-cli/references/video-recording.md +143 -0
package/dist/builtin/web-access/CHANGELOG.md +4 -0
package/dist/builtin/web-access/package.json +2 -2
package/dist/builtin/workflows/CHANGELOG.md +16 -0
package/dist/builtin/workflows/README.md +4 -4
package/dist/builtin/workflows/builtin/deep-research-codebase.ts +1 -1
package/dist/builtin/workflows/builtin/goal.ts +2 -2
package/dist/builtin/workflows/builtin/open-claude-design.ts +60 -57
package/dist/builtin/workflows/builtin/ralph.ts +117 -14
package/dist/builtin/workflows/builtin/shared-prompts.ts +1 -1
package/dist/builtin/workflows/package.json +2 -2
package/dist/builtin/workflows/skills/research-codebase/SKILL.md +1 -1
package/dist/builtin/workflows/src/extension/workflow-schema.ts +3 -1
package/dist/builtin/workflows/src/runs/foreground/stage-runner.ts +5 -0
package/dist/builtin/workflows/src/runs/shared/model-fallback.ts +95 -8
package/dist/builtin/workflows/src/shared/authoring-contract.d.ts +11 -0
package/dist/cli/args.d.ts +1 -0
package/dist/cli/args.d.ts.map +1 -1
package/dist/cli/args.js +21 -1
package/dist/cli/args.js.map +1 -1
package/dist/cli/list-models.d.ts.map +1 -1
package/dist/cli/list-models.js +2 -1
package/dist/cli/list-models.js.map +1 -1
package/dist/core/agent-session-services.d.ts +2 -0
package/dist/core/agent-session-services.d.ts.map +1 -1
package/dist/core/agent-session-services.js +2 -0
package/dist/core/agent-session-services.js.map +1 -1
package/dist/core/agent-session.d.ts +18 -0
package/dist/core/agent-session.d.ts.map +1 -1
package/dist/core/agent-session.js +182 -19
package/dist/core/agent-session.js.map +1 -1
package/dist/core/compaction/branch-summarization.d.ts.map +1 -1
package/dist/core/compaction/branch-summarization.js +20 -5
package/dist/core/compaction/branch-summarization.js.map +1 -1
package/dist/core/compaction/context-compaction.d.ts.map +1 -1
package/dist/core/compaction/context-compaction.js +14 -3
package/dist/core/compaction/context-compaction.js.map +1 -1
package/dist/core/context-window.d.ts +39 -0
package/dist/core/context-window.d.ts.map +1 -0
package/dist/core/context-window.js +99 -0
package/dist/core/context-window.js.map +1 -0
package/dist/core/copilot-errors.d.ts +9 -0
package/dist/core/copilot-errors.d.ts.map +1 -0
package/dist/core/copilot-errors.js +32 -0
package/dist/core/copilot-errors.js.map +1 -0
package/dist/core/copilot-model-catalog.d.ts +135 -0
package/dist/core/copilot-model-catalog.d.ts.map +1 -0
package/dist/core/copilot-model-catalog.js +257 -0
package/dist/core/copilot-model-catalog.js.map +1 -0
package/dist/core/export-html/template.js +10 -1
package/dist/core/extensions/types.d.ts +3 -1
package/dist/core/extensions/types.d.ts.map +1 -1
package/dist/core/extensions/types.js.map +1 -1
package/dist/core/model-registry.d.ts +10 -0
package/dist/core/model-registry.d.ts.map +1 -1
package/dist/core/model-registry.js +107 -4
package/dist/core/model-registry.js.map +1 -1
package/dist/core/model-resolver.d.ts.map +1 -1
package/dist/core/model-resolver.js +4 -0
package/dist/core/model-resolver.js.map +1 -1
package/dist/core/project-trust.d.ts.map +1 -1
package/dist/core/project-trust.js +2 -1
package/dist/core/project-trust.js.map +1 -1
package/dist/core/provider-attribution.d.ts.map +1 -1
package/dist/core/provider-attribution.js +17 -7
package/dist/core/provider-attribution.js.map +1 -1
package/dist/core/sdk.d.ts +8 -0
package/dist/core/sdk.d.ts.map +1 -1
package/dist/core/sdk.js +58 -0
package/dist/core/sdk.js.map +1 -1
package/dist/core/session-manager.d.ts +8 -1
package/dist/core/session-manager.d.ts.map +1 -1
package/dist/core/session-manager.js +19 -3
package/dist/core/session-manager.js.map +1 -1
package/dist/core/settings-manager.d.ts +15 -0
package/dist/core/settings-manager.d.ts.map +1 -1
package/dist/core/settings-manager.js +124 -1
package/dist/core/settings-manager.js.map +1 -1
package/dist/core/system-prompt.d.ts.map +1 -1
package/dist/core/system-prompt.js +1 -0
package/dist/core/system-prompt.js.map +1 -1
package/dist/core/tools/edit-diff.d.ts +1 -2
package/dist/core/tools/edit-diff.d.ts.map +1 -1
package/dist/core/tools/edit-diff.js +1 -2
package/dist/core/tools/edit-diff.js.map +1 -1
package/dist/index.d.ts +3 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +2 -0
package/dist/index.js.map +1 -1
package/dist/main.d.ts.map +1 -1
package/dist/main.js +24 -1
package/dist/main.js.map +1 -1
package/dist/modes/index.d.ts +1 -1
package/dist/modes/index.d.ts.map +1 -1
package/dist/modes/index.js.map +1 -1
package/dist/modes/interactive/components/config-selector.d.ts.map +1 -1
package/dist/modes/interactive/components/config-selector.js +5 -7
package/dist/modes/interactive/components/config-selector.js.map +1 -1
package/dist/modes/interactive/components/context-window-selector.d.ts +53 -0
package/dist/modes/interactive/components/context-window-selector.d.ts.map +1 -0
package/dist/modes/interactive/components/context-window-selector.js +136 -0
package/dist/modes/interactive/components/context-window-selector.js.map +1 -0
package/dist/modes/interactive/components/model-selector.d.ts.map +1 -1
package/dist/modes/interactive/components/model-selector.js +2 -1
package/dist/modes/interactive/components/model-selector.js.map +1 -1
package/dist/modes/interactive/components/scoped-models-selector.d.ts.map +1 -1
package/dist/modes/interactive/components/scoped-models-selector.js +4 -1
package/dist/modes/interactive/components/scoped-models-selector.js.map +1 -1
package/dist/modes/interactive/components/settings-selector.d.ts +2 -0
package/dist/modes/interactive/components/settings-selector.d.ts.map +1 -1
package/dist/modes/interactive/components/settings-selector.js +165 -15
package/dist/modes/interactive/components/settings-selector.js.map +1 -1
package/dist/modes/interactive/components/tree-selector.d.ts.map +1 -1
package/dist/modes/interactive/components/tree-selector.js +51 -4
package/dist/modes/interactive/components/tree-selector.js.map +1 -1
package/dist/modes/interactive/interactive-mode.d.ts +6 -1
package/dist/modes/interactive/interactive-mode.d.ts.map +1 -1
package/dist/modes/interactive/interactive-mode.js +115 -55
package/dist/modes/interactive/interactive-mode.js.map +1 -1
package/dist/modes/interactive/model-search.d.ts +7 -0
package/dist/modes/interactive/model-search.d.ts.map +1 -0
package/dist/modes/interactive/model-search.js +6 -0
package/dist/modes/interactive/model-search.js.map +1 -0
package/dist/modes/interactive/theme/theme-controller.d.ts +30 -0
package/dist/modes/interactive/theme/theme-controller.d.ts.map +1 -0
package/dist/modes/interactive/theme/theme-controller.js +108 -0
package/dist/modes/interactive/theme/theme-controller.js.map +1 -0
package/dist/modes/interactive/theme/theme-schema.json +2 -1
package/dist/modes/interactive/theme/theme.d.ts +5 -0
package/dist/modes/interactive/theme/theme.d.ts.map +1 -1
package/dist/modes/interactive/theme/theme.js +70 -29
package/dist/modes/interactive/theme/theme.js.map +1 -1
package/dist/modes/rpc/rpc-client.d.ts +14 -2
package/dist/modes/rpc/rpc-client.d.ts.map +1 -1
package/dist/modes/rpc/rpc-client.js +23 -3
package/dist/modes/rpc/rpc-client.js.map +1 -1
package/dist/modes/rpc/rpc-mode.d.ts +1 -1
package/dist/modes/rpc/rpc-mode.d.ts.map +1 -1
package/dist/modes/rpc/rpc-mode.js +31 -2
package/dist/modes/rpc/rpc-mode.js.map +1 -1
package/dist/modes/rpc/rpc-types.d.ts +23 -0
package/dist/modes/rpc/rpc-types.d.ts.map +1 -1
package/dist/modes/rpc/rpc-types.js.map +1 -1
package/dist/package-manager-cli.d.ts.map +1 -1
package/dist/package-manager-cli.js +39 -9
package/dist/package-manager-cli.js.map +1 -1
package/docs/custom-provider.md +4 -1
package/docs/extensions.md +21 -0
package/docs/json.md +3 -1
package/docs/models.md +78 -2
package/docs/packages.md +13 -9
package/docs/providers.md +3 -0
package/docs/quickstart.md +14 -0
package/docs/rpc.md +80 -1
package/docs/sdk.md +35 -11
package/docs/session-format.md +15 -1
package/docs/sessions.md +1 -1
package/docs/settings.md +12 -2
package/docs/themes.md +3 -1
package/docs/tui.md +1 -1
package/docs/usage.md +12 -9
package/docs/workflows.md +34 -10
package/examples/extensions/custom-provider-anthropic/package-lock.json +2 -2
package/examples/extensions/custom-provider-anthropic/package.json +1 -1
package/examples/extensions/custom-provider-gitlab-duo/package.json +1 -1
package/examples/extensions/gondolin/package-lock.json +2 -2
package/examples/extensions/gondolin/package.json +1 -1
package/examples/extensions/preset.ts +10 -4
package/examples/extensions/provider-payload.ts +5 -5
package/examples/extensions/sandbox/index.ts +2 -2
package/examples/extensions/sandbox/package-lock.json +3 -3
package/examples/extensions/sandbox/package.json +2 -2
package/examples/extensions/subagent/agents.ts +2 -2
package/examples/extensions/subagent/index.ts +4 -2
package/examples/extensions/with-deps/package-lock.json +2 -2
package/examples/extensions/with-deps/package.json +1 -1
package/package.json +5 -5
package/dist/builtin/subagents/skills/browser/EXAMPLES.md +0 -151
package/dist/builtin/subagents/skills/browser/LICENSE.txt +0 -21
package/dist/builtin/subagents/skills/browser/REFERENCE.md +0 -451
package/dist/builtin/subagents/skills/browser/SKILL.md +0 -170

package/docs/rpc.md CHANGED Viewed

@@ -13,6 +13,7 @@ atomic --mode rpc [options]
 Common options:
 - `--provider <name>`: Set the LLM provider (anthropic, openai, google, etc.)
 - `--model <pattern>`: Model pattern or ID (supports `provider/id` and optional `:<thinking>`)
+- `--context-window <tokens>`: Select a supported context-window size for the startup model (`400k`, `1m`, or raw tokens)
 - `--name <name>` / `-n <name>`: Set the session display name at startup
 - `--no-session`: Disable session persistence
 - `--session-dir <path>`: Custom session storage directory
@@ -190,7 +191,7 @@ Response:
 }
 ```
-The `model` field is a full [Model](#model) object or `null`. The `sessionName` field is the display name set via `set_session_name`, or omitted if not set.
+The `model` field is a full [Model](#model) object or `null`. Its `contextWindow` is the active/effective token budget; selectable models may also include `defaultContextWindow` and `contextWindowOptions`. The `sessionName` field is the display name set via `set_session_name`, or omitted if not set.
 #### get_messages
@@ -276,6 +277,66 @@ Response contains an array of full [Model](#model) objects:
 }
 ```
+### Context Window
+#### get_available_context_windows
+List the context-window token budgets supported by the current model and read the active/effective runtime selection.
+```json
+{"type": "get_available_context_windows"}
+```
+Response:
+```json
+{
+  "type": "response",
+  "command": "get_available_context_windows",
+  "success": true,
+  "data": {
+    "contextWindows": [400000, 1000000],
+    "currentContextWindow": 400000,
+    "supportsSelection": true
+  }
+}
+```
+- `contextWindows`: supported token budgets for the active model, sorted ascending.
+- `currentContextWindow`: the active/effective token budget on `model.contextWindow`; omitted when no model is selected.
+- `supportsSelection`: `true` when the active model exposes more than one supported budget.
+#### set_context_window
+Set the active context-window token budget for the current model at runtime.
+```json
+{"type": "set_context_window", "contextWindow": 1000000}
+```
+Compact string values are also accepted:
+```json
+{"type": "set_context_window", "contextWindow": "1m"}
+```
+Response:
+```json
+{"type": "response", "command": "set_context_window", "success": true}
+```
+This command calls `AgentSession.setContextWindow(...)` without `{ persistDefault: true }`: it updates the active model, appends a `context_window_change` session entry and emits `context_window_changed` when the budget changes, but it does **not** write context-window defaults to settings. Use startup `--context-window` or an interactive context-window selection when you intentionally want the effective selection persisted under `defaultContextWindows["provider/modelId"]`.
+Unsupported or malformed selections return the standard RPC error response:
+```json
+{
+  "type": "response",
+  "command": "set_context_window",
+  "success": false,
+  "error": "Context window 2m is not supported by custom/selectable-context. Supported values: 400k, 1m."
+}
+```
+Larger provider context windows may consume more credits/cost. For allowlisted GitHub Copilot long-context models (including `github-copilot/gpt-5.5` and `github-copilot/gemini-3.1-pro-preview`), selecting `1m` raises Atomic's local budget and sends `X-GitHub-Api-Version: 2026-06-01`; GitHub applies the long-context billing tier server-side by prompt token count. That tier consumes more Copilot AI credits and requires Copilot long-context/usage-based billing entitlement; otherwise, requests over GitHub's server cap are rejected with a friendly hint.
 ### Thinking
 #### set_thinking_level
@@ -760,6 +821,7 @@ Events are streamed to stdout as JSON lines during agent operation. Events do NO
 | `tool_execution_update` | Tool execution progress (streaming output) |
 | `tool_execution_end` | Tool completes |
 | `queue_update` | Pending steering/follow-up queue changed |
+| `context_window_changed` | Active context-window token budget changed |
 | `compaction_start` | Default Verbatim Compaction begins |
 | `compaction_end` | Default Verbatim Compaction completes |
 | `context_compaction_start` | Compatibility `context_compact` RPC begins |
@@ -911,6 +973,19 @@ Emitted whenever the pending steering or follow-up queue changes.
 }
 ```
+### context_window_changed
+Emitted when the active context-window token budget changes through RPC `set_context_window`, through `AgentSession.setContextWindow()` in an SDK-backed runtime, or when in-place tree navigation replays a branch-scoped `context_window_change` entry. Navigation replay updates the active model for accurate budgeting and compaction but does not append another session entry or write context-window defaults to settings.
+```json
+{
+  "type": "context_window_changed",
+  "contextWindow": 1000000
+}
+```
+Larger provider context windows may consume more credits/cost. Prefer the model default unless the additional repository/session context is useful for the current task. For allowlisted GitHub Copilot long-context models such as `github-copilot/gpt-5.5` and `github-copilot/gemini-3.1-pro-preview`, a `1m` selection raises Atomic's local budget and sends `X-GitHub-Api-Version: 2026-06-01`; GitHub applies the long-context billing tier server-side by prompt size. That tier consumes more Copilot AI credits and requires long-context/usage-based billing entitlement.
 ### compaction_start / compaction_end
 Emitted when default Verbatim Compaction runs, whether manual or automatic. The result records deletion targets and stats rather than a generated summary.
@@ -1234,6 +1309,8 @@ Source files and installed definitions:
   "reasoning": true,
   "input": ["text", "image"],
   "contextWindow": 200000,
+  "defaultContextWindow": 200000,
+  "contextWindowOptions": [200000, 1000000],
   "maxTokens": 16384,
   "cost": {
     "input": 3.0,
@@ -1244,6 +1321,8 @@ Source files and installed definitions:
 }
 ```
+`contextWindow` is the active/effective token budget used by Atomic's local budgeting, footer/stats, and compaction logic. `defaultContextWindow` is the model's scalar default before a session/runtime override, and `contextWindowOptions` lists selectable token budgets when the model supports more than one size. RPC clients can read/select the active runtime budget with `get_available_context_windows` and `set_context_window`; the runtime command does not persist context-window defaults to settings.
 ### UserMessage
 ```json

package/docs/sdk.md CHANGED Viewed

@@ -107,11 +107,14 @@ interface AgentSession {
   sessionFile: string | undefined;
   sessionId: string;
-  // Model control
+  // Model, thinking, and context-window control
   setModel(model: Model): Promise<void>;
   setThinkingLevel(level: ThinkingLevel): void;
+  setContextWindow(contextWindow: number, options?: { persistDefault?: boolean }): void;
   cycleModel(): Promise<ModelCycleResult | undefined>;
   cycleThinkingLevel(): ThinkingLevel | undefined;
+  getAvailableContextWindows(): number[];
+  supportsContextWindowSelection(): boolean;
   // State access
   agent: Agent;
@@ -121,7 +124,7 @@ interface AgentSession {
   isStreaming: boolean;
   // In-place tree navigation within the current session file
-  navigateTree(targetId: string, options?: { summarize?: boolean; customInstructions?: string; replaceInstructions?: boolean; label?: string }): Promise<{ editorText?: string; cancelled: boolean }>;
+  navigateTree(targetId: string, options?: { summarize?: boolean; customInstructions?: string; replaceInstructions?: boolean; label?: string }): Promise<{ editorText?: string; cancelled: boolean; aborted?: boolean; summaryEntry?: BranchSummaryEntry }>;
   // Verbatim Compaction (deletion-only Context Compaction)
   compact(): Promise<ContextCompactionResult>;
@@ -337,10 +340,13 @@ session.subscribe((event) => {
       // event.toolResults: tool results from this turn
       break;
-    // Session events (queue, compaction, retry)
+    // Session events (queue, context-window, compaction, retry)
     case "queue_update":
       console.log(event.steering, event.followUp);
       break;
+    case "context_window_changed":
+      console.log(`Context window: ${event.contextWindow}`);
+      break;
     case "compaction_start":
     case "compaction_end":
     case "auto_retry_start":
@@ -412,6 +418,8 @@ const available = await modelRegistry.getAvailable();
 const { session } = await createAgentSession({
   model: opus,
   thinkingLevel: "medium", // off, minimal, low, medium, high, xhigh
+  contextWindow: 1_000_000, // optional; must be supported by the selected model unless non-strict fallback is acceptable
+  contextWindowStrict: true, // optional; return contextWindowError instead of warning/fallback when unsupported
   // Models for cycling (CTRL+P in interactive mode)
   scopedModels: [
@@ -429,6 +437,12 @@ If no model is provided:
 2. Uses default from settings
 3. Falls back to first available model
+Context-window selection is independent from `thinkingLevel`. `contextWindow` accepts a raw token count such as `400_000` or `1_000_000`; for most providers the value must be present in the model's supported context windows (`model.contextWindowOptions` plus the scalar default). GitHub Copilot is the only provider with rounded long-context budget handling: when a tiered Copilot model advertises a long tier below the branded request (for example `936_000` for a `1_000_000` request), Atomic selects the largest advertised Copilot long tier at or below the request instead of falling back to the short tier. Settings lookup first checks the selected model's `defaultContextWindows["provider/modelId"]` entry, then the optional global `defaultContextWindow` fallback; unsupported model-specific settings keep the model default and return `contextWindowWarning`, while unsupported global fallback values are ignored silently as not applicable to the active model. When you pass `contextWindowStrict: true`, an unsupported explicit selection is reported as `contextWindowError` so callers can fail before prompting. A successful explicit `contextWindow` startup option is journaled as a `context_window_change` entry even when it equals the scalar model default, so the user's explicit budget choice survives future settings changes and resume.
+At runtime, use `session.getAvailableContextWindows()` to inspect supported values, `session.supportsContextWindowSelection()` to check whether more than one value is selectable, and `session.setContextWindow(tokens, { persistDefault })` to change the active model budget. `setContextWindow()` journals a `context_window_change` entry only when the active value changes. Passing `{ persistDefault: true }` also writes the effective selected budget to `defaultContextWindows["provider/modelId"]` in settings instead of the global fallback, so a Copilot prompt cap such as `936k` does not leak into Anthropic, Cursor, or other providers. Tree navigation replays the target branch's `context_window_change` state into the active model without adding another journal entry or changing settings. Larger provider context windows may consume more credits/cost, so opt into larger values deliberately. For allowlisted GitHub Copilot long-context models (including `github-copilot/gpt-5.5` and `github-copilot/gemini-3.1-pro-preview`), selecting `1m` raises Atomic's local budget to the model's advertised `922k`/`936k` tier and sends `X-GitHub-Api-Version: 2026-06-01`; GitHub applies the long-context tier server-side by prompt token count. That tier consumes more Copilot AI credits and requires long-context/usage-based billing entitlement.
+The package root exports the same context-window helpers and types used by the runtime: `parseContextWindowValue()`, `formatContextWindow()`, `validateContextWindowValue()`, `normalizeContextWindowOptions()`, `getModelDefaultContextWindow()`, `getSupportedContextWindows()`, `withContextWindowOptions()`, `selectContextWindow()`, `ContextWindowParseResult`, `ContextWindowSelection`, `ContextWindowSelectionError`, and `ContextWindowSelectionOptions`. Importing from `@bastani/atomic` also includes the `@earendil-works/pi-ai` `Model<Api>` augmentation for `contextWindowOptions` and `defaultContextWindow`, so SDK consumers can use the helper types without importing internal source paths.
 > See [examples/sdk/02-custom-model.ts](https://github.com/bastani-inc/atomic/blob/main/packages/coding-agent/examples/sdk/02-custom-model.ts)
 ### API Keys and OAuth
@@ -532,11 +546,11 @@ const { session } = await createAgentSession({
 ```typescript
 import { createAgentSession, type BashCommandPolicy } from "@bastani/atomic";
-const browseOnly: BashCommandPolicy = {
+const playwrightCliOnly: BashCommandPolicy = {
   default: "deny",
   allow: [
-    "which browse",
-    { prefix: "browse " },
+    "which playwright-cli",
+    { prefix: "playwright-cli " },
     { prefix: "grep " },
     { glob: "bun test test/unit/*.test.ts" },
     { regex: "^rg\\b" },
@@ -547,19 +561,19 @@ const browseOnly: BashCommandPolicy = {
 const { session } = await createAgentSession({
   tools: ["read", "bash"],
-  bashPolicy: browseOnly,
+  bashPolicy: playwrightCliOnly,
 });
 ```
 Rules match exact command strings, prefixes, command-string globs, or JavaScript regular expressions. `default` defaults to `"allow"` for backward compatibility; set `default: "deny"` for an allowlist-only shell. Omitting `bashPolicy`, passing `{}`, or passing a default-allow policy with no `allow`/`deny` rules is a compatibility no-op and does not parse the command. Empty `allow`/`deny` arrays and match-only default-allow policies are treated the same; malformed policy objects still fail closed.
-Glob rules match command target strings, not filesystem path segments. `*` and `?` can match `/`, so `{ glob: "browse *" }` matches `browse http://localhost:3000`, `browse docs/index.html`, and `browse ./preview/output.html`, while still matching the whole target so `echo browse docs/index.html` does not match unless the pattern includes leading wildcards. Backslash escapes the next glob character when you need a literal `*`, `?`, or bracket; inside bracket classes, escaped metacharacters such as `\-`, `\^`, `\]`, `\[`, and `\\` stay literal instead of becoming regex ranges, negation markers, class delimiters, or backslash escapes. Malformed glob bracket classes or ranges, such as `{ glob: "echo [z-a]" }`, fail closed as `invalid-policy` rather than surfacing raw regular-expression errors.
+Glob rules match command target strings, not filesystem path segments. `*` and `?` can match `/`, so `{ glob: "playwright-cli *" }` matches `playwright-cli http://localhost:3000`, `playwright-cli docs/index.html`, and `playwright-cli ./preview/output.html`, while still matching the whole target so `echo playwright-cli docs/index.html` does not match unless the pattern includes leading wildcards. Backslash escapes the next glob character when you need a literal `*`, `?`, or bracket; inside bracket classes, escaped metacharacters such as `\-`, `\^`, `\]`, `\[`, and `\\` stay literal instead of becoming regex ranges, negation markers, class delimiters, or backslash escapes. Malformed glob bracket classes or ranges, such as `{ glob: "echo [z-a]" }`, fail closed as `invalid-policy` rather than surfacing raw regular-expression errors.
 Runtime policy validation is part of enforcement for JavaScript/JSON callers: a provided policy must be a non-null object with only the top-level keys `default`, `allow`, `deny`, and `match`; typoed or extra keys such as `denny` or `extra` are rejected as `invalid-policy` even when the policy otherwise looks like default-allow. `allow`/`deny` must be arrays when present, rules must be non-empty strings or one-variant objects with string values, regex flags must be strings, and invalid regexes, invalid globs, or stateful `g`/`y` flags are rejected as `invalid-policy` before shell execution.
-By default, `match: "segments"` parses shell separators and substitutions and requires every executable segment to pass. Separators include pipes, `&&`, `||`, `;`, background `&`, and unquoted line terminators: LF, CRLF, and bare CR are command separators rather than ordinary whitespace. Bash noclobber redirection `>|` is treated as redirection syntax rather than a pipeline separator after a command head, so `echo ok >|/tmp/out` remains one `echo` segment. For example, `browse snapshot | grep title` must satisfy both the `browse` rule and the `grep` rule, and `browse snapshot; rm -rf /` or `browse snapshot\nrm -rf /` is blocked when `rm` is denied or when `default: "deny"` has no matching allow rule. Segment mode also checks command substitutions (`$(...)`, backticks) and process substitutions (`<(...)`, `>(...)`). Syntax Atomic cannot safely segment is rejected before a shell process starts.
+By default, `match: "segments"` parses shell separators and substitutions and requires every executable segment to pass. Separators include pipes, `&&`, `||`, `;`, background `&`, and unquoted line terminators: LF, CRLF, and bare CR are command separators rather than ordinary whitespace. Bash noclobber redirection `>|` is treated as redirection syntax rather than a pipeline separator after a command head, so `echo ok >|/tmp/out` remains one `echo` segment. For example, `playwright-cli snapshot | grep title` must satisfy both the `playwright-cli` rule and the `grep` rule, and `playwright-cli snapshot; rm -rf /` or `playwright-cli snapshot\nrm -rf /` is blocked when `rm` is denied or when `default: "deny"` has no matching allow rule. Segment mode also checks command substitutions (`$(...)`, backticks) and process substitutions (`<(...)`, `>(...)`). Syntax that Atomic cannot safely segment is rejected before a shell process starts.
-Segment mode requires each command head to be a statically identifiable literal word. Literal names such as `grep`, `./script`, `/usr/bin/env`, `bun`, `browse`, and names containing hyphens, underscores, dots, or slashes are accepted when they contain no shell expansion syntax. Atomic conservatively rejects Bash reserved words and compound introducers (`coproc`, `if`, `for`, `while`, `case`, `{`, `}`, `!`), leading redirection syntax (`>file cmd`, `2>file cmd`, `<file cmd`, `&>file cmd`, `>|file cmd`, `<&0 cmd`, `>&2 cmd`), redirection operators attached to the command-head word (`cmd>file`, `cmd>>file`, `cmd>|file`, `cmd2>file`, `cmd>&2`, `cmd</tmp/in`), leading environment assignment words (`PATH=/tmp:$PATH browse snapshot`, `LD_PRELOAD=/tmp/x browse snapshot`, `FOO=bar`), variable or parameter-expanded heads (`$cmd`, `${cmd}`), quote- or escape-constructed heads (`r''m`, `"rm"`, `r\m`), tilde/glob/brace-expanded heads (`~/bin/rm`, `r*m`, `{rm,echo}`), and command/process substitutions or backticks embedded in the head. Substitutions in argument positions are still parsed so nested commands must also pass the policy.
+Segment mode requires each command head to be a statically identifiable literal word. Literal names such as `grep`, `./script`, `/usr/bin/env`, `bun`, `playwright-cli`, and names containing hyphens, underscores, dots, or slashes are accepted when they contain no shell expansion syntax. Atomic conservatively rejects Bash reserved words and compound introducers (`coproc`, `if`, `for`, `while`, `case`, `{`, `}`, `!`), leading redirection syntax (`>file cmd`, `2>file cmd`, `<file cmd`, `&>file cmd`, `>|file cmd`, `<&0 cmd`, `>&2 cmd`), redirection operators attached to the command-head word (`cmd>file`, `cmd>>file`, `cmd>|file`, `cmd2>file`, `cmd>&2`, `cmd</tmp/in`), leading environment assignment words (`PATH=/tmp:$PATH playwright-cli snapshot`, `LD_PRELOAD=/tmp/x playwright-cli snapshot`, `FOO=bar`), variable or parameter-expanded heads (`$cmd`, `${cmd}`), quote- or escape-constructed heads (`r''m`, `"rm"`, `r\m`), tilde/glob/brace-expanded heads (`~/bin/rm`, `r*m`, `{rm,echo}`), and command/process substitutions or backticks embedded in the head. Substitutions in argument positions are still parsed so nested commands must also pass the policy.
 Use `match: "whole"` only when you intentionally want rules to match the raw command string as-is. Whole-command prefix rules can allow shell operators inside the same raw string.
@@ -991,6 +1005,12 @@ interface CreateAgentSessionResult {
   // Warning if session model couldn't be restored
   modelFallbackMessage?: string;
+  // Warning if a saved/default context window could not be applied to the selected model
+  contextWindowWarning?: string;
+  // Error if an explicit strict context-window selection is unsupported
+  contextWindowError?: string;
 }
 interface LoadExtensionsResult {
@@ -1236,7 +1256,8 @@ DefaultResourceLoader
 type ResourceLoader
 createEventBus
-// Helpers
+// Constants and helpers
+CONFIG_DIR_NAME
 defineTool
 STRUCTURED_OUTPUT_TOOL_NAME
 createStructuredOutputTool
@@ -1246,6 +1267,9 @@ getPackageDir
 getReadmePath
 getDocsPath
 getExamplesPath
+generateDiffString
+generateUnifiedPatch
+type EditDiffResult
 // Session management
 SessionManager

package/docs/session-format.md CHANGED Viewed

@@ -216,6 +216,16 @@ Emitted when the user changes the thinking/reasoning level.
 {"type":"thinking_level_change","id":"e5f6g7h8","parentId":"d4e5f6g7","timestamp":"2024-12-03T14:06:00.000Z","thinkingLevel":"high"}
 ```
+### ContextWindowChangeEntry
+Emitted when the user selects a supported context-window size for the active model. The value is a token count, independent of thinking/reasoning level. Explicit startup selections are journaled even when they equal the model's scalar default so the user's budget choice survives later settings changes and resume.
+```json
+{"type":"context_window_change","id":"f6g7h8i9","parentId":"e5f6g7h8","timestamp":"2024-12-03T14:07:00.000Z","contextWindow":1000000}
+```
+`buildSessionContext()` replays the latest `context_window_change` on the active branch. In-place tree navigation also applies the branch's replayed context window to the active model without appending another `context_window_change` entry or writing context-window defaults to settings. If a historical value is no longer supported by the current model, session creation/navigation falls back to the model default the same way other context-window restore paths do.
 ### CompactionEntry
 Retired summary-compaction entry. Atomic no longer produces this entry type, does not treat it as an active compaction boundary, and does not inject its generated summary into active LLM context. Historical JSONL files may still contain these lines for audit/export compatibility.
@@ -312,7 +322,7 @@ Entries form a tree:
 `buildSessionContext()` walks from the current leaf to the root, producing the message list for the LLM:
 1. Collects all entries on the active branch path
-2. Extracts current model and thinking level settings
+2. Extracts current model, thinking level, and context-window settings
 3. Applies every `ContextCompactionEntry` logical deletion on that path, filtering targeted entries/content blocks from active context while leaving retained content unchanged
 4. Converts `BranchSummaryEntry` and `CustomMessageEntry` to appropriate message formats
 5. Ignores retired `CompactionEntry` lines for active LLM context; they remain archival JSONL data only
@@ -358,6 +368,9 @@ for (const line of lines) {
     case "thinking_level_change":
       console.log(`[${entry.id}] Thinking: ${entry.thinkingLevel}`);
       break;
+    case "context_window_change":
+      console.log(`[${entry.id}] Context window: ${entry.contextWindow}`);
+      break;
   }
 }
 ```
@@ -385,6 +398,7 @@ Key methods for working with sessions programmatically.
 ### Instance Methods - Appending (all return entry ID)
 - `appendMessage(message)` - Add message
 - `appendThinkingLevelChange(level)` - Record thinking change
+- `appendContextWindowChange(contextWindow)` - Record context-window selection in tokens
 - `appendModelChange(provider, modelId)` - Record model change
 - `appendContextCompaction(deletedTargets, protectedEntryIds, stats, backupPath?)` - Add logical deletion compaction
 - `appendCustomEntry(customType, data?)` - Extension state (not in context)

package/docs/sessions.md CHANGED Viewed

@@ -142,6 +142,6 @@ See [Compaction](/compaction) for Verbatim Compaction, branch summarization inte
 ## Session Format
-Session files are JSONL and contain message entries, model changes, thinking-level changes, labels, context compactions, branch summaries, extension entries, and retired legacy `type:"compaction"` records from older sessions.
+Session files are JSONL and contain message entries, model changes, thinking-level changes, context-window changes, labels, context compactions, branch summaries, extension entries, and retired legacy `type:"compaction"` records from older sessions.
 For parsers, extensions, SDK usage, and the full SessionManager API, see [Session Format](/session-format).

package/docs/settings.md CHANGED Viewed

@@ -227,18 +227,27 @@ Normally the package manager's global modules location is queried using `root -g
 When multiple sources specify a session directory, precedence is `--session-dir`, `ATOMIC_CODING_AGENT_SESSION_DIR`, then `sessionDir` in settings.json.
-### Model Cycling
+### Models
 | Setting | Type | Default | Description |
 |---------|------|---------|-------------|
 | `enabledModels` | string[] | - | Model patterns for CTRL+P cycling (same format as `--models` CLI flag) |
+| `defaultContextWindow` | number \| string | model default | Optional global fallback context window for models that expose selectable context windows. Accepts raw token counts or compact labels such as `400k` and `1m`. Unsupported values are ignored for models that do not support them. |
+| `defaultContextWindows` | object | `{}` | Per-model preferred context windows keyed as `provider/modelId`. The interactive `/model` context picker writes this setting so a Copilot-specific prompt cap such as `936k` does not leak into Anthropic, Cursor, or other providers. |
 ```json
 {
-  "enabledModels": ["claude-*", "gpt-4o", "gemini-2*"]
+  "enabledModels": ["claude-*", "gpt-4o", "gemini-2*"],
+  "defaultContextWindow": "1m",
+  "defaultContextWindows": {
+    "github-copilot/claude-opus-4.8": "936k",
+    "github-copilot/gpt-5.5": "922k"
+  }
 }
 ```
+Context-window settings are independent of `defaultThinkingLevel`: selecting a larger context window does not change reasoning effort. Interactive users can change the active model's budget through the `/model` selection flow, which prompts for a context window whenever the chosen model supports more than one window and persists the effective selection under `defaultContextWindows["provider/modelId"]`. Atomic treats `defaultContextWindow` as a broad fallback only: if the active model does not support that value, the model's own default is used without a startup warning; targeted `defaultContextWindows` entries still warn when they become unsupported for their exact model. Larger provider context windows can carry higher usage cost. For GitHub Copilot allowlisted long-context models (including `github-copilot/gpt-5.5` and `github-copilot/gemini-3.1-pro-preview`), selecting `1m` raises Atomic's local prompt budget to the largest advertised long-context tier at or below that rounded request (for example `922k` or `936k`) and sends `X-GitHub-Api-Version: 2026-06-01`; GitHub then applies the long-context tier server-side by prompt token count. That tier consumes more Copilot AI credits and requires Copilot long-context/usage-based billing entitlement; otherwise, requests over the server cap are rejected with a friendly hint. Custom providers and explicit model overrides can still declare their own selectable `contextWindowOptions`.
 ### Markdown
 | Setting | Type | Default | Description |
@@ -297,6 +306,7 @@ See [Atomic packages](/packages) for package management details.
   "defaultProvider": "anthropic",
   "defaultModel": "claude-sonnet-4-20250514",
   "defaultThinkingLevel": "medium",
+  "defaultContextWindow": "400k",
   "theme": "dark",
   "compaction": {
     "enabled": true,

package/docs/themes.md CHANGED Viewed

@@ -37,6 +37,8 @@ Select a theme via `/settings` or in `settings.json`:
 }
 ```
+Use `"theme": "light-theme/dark-theme"` for automatic mode. Atomic chooses the first theme when the terminal reports a light color scheme and the second theme for dark terminals, and it follows terminal color-scheme changes when supported.
 On first run, Atomic detects your terminal background and defaults to `dark` or `light`.
 ## Creating a Custom Theme
@@ -137,7 +139,7 @@ vim ~/.atomic/agent/themes/my-theme.json
 }
 ```
-- `name` is required and must be unique.
+- `name` is required, must be unique, and must not contain `/`.
 - `vars` is optional. Define reusable colors here, then reference them in `colors`.
 - `colors` must define all 51 required tokens.

package/docs/tui.md CHANGED Viewed

@@ -250,7 +250,7 @@ md.setText("Updated markdown");
 ### Image
-Renders images in supported terminals (Kitty, iTerm2, Ghostty, WezTerm).
+Renders images in supported terminals (Kitty, iTerm2, Ghostty, WezTerm, Warp).
 ```typescript
 const image = new Image(

package/docs/usage.md CHANGED Viewed

@@ -131,17 +131,20 @@ atomic [options] [@files...] [messages...]
 ### Package Commands
 ```bash
-atomic install <source> [-l]     # Install package, -l for project-local
-atomic remove <source> [-l]      # Remove package
-atomic uninstall <source> [-l]   # Alias for remove
-atomic update [source|self|atomic] # Update Atomic and packages; skips pinned packages
-atomic update --extensions       # Update packages only
-atomic update --self             # Update Atomic only
-atomic update --extension <src>  # Update one package
-atomic list                      # List installed packages
-atomic config                    # Enable/disable package resources
+atomic install <source> [-l]       # Install package, -l for project-local
+atomic remove <source> [-l]        # Remove package
+atomic uninstall <source> [-l]     # Alias for remove
+atomic update [source|self|atomic] # Update Atomic only, or one package source
+atomic update --all                # Update Atomic and packages; reconcile pinned git refs
+atomic update --extensions         # Update packages only; reconcile pinned git refs
+atomic update --self               # Update Atomic only
+atomic update --extension <src>    # Update one package
+atomic list                        # List installed packages
+atomic config                      # Enable/disable package resources
 ```
+These commands manage Atomic packages, and `atomic update` can update the Atomic CLI installation. To uninstall Atomic itself, see [Quickstart](/quickstart#uninstall). `atomic config` and project package commands accept `--approve`/`--no-approve` to trust or ignore project-local settings for one command. `atomic update` never prompts for project trust.
 See [Atomic Packages](/packages) for package sources and security notes.
 ### Modes

package/docs/workflows.md CHANGED Viewed

@@ -153,7 +153,7 @@ For the builtin result tables below, `deep-research-codebase`, `goal`, and `ralp
 |---|---|---|
 | `deep-research-codebase` | Scout + research-history chain → parallel specialist waves → aggregator. Indexes the whole repo and synthesizes findings. | Broad or cross-cutting research before you decide what to change. Prefer `/skill:research-codebase` for one subsystem. |
 | `goal` | Persisted goal ledger → bounded worker turns → receipts → three-reviewer gate → deterministic reducer → final report. | Small-to-medium scope changes when you can identify the work surface, state the exact outcome, and name the validation that proves it is done — for example tests, lint/typecheck, docs builds, or observable behavior. |
-| `ralph` | Prompt-engineering → codebase/online research → sub-agent orchestration → parallel review → optional final-stage PR handoff. | Larger migrations, broad refactors, and multi-package changes where you want Atomic to transform the prompt into a research question, research the codebase before implementing, delegate through sub-agents, review, iterate, and optionally allow only the final `pull-request` stage to attempt PR creation with `create_pr=true`. |
+| `ralph` | Prompt-engineering → codebase/online research → sub-agent orchestration → multi-model parallel review → optional final-stage PR handoff. | Larger migrations, broad refactors, and multi-package changes where you want Atomic to transform the prompt into a research question, research the codebase before implementing, delegate through sub-agents, review, iterate, and optionally allow only the final `pull-request` stage to attempt PR creation with `create_pr=true`. |
 | `open-claude-design` | Design-system onboarding → reference import → HTML generation → impeccable-driven refinement → quality gate → rich HTML handoff. Renders a live `preview.html` you can iterate against (opens through `browser` when available). | UI, page, component, theme, or design-token work that benefits from generation + critique loops. |
 ### `deep-research-codebase`
@@ -224,7 +224,7 @@ Run examples:
 Write the `objective` like a compact acceptance spec. Say what should exist when the run is done, how you want testing handled, which command(s) or manual checks matter, and what outcome proves completion. The workflow is intentionally lean: it does not first generate an RFC or migration plan, so the developer-supplied objective is where scope, validation, and completion criteria belong.
-The worker may claim readiness, but it cannot finalize completion. Workers and reviewers are prompted to verify user-visible behavior end-to-end when practical, using browser-skilled subagents for web/frontend flows that may depend on backend/API behavior and tmux-skilled subagents for TUI or terminal-app scenarios. Three reviewers independently inspect the ledger, worker receipt, repository state, and diff against `base_branch`; each returns structured JSON with findings, evidence, verification still remaining, and an optional blocker. A TypeScript reducer marks the goal complete only when reviewer quorum approves, marks blocked only when the same dependency/tool blocker repeats for the blocker threshold, continues when evidence is missing, and returns `needs_human` when `max_turns` is exhausted or worker execution fails.
+The worker may claim readiness, but it cannot finalize completion. Workers and reviewers are prompted to verify user-visible behavior end-to-end when practical, using `playwright-cli`-skilled subagents for web/frontend flows that may depend on backend/API behavior and tmux-skilled subagents for TUI or terminal-app scenarios. Three reviewers independently inspect the ledger, worker receipt, repository state, and diff against `base_branch`; each returns structured JSON with findings, evidence, verification still remaining, and an optional blocker. A TypeScript reducer marks the goal complete only when reviewer quorum approves, marks blocked only when the same dependency/tool blocker repeats for the blocker threshold, continues when evidence is missing, and returns `needs_human` when `max_turns` is exhausted or worker execution fails.
 Result fields:
@@ -262,7 +262,7 @@ Run examples:
 /workflow ralph prompt="Safely implement the API refactor" git_worktree_dir=../atomic-ralph-api-wt base_branch=main
 ```
-Each `ralph` iteration starts by prompt-engineering the user prompt with `/skill:prompt-engineer Transform the following user prompt to a codebase and online research question which can be thoroughly explored: ...`, then researches that transformed question with `/skill:research-codebase ...` and writes the findings under `research/`. The orchestrator treats that research artifact as its primary implementation context, initializes/updates an OS-temp implementation notes file, delegates implementation through sub-agents, and asks two reviewers to inspect the patch directly against `base_branch`. Ralph's orchestrator and reviewers are prompted to verify user-visible behavior end-to-end when practical, using browser-skilled subagents for web/frontend flows that may depend on backend/API behavior and tmux-skilled subagents for TUI or terminal-app scenarios. If reviewers find issues, the next prompt-engineering and research stages receive the review artifact path so follow-up research can address unresolved findings, and research stages fork from prior research session data when available. The loop stops when every reviewer approves or `max_loops` is reached. By default Ralph does not start the final `pull-request` stage, and `pr_report` is omitted. Prompt text alone does not opt in. Pass `create_pr=true` only when you explicitly want the final `pull-request` stage to inspect provider credentials and attempt provider-appropriate PR/MR/review creation, such as GitHub `gh`, Azure Repos `az repos pr create`, or Sapling/Phabricator tooling; Ralph's own PR-creation instructions live in that final stage.
+Each `ralph` iteration starts by prompt-engineering the user prompt with `/skill:prompt-engineer Transform the following user prompt to a codebase and online research question which can be thoroughly explored: ...`, then researches that transformed question with `/skill:research-codebase ...` and writes the findings under `research/`. The orchestrator treats that research artifact as its primary implementation context, initializes/updates an OS-temp implementation notes file while generating verifiable evidence for any claims it records in the notes and reviewer artifacts, delegates implementation through sub-agents, and asks three independent reviewers to inspect the patch directly against `base_branch`. The reviewer fan-out runs each reviewer on a different primary model family (with shared fallbacks) so the adversarial review gets cross-model coverage instead of three passes from one model. Ralph's orchestrator and reviewers are prompted to verify user-visible behavior end-to-end when practical, using `playwright-cli`-skilled subagents for web/frontend flows that may depend on backend/API behavior and tmux-skilled subagents for TUI or terminal-app scenarios. For UI-applicable or full-stack changes, the orchestrator runs a `playwright-cli` end-to-end QA pass and records a reviewable proof video (referenced in the implementation notes and surfaced as `qa_video_path`); when `create_pr=true`, the final `pull-request` stage attaches or links that video to the created PR/MR/review. If reviewers find issues, the next prompt-engineering and research stages receive the review artifact path so follow-up research can address unresolved findings, and research stages fork from prior research session data when available. The loop stops only when all three reviewers independently approve (each finds no issues) or `max_loops` is reached, so a P0–P3 finding from any single reviewer keeps Ralph iterating instead of being out-voted by a majority quorum. By default Ralph does not start the final `pull-request` stage, and `pr_report` is omitted. Prompt text alone does not opt in. Pass `create_pr=true` only when you explicitly want the final `pull-request` stage to inspect provider credentials and attempt provider-appropriate PR/MR/review creation, such as GitHub `gh`, Azure Repos `az repos pr create`, or Sapling/Phabricator tooling; Ralph's own PR-creation instructions live in that final stage.
 Set `git_worktree_dir` when you want Ralph's worker stages isolated in a reusable Git worktree. Relative paths resolve from the invoking repository root, existing same-repository worktree roots are reused, and missing paths are created from `base_branch`. Ralph preserves the invoking repo-relative cwd inside the worktree, so launching from `repo/packages/api` with `git_worktree_dir=../repo-wt` runs stages from `../repo-wt/packages/api`.
@@ -276,6 +276,7 @@ Result fields:
 | `research` | Latest research report text or artifact reference. |
 | `research_path` | Path to the latest generated research artifact under `research/`. |
 | `implementation_notes_path` | OS-temp notes file containing decisions, deviations, blockers, and validation notes. |
+| `qa_video_path` | Absolute path to the reviewable QA end-to-end proof video recorded with `playwright-cli` for UI-applicable changes, when one was produced. |
 | `pr_report` | Pull-request report emitted only when `create_pr=true` and the final `pull-request` stage runs. |
 | `approved` | Whether the reviewer loop approved before completion or optional final handoff. |
 | `iterations_completed` | Number of research/orchestrate/review loops completed. |
@@ -313,6 +314,7 @@ Result fields:
 | `preview_file_url` | `file://` URL for the generated `preview.html` file. |
 | `spec_path` | Absolute path to the generated `spec.html` file. |
 | `spec_file_url` | `file://` URL for the generated `spec.html` file. |
+| `playwright_cli_status` | Outcome of the initial deterministic step that ensures the `playwright-cli` skill's `playwright-cli` command is installed. |
 `open-claude-design` has no `result` output; it exposes only the declared fields listed above. Use the declared `artifact` and `handoff` fields for generated content.
@@ -969,7 +971,7 @@ workflow({
 })
 ```
-Direct mode supports top-level/default options and per-task options such as `context`, `forkFromSessionFile`, `model`, `fallbackModels`, `thinkingLevel`, `tools`, `noTools`, `customTools`, `bashPolicy`, `mcp`, `output`, `outputMode`, `reads`, `worktree`, `gitWorktreeDir`, `baseBranch`, `maxOutput`, `artifacts`, `sessionDir`, `cwd`, and `agentDir`. Direct chains also support `chainName`, `chainDir`, and `failFast`.
+Direct mode supports top-level/default options and per-task options such as `context`, `forkFromSessionFile`, `model`, `fallbackModels`, `thinkingLevel`, `contextWindow`, `tools`, `noTools`, `customTools`, `bashPolicy`, `mcp`, `output`, `outputMode`, `reads`, `worktree`, `gitWorktreeDir`, `baseBranch`, `maxOutput`, `artifacts`, `sessionDir`, `cwd`, and `agentDir`. Direct chains also support `chainName`, `chainDir`, and `failFast`.
 For large fan-outs, prefer `outputMode: "file-only"` so the parent result contains compact file references instead of full output. Treat intercom payloads from async direct runs as user-visible workflow output.
@@ -1477,7 +1479,8 @@ Common task/stage options include:
 - `prompt` or `task`
 - `previous` for small handoff context; use artifact paths plus `reads` for large outputs, logs, research bundles, or reviewer payloads
 - `context: "fresh" | "fork"`, `forkFromSessionFile`
-- `model`, `fallbackModels`, `thinkingLevel`, `scopedModels`, `modelRegistry` — `model` and each `fallbackModels` entry accept a `model_name:thinking_effort` reasoning suffix; the standalone `thinkingLevel` is deprecated (see [Reasoning levels](#reasoning-levels))
+- `model`, `fallbackModels`, `thinkingLevel`, `scopedModels`, `modelRegistry` — `model` and each `fallbackModels` entry accept a `model_name:thinking_effort` reasoning suffix and an optional parenthesized context-window token such as `model (1m)` (see [Reasoning levels](#reasoning-levels) and [Context windows](#context-windows)); the standalone `thinkingLevel` is deprecated
+- `contextWindow`, `contextWindowStrict` — stage-wide context-window budget mapped to the SDK `createAgentSession` options of the same name (non-strict by default)
 - `tools`, `noTools`, `customTools`, `mcp: { allow?: string[], deny?: string[] }`, `bashPolicy`
 - `schema` for a structured final answer from this workflow item
 - `output`, `outputMode`, `reads`, `worktree`, `gitWorktreeDir`, `baseBranch`, `maxOutput`, `artifacts`, `sessionDir`, `cwd`, `agentDir`
@@ -1495,18 +1498,18 @@ await ctx.task("browser-preview", {
   bashPolicy: {
     default: "deny",
     allow: [
-      "which browse",
-      { prefix: "browse open " },
-      { prefix: "browse snapshot" },
+      "which playwright-cli",
+      { prefix: "playwright-cli open " },
+      { prefix: "playwright-cli snapshot" },
       { prefix: "grep " },
     ],
     deny: [{ regex: "\\brm\\b" }],
   },
-  prompt: "Open the preview with browse, then summarize the visible state.",
+  prompt: "Open the preview with playwright-cli, then summarize the visible state.",
 });
 ```
-A command such as `browse snapshot | grep title` passes only when both segments are allowed, and `browse snapshot\nrm -rf /tmp/proof` cannot be hidden behind a `{ prefix: "browse " }` rule because the newline starts a new segment. Glob rules match command strings rather than filesystem path segments: `*` and `?` may span `/`, so `{ glob: "browse *" }` matches URLs and slash-bearing paths such as `browse http://localhost:3000`, `browse docs/index.html`, and `browse ./preview/output.html` while still matching the whole target rather than `echo browse ...`; escaped bracket-class metacharacters such as `\-`, `\^`, `\]`, `\[`, and `\\` stay literal, while malformed glob ranges such as `{ glob: "echo [z-a]" }` become `invalid-policy` denials. Segment mode accepts literal heads such as `grep`, `./script`, `/usr/bin/env`, `bun`, and `browse`, and treats non-leading `>|` as redirection syntax so `echo ok >|/tmp/out` stays one segment, but conservatively rejects reserved or compound heads (`coproc`, `if`, `for`, `while`, `case`, `{`, `}`, `!`), leading redirections (`>file cmd`, `2>file cmd`, `<file cmd`, `&>file cmd`, `&>>file cmd`, `>|file cmd`, `<&0 cmd`, `>&2 cmd`), redirections attached to the command-head word (`cmd>file`, `cmd>>file`, `cmd>|file`, `cmd2>file`, `cmd>&2`, `cmd</tmp/in`), leading environment assignments (`PATH=/tmp:$PATH browse snapshot`, `LD_PRELOAD=/tmp/x browse snapshot`, `FOO=bar`), dynamic heads such as `$cmd`, `${cmd}`, `r''m`, `r\m`, `~/bin/rm`, `r*m`, `{rm,echo}`, `r$(printf m)`, or backtick-built command names. A single denied, redirection-prefixed, attached-redirection, assignment-prefixed, dynamic, or unrecognized segment blocks the whole command with a model-readable tool error and no UI prompt, so the behavior works in headless workflow runs. Use `match: "whole"` only when raw-command matching is intentional.
+A command such as `playwright-cli snapshot | grep title` passes only when both segments are allowed, and `playwright-cli snapshot\nrm -rf /tmp/proof` cannot be hidden behind a `{ prefix: "playwright-cli " }` rule because the newline starts a new segment. Glob rules match command strings rather than filesystem path segments: `*` and `?` may span `/`, so `{ glob: "playwright-cli *" }` matches URLs and slash-bearing paths such as `playwright-cli http://localhost:3000`, `playwright-cli docs/index.html`, and `playwright-cli ./preview/output.html` while still matching the whole target rather than `echo playwright-cli ...`; escaped bracket-class metacharacters such as `\-`, `\^`, `\]`, `\[`, and `\\` stay literal, while malformed glob ranges such as `{ glob: "echo [z-a]" }` become `invalid-policy` denials. Segment mode accepts literal heads such as `grep`, `./script`, `/usr/bin/env`, `bun`, and `playwright-cli`, and treats non-leading `>|` as redirection syntax so `echo ok >|/tmp/out` stays one segment, but conservatively rejects reserved or compound heads (`coproc`, `if`, `for`, `while`, `case`, `{`, `}`, `!`), leading redirections (`>file cmd`, `2>file cmd`, `<file cmd`, `&>file cmd`, `&>>file cmd`, `>|file cmd`, `<&0 cmd`, `>&2 cmd`), redirections attached to the command-head word (`cmd>file`, `cmd>>file`, `cmd>|file`, `cmd2>file`, `cmd>&2`, `cmd</tmp/in`), leading environment assignments (`PATH=/tmp:$PATH playwright-cli snapshot`, `LD_PRELOAD=/tmp/x playwright-cli snapshot`, `FOO=bar`), dynamic heads such as `$cmd`, `${cmd}`, `r''m`, `r\m`, `~/bin/rm`, `r*m`, `{rm,echo}`, `r$(printf m)`, or backtick-built command names. A single denied, redirection-prefixed, attached-redirection, assignment-prefixed, dynamic, or unrecognized segment blocks the whole command with a model-readable tool error and no UI prompt, so the behavior works in headless workflow runs. Use `match: "whole"` only when raw-command matching is intentional.
 `gitWorktreeDir` selects a reusable Git worktree root for `ctx.stage`, `ctx.task`, `ctx.chain`, and `ctx.parallel`. If the path is missing, Atomic creates it with `git worktree add --detach <path> <baseBranch>`; if it exists, it must be a same-repository worktree root. The default stage cwd becomes the matching cwd inside the worktree and preserves the invoking repo-relative subdirectory. Explicit `cwd` still wins; relative `cwd` values resolve from the worktree cwd, while absolute `cwd` values are used as provided. `gitWorktreeDir` is mutually exclusive with `worktree: true`: use `gitWorktreeDir` for named/reusable worktrees and `worktree: true` for temporary direct-mode worktrees that are cleaned up after the run.
@@ -1554,6 +1557,27 @@ The standalone `thinkingLevel` stage option is deprecated. It still applies as a
 This applies everywhere a stage accepts a model: direct `ctx.task`/`ctx.chain`/`ctx.parallel` options, `ctx.stage` options, builtin workflow stage definitions, and workflow parameters. `fallbackThinkingLevels` is an optional compatibility helper aligned by index to `fallbackModels`; it applies only to fallback entries that do not already carry a suffix. Each `WorkflowModelAttempt` reports the resolved model and the effective reasoning effort used for that attempt.
+### Context windows
+A `model`/`fallbackModels` entry may also request a context-window budget with a parenthesized size token in the model-name portion — placed *before* the optional `:reasoning` suffix so it never collides with the reasoning level. This mirrors GitHub Copilot's `Claude Opus 4.8 (1M context)` model-name convention:
+```ts
+await ctx.task("review", {
+  task: "Review the diff",
+  model: "anthropic/claude-fable-5:xhigh",
+  // The copilot opus fallback runs at its largest advertised (long-context) window.
+  fallbackModels: ["github-copilot/claude-opus-4.8 (1m):xhigh", "anthropic/claude-opus-4-8:xhigh"],
+});
+```
+The token accepts the same compact sizes as the `--context-window` flag (`1m`, `936k`, `400k`, or a raw token count) and is resolved against that specific candidate model's advertised windows:
+- an exact supported window is used as-is;
+- otherwise the largest supported window not exceeding the request is selected, so `(1m)` lands on a model's ~936K long-context tier;
+- when the model exposes no larger tier (or is unavailable), the request is dropped and the session keeps the model's default (short) window — a non-strict, automatic fallback.
+The budget applies only to the candidate that carries the token; other primary and fallback models in the same chain are unaffected. A parenthesized token that is not a valid size (for example `(preview)`) is left attached to the model id rather than being treated as a context window. For stage-wide selection you can instead set the `contextWindow` (and `contextWindowStrict`) stage option, which maps to the SDK `createAgentSession` options of the same name.
 ## Programmatic Usage
 `@bastani/workflows` is an Atomic package extension. It registers:

package/examples/extensions/custom-provider-anthropic/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "atomic-extension-custom-provider-anthropic",
-  "version": "0.79.4",
+  "version": "0.79.7",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "atomic-extension-custom-provider-anthropic",
-      "version": "0.79.4",
+      "version": "0.79.7",
       "dependencies": {
         "@anthropic-ai/sdk": "^0.52.0"
       }

package/examples/extensions/custom-provider-anthropic/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "atomic-extension-custom-provider-anthropic",
   "private": true,
-  "version": "0.79.4",
+  "version": "0.79.7",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/examples/extensions/custom-provider-gitlab-duo/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "atomic-extension-custom-provider-gitlab-duo",
   "private": true,
-  "version": "0.79.4",
+  "version": "0.79.7",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/examples/extensions/gondolin/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "atomic-extension-gondolin",
-  "version": "0.79.4",
+  "version": "0.79.7",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "atomic-extension-gondolin",
-      "version": "0.79.4",
+      "version": "0.79.7",
       "dependencies": {
         "@earendil-works/gondolin": "0.12.0"
       }

package/examples/extensions/gondolin/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
 	"name": "atomic-extension-gondolin",
 	"private": true,
-	"version": "0.79.4",
+	"version": "0.79.7",
 	"type": "module",
 	"scripts": {
 		"clean": "echo 'nothing to clean'",