npm - @iaforged/context-code - Versions diffs - 1.2.9 → 1.2.10 - Mend

@iaforged/context-code 1.2.9 → 1.2.10

This diff shows the changes between publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (172)

package/README.md +119 -119
package/context-bootstrap.js +26 -26
package/dist/src/QueryEngine.js +394 -327
package/dist/src/bridge/bridgeUI.js +1 -1
package/dist/src/buddy/prompt.js +4 -4
package/dist/src/cli/handlers/auth.js +126 -9
package/dist/src/cli/print.js +35 -1
package/dist/src/commands/agent/agent.js +28 -2
package/dist/src/commands/agent/agentStore.js +8 -1
package/dist/src/commands/agent/index.js +1 -1
package/dist/src/commands/bridge-kick.js +9 -9
package/dist/src/commands/commit.js +34 -34
package/dist/src/commands/init-verifiers.js +3 -3
package/dist/src/commands/init.js +88 -88
package/dist/src/commands/insights.js +787 -787
package/dist/src/commands/install.js +19 -19
package/dist/src/commands/login/login.js +21 -12
package/dist/src/commands/logout/logout.js +9 -0
package/dist/src/commands/model/model.js +9 -4
package/dist/src/commands/orchestrate/SwarmUI.js +50 -0
package/dist/src/commands/orchestrate/index.js +2 -2
package/dist/src/commands/orchestrate/orchestrate.js +708 -12
package/dist/src/commands/pr_comments/index.js +33 -33
package/dist/src/commands/profile/index.js +1 -1
package/dist/src/commands/profile/profile.js +52 -3
package/dist/src/commands/provider/index.js +1 -1
package/dist/src/commands/provider/provider.js +117 -45
package/dist/src/commands/resumen/index.js +9 -0
package/dist/src/commands/resumen/resumen.js +29 -0
package/dist/src/commands/security-review.js +190 -190
package/dist/src/commands/swarm-auto/index.js +9 -0
package/dist/src/commands/swarm-auto/swarmAuto.js +111 -0
package/dist/src/commands/swarm-init/index.js +9 -0
package/dist/src/commands/swarm-init/swarmInit.js +72 -0
package/dist/src/commands/team/team.js +39 -6
package/dist/src/commands.js +14 -0
package/dist/src/components/LogoV2/CondensedLogo.js +2 -2
package/dist/src/components/PromptInput/PromptInputQueuedCommands.js +3 -3
package/dist/src/components/agents/agentFileUtils.js +6 -6
package/dist/src/components/permissions/hooks.js +5 -5
package/dist/src/constants/outputStyles.js +83 -83
package/dist/src/core/agents/blueprints.js +58 -0
package/dist/src/core/agents/cliAdapter.js +61 -0
package/dist/src/core/agents/registry.js +93 -0
package/dist/src/core/agents/runtime.js +4 -0
package/dist/src/core/agents/runtime.smoke.js +42 -0
package/dist/src/core/agents/swarm.smoke.js +48 -0
package/dist/src/core/agents/swarmTools.js +38 -0
package/dist/src/core/auth/index.js +2 -0
package/dist/src/core/auth/loginCliAdapter.js +24 -0
package/dist/src/core/auth/loginCore.js +67 -0
package/dist/src/core/auth/logoutCliAdapter.js +34 -0
package/dist/src/core/auth/logoutCore.js +52 -0
package/dist/src/core/auth/preflight.smoke.js +151 -0
package/dist/src/core/index.js +21 -0
package/dist/src/core/mcp/blueprints.js +27 -0
package/dist/src/core/mcp/common.js +14 -0
package/dist/src/core/mcp/runtime.js +67 -0
package/dist/src/core/mcp/runtime.smoke.js +50 -0
package/dist/src/core/mcp/swarmClient.js +40 -0
package/dist/src/core/mcp/swarmSetup.js +43 -0
package/dist/src/core/providers/cliAdapter.js +39 -0
package/dist/src/core/providers/contracts.js +1 -0
package/dist/src/core/providers/index.js +3 -0
package/dist/src/core/providers/llmCore.js +123 -0
package/dist/src/core/providers/providerCore.js +141 -0
package/dist/src/core/providers/providerModelCompatibility.js +98 -0
package/dist/src/core/providers/providerParitySmoke.js +83 -0
package/dist/src/core/providers/providerProfileModelSmoke.js +80 -0
package/dist/src/core/query/contracts.js +1 -0
package/dist/src/core/query/runtime.js +117 -0
package/dist/src/core/query/runtime.smoke.js +39 -0
package/dist/src/core/query/timelineThinking.smoke.js +25 -0
package/dist/src/core/query/wiring.smoke.js +76 -0
package/dist/src/core/skills/cliAdapter.js +38 -0
package/dist/src/core/skills/index.js +52 -0
package/dist/src/core/skills/runtime.smoke.js +53 -0
package/dist/src/core/tasks/runtime.js +205 -0
package/dist/src/core/tasks/runtime.smoke.js +63 -0
package/dist/src/core/tasks/sdkAdapter.js +4 -0
package/dist/src/core/tools/contracts.js +3 -0
package/dist/src/core/tools/fileResolution.js +112 -0
package/dist/src/core/tools/fileResolution.smoke.js +33 -0
package/dist/src/core/tools/filesCore.js +51 -0
package/dist/src/core/tools/filesCore.smoke.js +108 -0
package/dist/src/core/tools/gitCore.js +20 -0
package/dist/src/core/tools/imageParity.smoke.js +36 -0
package/dist/src/core/tools/notebookParity.smoke.js +68 -0
package/dist/src/core/tools/registry.js +22 -0
package/dist/src/core/tools/runtime.smoke.js +32 -0
package/dist/src/core/tools/shellCore.js +60 -0
package/dist/src/core/types/agentContext.js +9 -0
package/dist/src/core/types/auth.js +3 -0
package/dist/src/core/types/command.js +13 -0
package/dist/src/core/types/provider.js +3 -0
package/dist/src/core/types/sdkEvent.js +10 -0
package/dist/src/core/types/swarm.js +1 -0
package/dist/src/cost-tracker.js +3 -3
package/dist/src/hooks/useAwaySummary.js +22 -9
package/dist/src/main.js +32 -2
package/dist/src/screens/REPL.js +9 -0
package/dist/src/services/AgentSummary/agentSummary.js +10 -10
package/dist/src/services/autoDream/autoDream.js +5 -5
package/dist/src/services/autoDream/consolidationPrompt.js +49 -49
package/dist/src/services/compact/prompt.js +238 -238
package/dist/src/services/limits/sessionCounter.js +17 -17
package/dist/src/services/mcp/client.js +27 -1
package/dist/src/services/orchestration/execution/AgentTaskExecutor.js +39 -20
package/dist/src/services/orchestration/execution/OrchestrationExecutionRuntime.js +65 -58
package/dist/src/skills/bundled/loop.js +57 -57
package/dist/src/skills/bundled/remember.js +53 -53
package/dist/src/skills/bundled/simplify.js +49 -49
package/dist/src/skills/bundled/skillify.js +2 -2
package/dist/src/state/onChangeAppState.js +6 -0
package/dist/src/tasks/LocalAgentTask/LocalAgentTask.js +5 -5
package/dist/src/tasks/LocalMainSessionTask.js +5 -5
package/dist/src/tasks/LocalShellTask/LocalShellTask.js +13 -13
package/dist/src/tools/AgentTool/forkSubagent.js +25 -25
package/dist/src/tools/AskUserQuestionTool/prompt.js +29 -29
package/dist/src/tools/BashTool/BashTool.js +27 -2
package/dist/src/tools/BriefTool/prompt.js +14 -14
package/dist/src/tools/EnterPlanModeTool/EnterPlanModeTool.js +12 -12
package/dist/src/tools/EnterPlanModeTool/prompt.js +140 -140
package/dist/src/tools/ExitPlanModeTool/ExitPlanModeV2Tool.js +18 -18
package/dist/src/tools/ExitPlanModeTool/prompt.js +23 -23
package/dist/src/tools/ExitWorktreeTool/prompt.js +29 -29
package/dist/src/tools/FileEditTool/prompt.js +7 -7
package/dist/src/tools/FileReadTool/FileReadTool.js +18 -1
package/dist/src/tools/FileWriteTool/prompt.js +6 -6
package/dist/src/tools/GlobTool/prompt.js +4 -4
package/dist/src/tools/GrepTool/prompt.js +10 -10
package/dist/src/tools/LSPTool/prompt.js +18 -18
package/dist/src/tools/ListMcpResourcesTool/prompt.js +15 -15
package/dist/src/tools/PowerShellTool/PowerShellTool.js +25 -2
package/dist/src/tools/ReadMcpResourceTool/prompt.js +13 -13
package/dist/src/tools/SendMessageTool/prompt.js +36 -36
package/dist/src/tools/SkillTool/prompt.js +21 -21
package/dist/src/tools/SleepTool/prompt.js +10 -10
package/dist/src/tools/TaskCreateTool/prompt.js +41 -41
package/dist/src/tools/TaskGetTool/prompt.js +21 -21
package/dist/src/tools/TaskListTool/prompt.js +30 -30
package/dist/src/tools/TaskOutputTool/TaskOutputTool.js +8 -8
package/dist/src/tools/TaskStopTool/prompt.js +5 -5
package/dist/src/tools/TaskUpdateTool/prompt.js +74 -74
package/dist/src/tools/TodoWriteTool/prompt.js +178 -178
package/dist/src/tools/ToolSearchTool/prompt.js +9 -9
package/dist/src/tools/WebFetchTool/WebFetchTool.js +9 -9
package/dist/src/tools/WebFetchTool/prompt.js +31 -31
package/dist/src/tools/WebSearchTool/prompt.js +26 -26
package/dist/src/utils/agentContext.js +2 -0
package/dist/src/utils/agenticSessionSearch.js +38 -38
package/dist/src/utils/config.js +2 -0
package/dist/src/utils/genericProcessUtils.js +21 -21
package/dist/src/utils/heapDumpService.js +4 -4
package/dist/src/utils/mcpValidation.js +2 -2
package/dist/src/utils/model/modelStrings.js +1 -1
package/dist/src/utils/model/providers.js +5 -0
package/dist/src/utils/orchestration/store/providerAgentStore.js +22 -22
package/dist/src/utils/orchestration/store/providerWorkspaceStore.js +10 -10
package/dist/src/utils/orchestration/store/runStore.js +68 -68
package/dist/src/utils/orchestration/store/teamStore.js +28 -28
package/dist/src/utils/permissions/permissionExplainer.js +6 -6
package/dist/src/utils/permissions/permissionsDb.js +43 -43
package/dist/src/utils/sdkEventQueue.js +2 -0
package/dist/src/utils/secureStorage/sqliteStorage.js +12 -12
package/dist/src/utils/standardMcp/common.js +15 -0
package/dist/src/utils/standardMcp/setup.js +52 -0
package/dist/src/utils/swarm/teammatePromptAddendum.js +10 -10
package/dist/src/utils/task/framework.js +6 -6
package/package.json +1 -1
package/dist/src/commands/usage/index.js +0 -7
package/dist/src/commands/usage/usage.js +0 -5

package/dist/src/skills/bundled/remember.js CHANGED Viewed

@@ -4,59 +4,59 @@ export function registerRememberSkill() {
     if (process.env.USER_TYPE !== 'ant') {
         return;
     }
-    const SKILL_PROMPT = `# Memory Review
-## Goal
-Review the user's memory landscape and produce a clear report of proposed changes, grouped by action type. Do NOT apply changes — present proposals for user approval.
-## Steps
-### 1. Gather all memory layers
-Read CLAUDE.md and CLAUDE.local.md from the project root (if they exist). Your auto-memory content is already in your system prompt — review it there. Note which team memory sections exist, if any.
-**Success criteria**: You have the contents of all memory layers and can compare them.
-### 2. Classify each auto-memory entry
-For each substantive entry in auto-memory, determine the best destination:
-| Destination | What belongs there | Examples |
-|---|---|---|
-| **CLAUDE.md** | Project conventions and instructions for Claude that all contributors should follow | "use bun not npm", "API routes use kebab-case", "test command is bun test", "prefer functional style" |
-| **CLAUDE.local.md** | Personal instructions for Claude specific to this user, not applicable to other contributors | "I prefer concise responses", "always explain trade-offs", "don't auto-commit", "run tests before committing" |
-| **Team memory** | Org-wide knowledge that applies across repositories (only if team memory is configured) | "deploy PRs go through #deploy-queue", "staging is at staging.internal", "platform team owns infra" |
-| **Stay in auto-memory** | Working notes, temporary context, or entries that don't clearly fit elsewhere | Session-specific observations, uncertain patterns |
-**Important distinctions:**
-- CLAUDE.md and CLAUDE.local.md contain instructions for Claude, not user preferences for external tools (editor theme, IDE keybindings, etc. don't belong in either)
-- Workflow practices (PR conventions, merge strategies, branch naming) are ambiguous — ask the user whether they're personal or team-wide
-- When unsure, ask rather than guess
-**Success criteria**: Each entry has a proposed destination or is flagged as ambiguous.
-### 3. Identify cleanup opportunities
-Scan across all layers for:
-- **Duplicates**: Auto-memory entries already captured in CLAUDE.md or CLAUDE.local.md → propose removing from auto-memory
-- **Outdated**: CLAUDE.md or CLAUDE.local.md entries contradicted by newer auto-memory entries → propose updating the older layer
-- **Conflicts**: Contradictions between any two layers → propose resolution, noting which is more recent
-**Success criteria**: All cross-layer issues identified.
-### 4. Present the report
-Output a structured report grouped by action type:
-1. **Promotions** — entries to move, with destination and rationale
-2. **Cleanup** — duplicates, outdated entries, conflicts to resolve
-3. **Ambiguous** — entries where you need the user's input on destination
-4. **No action needed** — brief note on entries that should stay put
-If auto-memory is empty, say so and offer to review CLAUDE.md for cleanup.
-**Success criteria**: User can review and approve/reject each proposal individually.
-## Rules
-- Present ALL proposals before making any changes
-- Do NOT modify files without explicit user approval
-- Do NOT create new files unless the target doesn't exist yet
-- Ask about ambiguous entries — don't guess
+    const SKILL_PROMPT = `# Memory Review
+## Goal
+Review the user's memory landscape and produce a clear report of proposed changes, grouped by action type. Do NOT apply changes — present proposals for user approval.
+## Steps
+### 1. Gather all memory layers
+Read CLAUDE.md and CLAUDE.local.md from the project root (if they exist). Your auto-memory content is already in your system prompt — review it there. Note which team memory sections exist, if any.
+**Success criteria**: You have the contents of all memory layers and can compare them.
+### 2. Classify each auto-memory entry
+For each substantive entry in auto-memory, determine the best destination:
+| Destination | What belongs there | Examples |
+|---|---|---|
+| **CLAUDE.md** | Project conventions and instructions for Claude that all contributors should follow | "use bun not npm", "API routes use kebab-case", "test command is bun test", "prefer functional style" |
+| **CLAUDE.local.md** | Personal instructions for Claude specific to this user, not applicable to other contributors | "I prefer concise responses", "always explain trade-offs", "don't auto-commit", "run tests before committing" |
+| **Team memory** | Org-wide knowledge that applies across repositories (only if team memory is configured) | "deploy PRs go through #deploy-queue", "staging is at staging.internal", "platform team owns infra" |
+| **Stay in auto-memory** | Working notes, temporary context, or entries that don't clearly fit elsewhere | Session-specific observations, uncertain patterns |
+**Important distinctions:**
+- CLAUDE.md and CLAUDE.local.md contain instructions for Claude, not user preferences for external tools (editor theme, IDE keybindings, etc. don't belong in either)
+- Workflow practices (PR conventions, merge strategies, branch naming) are ambiguous — ask the user whether they're personal or team-wide
+- When unsure, ask rather than guess
+**Success criteria**: Each entry has a proposed destination or is flagged as ambiguous.
+### 3. Identify cleanup opportunities
+Scan across all layers for:
+- **Duplicates**: Auto-memory entries already captured in CLAUDE.md or CLAUDE.local.md → propose removing from auto-memory
+- **Outdated**: CLAUDE.md or CLAUDE.local.md entries contradicted by newer auto-memory entries → propose updating the older layer
+- **Conflicts**: Contradictions between any two layers → propose resolution, noting which is more recent
+**Success criteria**: All cross-layer issues identified.
+### 4. Present the report
+Output a structured report grouped by action type:
+1. **Promotions** — entries to move, with destination and rationale
+2. **Cleanup** — duplicates, outdated entries, conflicts to resolve
+3. **Ambiguous** — entries where you need the user's input on destination
+4. **No action needed** — brief note on entries that should stay put
+If auto-memory is empty, say so and offer to review CLAUDE.md for cleanup.
+**Success criteria**: User can review and approve/reject each proposal individually.
+## Rules
+- Present ALL proposals before making any changes
+- Do NOT modify files without explicit user approval
+- Do NOT create new files unless the target doesn't exist yet
+- Ask about ambiguous entries — don't guess
 `;
     registerBundledSkill({
         name: 'remember',

package/dist/src/skills/bundled/simplify.js CHANGED Viewed

@@ -1,54 +1,54 @@
 import { AGENT_TOOL_NAME } from '../../tools/AgentTool/constants.js';
 import { registerBundledSkill } from '../bundledSkills.js';
-const SIMPLIFY_PROMPT = `# Simplify: Code Review and Cleanup
-Review all changed files for reuse, quality, and efficiency. Fix any issues found.
-## Phase 1: Identify Changes
-Run \`git diff\` (or \`git diff HEAD\` if there are staged changes) to see what changed. If there are no git changes, review the most recently modified files that the user mentioned or that you edited earlier in this conversation.
-## Phase 2: Launch Three Review Agents in Parallel
-Use the ${AGENT_TOOL_NAME} tool to launch all three agents concurrently in a single message. Pass each agent the full diff so it has the complete context.
-### Agent 1: Code Reuse Review
-For each change:
-1. **Search for existing utilities and helpers** that could replace newly written code. Look for similar patterns elsewhere in the codebase — common locations are utility directories, shared modules, and files adjacent to the changed ones.
-2. **Flag any new function that duplicates existing functionality.** Suggest the existing function to use instead.
-3. **Flag any inline logic that could use an existing utility** — hand-rolled string manipulation, manual path handling, custom environment checks, ad-hoc type guards, and similar patterns are common candidates.
-### Agent 2: Code Quality Review
-Review the same changes for hacky patterns:
-1. **Redundant state**: state that duplicates existing state, cached values that could be derived, observers/effects that could be direct calls
-2. **Parameter sprawl**: adding new parameters to a function instead of generalizing or restructuring existing ones
-3. **Copy-paste with slight variation**: near-duplicate code blocks that should be unified with a shared abstraction
-4. **Leaky abstractions**: exposing internal details that should be encapsulated, or breaking existing abstraction boundaries
-5. **Stringly-typed code**: using raw strings where constants, enums (string unions), or branded types already exist in the codebase
-6. **Unnecessary JSX nesting**: wrapper Boxes/elements that add no layout value — check if inner component props (flexShrink, alignItems, etc.) already provide the needed behavior
-7. **Unnecessary comments**: comments explaining WHAT the code does (well-named identifiers already do that), narrating the change, or referencing the task/caller — delete; keep only non-obvious WHY (hidden constraints, subtle invariants, workarounds)
-### Agent 3: Efficiency Review
-Review the same changes for efficiency:
-1. **Unnecessary work**: redundant computations, repeated file reads, duplicate network/API calls, N+1 patterns
-2. **Missed concurrency**: independent operations run sequentially when they could run in parallel
-3. **Hot-path bloat**: new blocking work added to startup or per-request/per-render hot paths
-4. **Recurring no-op updates**: state/store updates inside polling loops, intervals, or event handlers that fire unconditionally — add a change-detection guard so downstream consumers aren't notified when nothing changed. Also: if a wrapper function takes an updater/reducer callback, verify it honors same-reference returns (or whatever the "no change" signal is) — otherwise callers' early-return no-ops are silently defeated
-5. **Unnecessary existence checks**: pre-checking file/resource existence before operating (TOCTOU anti-pattern) — operate directly and handle the error
-6. **Memory**: unbounded data structures, missing cleanup, event listener leaks
-7. **Overly broad operations**: reading entire files when only a portion is needed, loading all items when filtering for one
-## Phase 3: Fix Issues
-Wait for all three agents to complete. Aggregate their findings and fix each issue directly. If a finding is a false positive or not worth addressing, note it and move on — do not argue with the finding, just skip it.
-When done, briefly summarize what was fixed (or confirm the code was already clean).
+const SIMPLIFY_PROMPT = `# Simplify: Code Review and Cleanup
+Review all changed files for reuse, quality, and efficiency. Fix any issues found.
+## Phase 1: Identify Changes
+Run \`git diff\` (or \`git diff HEAD\` if there are staged changes) to see what changed. If there are no git changes, review the most recently modified files that the user mentioned or that you edited earlier in this conversation.
+## Phase 2: Launch Three Review Agents in Parallel
+Use the ${AGENT_TOOL_NAME} tool to launch all three agents concurrently in a single message. Pass each agent the full diff so it has the complete context.
+### Agent 1: Code Reuse Review
+For each change:
+1. **Search for existing utilities and helpers** that could replace newly written code. Look for similar patterns elsewhere in the codebase — common locations are utility directories, shared modules, and files adjacent to the changed ones.
+2. **Flag any new function that duplicates existing functionality.** Suggest the existing function to use instead.
+3. **Flag any inline logic that could use an existing utility** — hand-rolled string manipulation, manual path handling, custom environment checks, ad-hoc type guards, and similar patterns are common candidates.
+### Agent 2: Code Quality Review
+Review the same changes for hacky patterns:
+1. **Redundant state**: state that duplicates existing state, cached values that could be derived, observers/effects that could be direct calls
+2. **Parameter sprawl**: adding new parameters to a function instead of generalizing or restructuring existing ones
+3. **Copy-paste with slight variation**: near-duplicate code blocks that should be unified with a shared abstraction
+4. **Leaky abstractions**: exposing internal details that should be encapsulated, or breaking existing abstraction boundaries
+5. **Stringly-typed code**: using raw strings where constants, enums (string unions), or branded types already exist in the codebase
+6. **Unnecessary JSX nesting**: wrapper Boxes/elements that add no layout value — check if inner component props (flexShrink, alignItems, etc.) already provide the needed behavior
+7. **Unnecessary comments**: comments explaining WHAT the code does (well-named identifiers already do that), narrating the change, or referencing the task/caller — delete; keep only non-obvious WHY (hidden constraints, subtle invariants, workarounds)
+### Agent 3: Efficiency Review
+Review the same changes for efficiency:
+1. **Unnecessary work**: redundant computations, repeated file reads, duplicate network/API calls, N+1 patterns
+2. **Missed concurrency**: independent operations run sequentially when they could run in parallel
+3. **Hot-path bloat**: new blocking work added to startup or per-request/per-render hot paths
+4. **Recurring no-op updates**: state/store updates inside polling loops, intervals, or event handlers that fire unconditionally — add a change-detection guard so downstream consumers aren't notified when nothing changed. Also: if a wrapper function takes an updater/reducer callback, verify it honors same-reference returns (or whatever the "no change" signal is) — otherwise callers' early-return no-ops are silently defeated
+5. **Unnecessary existence checks**: pre-checking file/resource existence before operating (TOCTOU anti-pattern) — operate directly and handle the error
+6. **Memory**: unbounded data structures, missing cleanup, event listener leaks
+7. **Overly broad operations**: reading entire files when only a portion is needed, loading all items when filtering for one
+## Phase 3: Fix Issues
+Wait for all three agents to complete. Aggregate their findings and fix each issue directly. If a finding is a false positive or not worth addressing, note it and move on — do not argue with the finding, just skip it.
+When done, briefly summarize what was fixed (or confirm the code was already clean).
 `;
 export function registerSimplifySkill() {
     registerBundledSkill({

package/dist/src/skills/bundled/skillify.js CHANGED Viewed

@@ -61,8 +61,8 @@ You will use the AskUserQuestion to understand what the user wants to automate.
 - If you think the skill will require arguments, suggest arguments based on what you observed. Make sure you understand what someone would need to provide.
 - If it's not clear, ask if this skill should run inline (in the current conversation) or forked (as a sub-agent with its own context). Forked is better for self-contained tasks that don't need mid-process user input; inline is better when the user wants to steer mid-process.
 - Ask where the skill should be saved. Suggest a default based on context (repo-specific workflows → repo, cross-repo personal workflows → user). Options:
-  - **This repo** (\`.context/skills/<name>/SKILL.md\`) — for workflows specific to this project
-  - **Personal** (\`~/.context/skills/<name>/SKILL.md\`) — follows you across all repos
+  - **This repo** (\`.context/skills/<name>/SKILL.md\`) — for workflows specific to this project
+  - **Personal** (\`~/.context/skills/<name>/SKILL.md\`) — follows you across all repos
 **Round 3: Breaking down each step**
 For each major step, if it's not glaringly obvious, ask:

package/dist/src/state/onChangeAppState.js CHANGED Viewed

@@ -129,4 +129,10 @@ export function onChangeAppState({ newState, oldState, }) {
             logError(toError(error));
         }
     }
+    // orchestrationActivity — notify session metadata changed so SDK/Desktop see it.
+    if (newState.orchestrationActivity !== oldState.orchestrationActivity) {
+        notifySessionMetadataChanged({
+            orchestration_activity: newState.orchestrationActivity ?? null,
+        });
+    }
 }

package/dist/src/tasks/LocalAgentTask/LocalAgentTask.js CHANGED Viewed

@@ -145,11 +145,11 @@ export function enqueueAgentNotification({ taskId, description, status, error, s
     const resultSection = finalMessage ? `\n<result>${finalMessage}</result>` : '';
     const usageSection = usage ? `\n<usage><total_tokens>${usage.totalTokens}</total_tokens><tool_uses>${usage.toolUses}</tool_uses><duration_ms>${usage.durationMs}</duration_ms></usage>` : '';
     const worktreeSection = worktreePath ? `\n<${WORKTREE_TAG}><${WORKTREE_PATH_TAG}>${worktreePath}</${WORKTREE_PATH_TAG}>${worktreeBranch ? `<${WORKTREE_BRANCH_TAG}>${worktreeBranch}</${WORKTREE_BRANCH_TAG}>` : ''}</${WORKTREE_TAG}>` : '';
-    const message = `<${TASK_NOTIFICATION_TAG}>
-<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
-<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
-<${STATUS_TAG}>${status}</${STATUS_TAG}>
-<${SUMMARY_TAG}>${summary}</${SUMMARY_TAG}>${resultSection}${usageSection}${worktreeSection}
+    const message = `<${TASK_NOTIFICATION_TAG}>
+<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
+<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
+<${STATUS_TAG}>${status}</${STATUS_TAG}>
+<${SUMMARY_TAG}>${summary}</${SUMMARY_TAG}>${resultSection}${usageSection}${worktreeSection}
 </${TASK_NOTIFICATION_TAG}>`;
     enqueuePendingNotification({
         value: message,

package/dist/src/tasks/LocalMainSessionTask.js CHANGED Viewed

@@ -169,11 +169,11 @@ function enqueueMainSessionNotification(taskId, description, status, setAppState
         ? `\n<${TOOL_USE_ID_TAG}>${toolUseId}</${TOOL_USE_ID_TAG}>`
         : '';
     const outputPath = getTaskOutputPath(taskId);
-    const message = `<${TASK_NOTIFICATION_TAG}>
-<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
-<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
-<${STATUS_TAG}>${status}</${STATUS_TAG}>
-<${SUMMARY_TAG}>${summary}</${SUMMARY_TAG}>
+    const message = `<${TASK_NOTIFICATION_TAG}>
+<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
+<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
+<${STATUS_TAG}>${status}</${STATUS_TAG}>
+<${SUMMARY_TAG}>${summary}</${SUMMARY_TAG}>
 </${TASK_NOTIFICATION_TAG}>`;
     enqueuePendingNotification({ value: message, mode: 'task-notification' });
 }

package/dist/src/tasks/LocalShellTask/LocalShellTask.js CHANGED Viewed

@@ -71,14 +71,14 @@ function startStallWatchdog(taskId, description, kind, toolUseId, agentId) {
                 // signal and an unknown value falls through to 'completed',
                 // falsely closing the task for SDK consumers. Statusless
                 // notifications are skipped by the SDK emitter (progress ping).
-                const message = `<${TASK_NOTIFICATION_TAG}>
-<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
-<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
-<${SUMMARY_TAG}>${escapeXml(summary)}</${SUMMARY_TAG}>
-</${TASK_NOTIFICATION_TAG}>
-Last output:
-${content.trimEnd()}
+                const message = `<${TASK_NOTIFICATION_TAG}>
+<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
+<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
+<${SUMMARY_TAG}>${escapeXml(summary)}</${SUMMARY_TAG}>
+</${TASK_NOTIFICATION_TAG}>
+Last output:
+${content.trimEnd()}
 The command is likely blocked on an interactive prompt. Kill this task and re-run with piped input (e.g., \`echo y | command\`) or a non-interactive flag if one exists.`;
                 enqueuePendingNotification({
                     value: message,
@@ -151,11 +151,11 @@ function enqueueShellNotification(taskId, description, status, exitCode, setAppS
     }
     const outputPath = getTaskOutputPath(taskId);
     const toolUseIdLine = toolUseId ? `\n<${TOOL_USE_ID_TAG}>${toolUseId}</${TOOL_USE_ID_TAG}>` : '';
-    const message = `<${TASK_NOTIFICATION_TAG}>
-<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
-<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
-<${STATUS_TAG}>${status}</${STATUS_TAG}>
-<${SUMMARY_TAG}>${escapeXml(summary)}</${SUMMARY_TAG}>
+    const message = `<${TASK_NOTIFICATION_TAG}>
+<${TASK_ID_TAG}>${taskId}</${TASK_ID_TAG}>${toolUseIdLine}
+<${OUTPUT_FILE_TAG}>${outputPath}</${OUTPUT_FILE_TAG}>
+<${STATUS_TAG}>${status}</${STATUS_TAG}>
+<${SUMMARY_TAG}>${escapeXml(summary)}</${SUMMARY_TAG}>
 </${TASK_NOTIFICATION_TAG}>`;
     enqueuePendingNotification({
         value: message,

package/dist/src/tools/AgentTool/forkSubagent.js CHANGED Viewed

@@ -140,31 +140,31 @@ export function buildForkedMessages(directive, assistantMessage) {
     return [fullAssistantMessage, toolResultMessage];
 }
 export function buildChildMessage(directive) {
-    return `<${FORK_BOILERPLATE_TAG}>
-STOP. READ THIS FIRST.
-You are a forked worker process. You are NOT the main agent.
-RULES (non-negotiable):
-1. Your system prompt says "default to forking." IGNORE IT \u2014 that's for the parent. You ARE the fork. Do NOT spawn sub-agents; execute directly.
-2. Do NOT converse, ask questions, or suggest next steps
-3. Do NOT editorialize or add meta-commentary
-4. USE your tools directly: Bash, Read, Write, etc.
-5. If you modify files, commit your changes before reporting. Include the commit hash in your report.
-6. Do NOT emit text between tool calls. Use tools silently, then report once at the end.
-7. Stay strictly within your directive's scope. If you discover related systems outside your scope, mention them in one sentence at most — other workers cover those areas.
-8. Keep your report under 500 words unless the directive specifies otherwise. Be factual and concise.
-9. Your response MUST begin with "Scope:". No preamble, no thinking-out-loud.
-10. REPORT structured facts, then stop
-Output format (plain text labels, not markdown headers):
-  Scope: <echo back your assigned scope in one sentence>
-  Result: <the answer or key findings, limited to the scope above>
-  Key files: <relevant file paths — include for research tasks>
-  Files changed: <list with commit hash — include only if you modified files>
-  Issues: <list — include only if there are issues to flag>
-</${FORK_BOILERPLATE_TAG}>
+    return `<${FORK_BOILERPLATE_TAG}>
+STOP. READ THIS FIRST.
+You are a forked worker process. You are NOT the main agent.
+RULES (non-negotiable):
+1. Your system prompt says "default to forking." IGNORE IT \u2014 that's for the parent. You ARE the fork. Do NOT spawn sub-agents; execute directly.
+2. Do NOT converse, ask questions, or suggest next steps
+3. Do NOT editorialize or add meta-commentary
+4. USE your tools directly: Bash, Read, Write, etc.
+5. If you modify files, commit your changes before reporting. Include the commit hash in your report.
+6. Do NOT emit text between tool calls. Use tools silently, then report once at the end.
+7. Stay strictly within your directive's scope. If you discover related systems outside your scope, mention them in one sentence at most — other workers cover those areas.
+8. Keep your report under 500 words unless the directive specifies otherwise. Be factual and concise.
+9. Your response MUST begin with "Scope:". No preamble, no thinking-out-loud.
+10. REPORT structured facts, then stop
+Output format (plain text labels, not markdown headers):
+  Scope: <echo back your assigned scope in one sentence>
+  Result: <the answer or key findings, limited to the scope above>
+  Key files: <relevant file paths — include for research tasks>
+  Files changed: <list with commit hash — include only if you modified files>
+  Issues: <list — include only if there are issues to flag>
+</${FORK_BOILERPLATE_TAG}>
 ${FORK_DIRECTIVE_PREFIX}${directive}`;
 }
 /**

package/dist/src/tools/AskUserQuestionTool/prompt.js CHANGED Viewed

@@ -3,36 +3,36 @@ export const ASK_USER_QUESTION_TOOL_NAME = 'AskUserQuestion';
 export const ASK_USER_QUESTION_TOOL_CHIP_WIDTH = 12;
 export const DESCRIPTION = 'Asks the user multiple choice questions to gather information, clarify ambiguity, understand preferences, make decisions or offer them choices.';
 export const PREVIEW_FEATURE_PROMPT = {
-    markdown: `
-Preview feature:
-Use the optional \`preview\` field on options when presenting concrete artifacts that users need to visually compare:
-- ASCII mockups of UI layouts or components
-- Code snippets showing different implementations
-- Diagram variations
-- Configuration examples
-Preview content is rendered as markdown in a monospace box. Multi-line text with newlines is supported. When any option has a preview, the UI switches to a side-by-side layout with a vertical option list on the left and preview on the right. Do not use previews for simple preference questions where labels and descriptions suffice. Note: previews are only supported for single-select questions (not multiSelect).
+    markdown: `
+Preview feature:
+Use the optional \`preview\` field on options when presenting concrete artifacts that users need to visually compare:
+- ASCII mockups of UI layouts or components
+- Code snippets showing different implementations
+- Diagram variations
+- Configuration examples
+Preview content is rendered as markdown in a monospace box. Multi-line text with newlines is supported. When any option has a preview, the UI switches to a side-by-side layout with a vertical option list on the left and preview on the right. Do not use previews for simple preference questions where labels and descriptions suffice. Note: previews are only supported for single-select questions (not multiSelect).
 `,
-    html: `
-Preview feature:
-Use the optional \`preview\` field on options when presenting concrete artifacts that users need to visually compare:
-- HTML mockups of UI layouts or components
-- Formatted code snippets showing different implementations
-- Visual comparisons or diagrams
-Preview content must be a self-contained HTML fragment (no <html>/<body> wrapper, no <script> or <style> tags — use inline style attributes instead). Do not use previews for simple preference questions where labels and descriptions suffice. Note: previews are only supported for single-select questions (not multiSelect).
+    html: `
+Preview feature:
+Use the optional \`preview\` field on options when presenting concrete artifacts that users need to visually compare:
+- HTML mockups of UI layouts or components
+- Formatted code snippets showing different implementations
+- Visual comparisons or diagrams
+Preview content must be a self-contained HTML fragment (no <html>/<body> wrapper, no <script> or <style> tags — use inline style attributes instead). Do not use previews for simple preference questions where labels and descriptions suffice. Note: previews are only supported for single-select questions (not multiSelect).
 `,
 };
-export const ASK_USER_QUESTION_TOOL_PROMPT = `Use this tool when you need to ask the user questions during execution. This allows you to:
-1. Gather user preferences or requirements
-2. Clarify ambiguous instructions
-3. Get decisions on implementation choices as you work
-4. Offer choices to the user about what direction to take.
-Usage notes:
-- Users will always be able to select "Other" to provide custom text input
-- Use multiSelect: true to allow multiple answers to be selected for a question
-- If you recommend a specific option, make that the first option in the list and add "(Recommended)" at the end of the label
-Plan mode note: In plan mode, use this tool to clarify requirements or choose between approaches BEFORE finalizing your plan. Do NOT use this tool to ask "Is my plan ready?" or "Should I proceed?" - use ${EXIT_PLAN_MODE_TOOL_NAME} for plan approval. IMPORTANT: Do not reference "the plan" in your questions (e.g., "Do you have feedback about the plan?", "Does the plan look good?") because the user cannot see the plan in the UI until you call ${EXIT_PLAN_MODE_TOOL_NAME}. If you need plan approval, use ${EXIT_PLAN_MODE_TOOL_NAME} instead.
+export const ASK_USER_QUESTION_TOOL_PROMPT = `Use this tool when you need to ask the user questions during execution. This allows you to:
+1. Gather user preferences or requirements
+2. Clarify ambiguous instructions
+3. Get decisions on implementation choices as you work
+4. Offer choices to the user about what direction to take.
+Usage notes:
+- Users will always be able to select "Other" to provide custom text input
+- Use multiSelect: true to allow multiple answers to be selected for a question
+- If you recommend a specific option, make that the first option in the list and add "(Recommended)" at the end of the label
+Plan mode note: In plan mode, use this tool to clarify requirements or choose between approaches BEFORE finalizing your plan. Do NOT use this tool to ask "Is my plan ready?" or "Should I proceed?" - use ${EXIT_PLAN_MODE_TOOL_NAME} for plan approval. IMPORTANT: Do not reference "the plan" in your questions (e.g., "Do you have feedback about the plan?", "Does the plan look good?") because the user cannot see the plan in the UI until you call ${EXIT_PLAN_MODE_TOOL_NAME}. If you need plan approval, use ${EXIT_PLAN_MODE_TOOL_NAME} instead.
 `;

package/dist/src/tools/BashTool/BashTool.js CHANGED Viewed

@@ -3,6 +3,8 @@ import { jsx as _jsx } from "react/jsx-runtime";
 import { copyFile, stat as fsStat, truncate as fsTruncate, link } from 'fs/promises';
 import { z } from 'zod/v4';
 import { getKairosActive } from '../../bootstrap/state.js';
+import { isCoreToolsEnabled } from '../../core/tools/contracts.js';
+import { startCoreShellCommand } from '../../core/tools/shellCore.js';
 import { TOOL_SUMMARY_MAX_LENGTH } from '../../constants/toolLimits.js';
 import { logEvent } from '../../services/analytics/index.js';
 import { notifyVscodeFileUpdated } from '../../services/mcp/vscodeSdkMcp.js';
@@ -759,7 +761,30 @@ async function* runShellCommand({ input, abortController, setAppState, setToolJS
     // Only enable for commands that are allowed to be auto-backgrounded
     // and when background tasks are not disabled
     const shouldAutoBackground = !isBackgroundTasksDisabled && isAutobackgroundingAllowed(command);
-    const shellCommand = await exec(command, abortController.signal, 'bash', {
+    const shellCommand = await (isCoreToolsEnabled() ? startCoreShellCommand({
+        command,
+        timeoutMs,
+        shellType: 'bash',
+        execOptions: {
+            onProgress(lastLines, allLines, totalLines, totalBytes, isIncomplete) {
+                lastProgressOutput = lastLines;
+                fullOutput = allLines;
+                lastTotalLines = totalLines;
+                lastTotalBytes = isIncomplete ? totalBytes : 0;
+                // Wake the generator so it yields the new progress data
+                const resolve = resolveProgress;
+                if (resolve) {
+                    resolveProgress = null;
+                    resolve();
+                }
+            },
+            preventCwdChanges,
+            shouldUseSandbox: shouldUseSandbox(input),
+            shouldAutoBackground
+        }
+    }, {
+        abortSignal: abortController.signal
+    }) : exec(command, abortController.signal, 'bash', {
         timeout: timeoutMs,
         onProgress(lastLines, allLines, totalLines, totalBytes, isIncomplete) {
             lastProgressOutput = lastLines;
@@ -776,7 +801,7 @@ async function* runShellCommand({ input, abortController, setAppState, setToolJS
         preventCwdChanges,
         shouldUseSandbox: shouldUseSandbox(input),
         shouldAutoBackground
-    });
+    }));
     // Start the command execution
     const resultPromise = shellCommand.result;
     // Helper to spawn a background task and return its ID

package/dist/src/tools/BriefTool/prompt.js CHANGED Viewed

@@ -1,19 +1,19 @@
 export const BRIEF_TOOL_NAME = 'SendUserMessage';
 export const LEGACY_BRIEF_TOOL_NAME = 'Brief';
 export const DESCRIPTION = 'Send a message to the user';
-export const BRIEF_TOOL_PROMPT = `Send a message the user will read. Text outside this tool is visible in the detail view, but most won't open it — the answer lives here.
-\`message\` supports markdown. \`attachments\` takes file paths (absolute or cwd-relative) for images, diffs, logs.
+export const BRIEF_TOOL_PROMPT = `Send a message the user will read. Text outside this tool is visible in the detail view, but most won't open it — the answer lives here.
+\`message\` supports markdown. \`attachments\` takes file paths (absolute or cwd-relative) for images, diffs, logs.
 \`status\` labels intent: 'normal' when replying to what they just asked; 'proactive' when you're initiating — a scheduled task finished, a blocker surfaced during background work, you need input on something they haven't asked about. Set it honestly; downstream routing uses it.`;
-export const BRIEF_PROACTIVE_SECTION = `## Talking to the user
-${BRIEF_TOOL_NAME} is where your replies go. Text outside it is visible if the user expands the detail view, but most won't — assume unread. Anything you want them to actually see goes through ${BRIEF_TOOL_NAME}. The failure mode: the real answer lives in plain text while ${BRIEF_TOOL_NAME} just says "done!" — they see "done!" and miss everything.
-So: every time the user says something, the reply they actually read comes through ${BRIEF_TOOL_NAME}. Even for "hi". Even for "thanks".
-If you can answer right away, send the answer. If you need to go look — run a command, read files, check something — ack first in one line ("On it — checking the test output"), then work, then send the result. Without the ack they're staring at a spinner.
-For longer work: ack → work → result. Between those, send a checkpoint when something useful happened — a decision you made, a surprise you hit, a phase boundary. Skip the filler ("running tests...") — a checkpoint earns its place by carrying information.
+export const BRIEF_PROACTIVE_SECTION = `## Talking to the user
+${BRIEF_TOOL_NAME} is where your replies go. Text outside it is visible if the user expands the detail view, but most won't — assume unread. Anything you want them to actually see goes through ${BRIEF_TOOL_NAME}. The failure mode: the real answer lives in plain text while ${BRIEF_TOOL_NAME} just says "done!" — they see "done!" and miss everything.
+So: every time the user says something, the reply they actually read comes through ${BRIEF_TOOL_NAME}. Even for "hi". Even for "thanks".
+If you can answer right away, send the answer. If you need to go look — run a command, read files, check something — ack first in one line ("On it — checking the test output"), then work, then send the result. Without the ack they're staring at a spinner.
+For longer work: ack → work → result. Between those, send a checkpoint when something useful happened — a decision you made, a surprise you hit, a phase boundary. Skip the filler ("running tests...") — a checkpoint earns its place by carrying information.
 Keep messages tight — the decision, the file:line, the PR number. Second person always ("your config"), never third.`;

package/dist/src/tools/EnterPlanModeTool/EnterPlanModeTool.js CHANGED Viewed

@@ -75,19 +75,19 @@ export const EnterPlanModeTool = buildTool({
     },
     mapToolResultToToolResultBlockParam({ message }, toolUseID) {
         const instructions = isPlanModeInterviewPhaseEnabled()
-            ? `${message}
+            ? `${message}
 DO NOT write or edit any files except the plan file. Detailed workflow instructions will follow.`
-            : `${message}
-In plan mode, you should:
-1. Thoroughly explore the codebase to understand existing patterns
-2. Identify similar features and architectural approaches
-3. Consider multiple approaches and their trade-offs
-4. Use AskUserQuestion if you need to clarify the approach
-5. Design a concrete implementation strategy
-6. When ready, use ExitPlanMode to present your plan for approval
+            : `${message}
+In plan mode, you should:
+1. Thoroughly explore the codebase to understand existing patterns
+2. Identify similar features and architectural approaches
+3. Consider multiple approaches and their trade-offs
+4. Use AskUserQuestion if you need to clarify the approach
+5. Design a concrete implementation strategy
+6. When ready, use ExitPlanMode to present your plan for approval
 Remember: DO NOT write or edit any files yet. This is a read-only exploration and planning phase.`;
         return {
             type: 'tool_result',