npm - @vellumai/assistant - Versions diffs - 0.4.46 → 0.4.49 - Mend

@vellumai/assistant 0.4.46 → 0.4.49

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the respective public registry.

Files changed (382)

package/ARCHITECTURE.md +7 -7
package/README.md +2 -23
package/docs/architecture/integrations.md +45 -41
package/docs/architecture/keychain-broker.md +3 -3
package/docs/architecture/security.md +5 -5
package/docs/runbook-trusted-contacts.md +3 -8
package/hook-templates/debug-prompt-logger/hook.json +1 -1
package/hook-templates/debug-prompt-logger/run.sh +1 -3
package/package.json +1 -1
package/src/__tests__/actor-token-service.test.ts +0 -1
package/src/__tests__/anthropic-provider.test.ts +156 -0
package/src/__tests__/approval-cascade.test.ts +810 -0
package/src/__tests__/approval-primitive.test.ts +0 -1
package/src/__tests__/approval-routes-http.test.ts +2 -0
package/src/__tests__/assistant-attachments.test.ts +12 -34
package/src/__tests__/assistant-feature-flag-guardrails.test.ts +76 -0
package/src/__tests__/assistant-feature-flags-integration.test.ts +0 -1
package/src/__tests__/browser-fill-credential.test.ts +5 -2
package/src/__tests__/browser-skill-baseline-tool-payload.test.ts +2 -2
package/src/__tests__/bundled-skill-retrieval-guard.test.ts +2 -1
package/src/__tests__/channel-guardian.test.ts +0 -2
package/src/__tests__/channel-readiness-routes.test.ts +35 -25
package/src/__tests__/channel-readiness-service.test.ts +10 -9
package/src/__tests__/checker.test.ts +9 -29
package/src/__tests__/cli.test.ts +23 -0
package/src/__tests__/computer-use-skill-manifest-regression.test.ts +1 -1
package/src/__tests__/computer-use-tools.test.ts +2 -19
package/src/__tests__/config-watcher.test.ts +0 -1
package/src/__tests__/confirmation-request-guardian-bridge.test.ts +0 -1
package/src/__tests__/context-image-dimensions.test.ts +332 -0
package/src/__tests__/context-token-estimator.test.ts +196 -13
package/src/__tests__/conversation-attention-store.test.ts +0 -1
package/src/__tests__/conversation-attention-telegram.test.ts +0 -1
package/src/__tests__/conversation-routes-guardian-reply.test.ts +144 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +1 -0
package/src/__tests__/credential-broker-browser-fill.test.ts +23 -22
package/src/__tests__/credential-broker-server-use.test.ts +22 -21
package/src/__tests__/credential-broker.test.ts +2 -1
package/src/__tests__/credential-metadata-store.test.ts +239 -26
package/src/__tests__/credential-resolve.test.ts +5 -4
package/src/__tests__/credential-security-e2e.test.ts +8 -8
package/src/__tests__/credential-security-invariants.test.ts +111 -7
package/src/__tests__/credential-vault-unit.test.ts +287 -54
package/src/__tests__/credential-vault.test.ts +406 -12
package/src/__tests__/credentials-cli.test.ts +82 -6
package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +0 -1
package/src/__tests__/ephemeral-permissions.test.ts +3 -3
package/src/__tests__/gateway-only-enforcement.test.ts +4 -2
package/src/__tests__/gateway-only-guard.test.ts +0 -1
package/src/__tests__/gemini-image-service.test.ts +75 -45
package/src/__tests__/gemini-provider.test.ts +9 -6
package/src/__tests__/guardian-action-conversation-turn.test.ts +1 -33
package/src/__tests__/guardian-action-copy-generator.test.ts +0 -20
package/src/__tests__/guardian-action-followup-executor.test.ts +1 -28
package/src/__tests__/guardian-action-followup-store.test.ts +1 -1
package/src/__tests__/guardian-action-grant-mint-consume.test.ts +0 -1
package/src/__tests__/guardian-decision-primitive-canonical.test.ts +0 -1
package/src/__tests__/guardian-grant-minting.test.ts +35 -0
package/src/__tests__/guardian-routing-invariants.test.ts +0 -1
package/src/__tests__/guardian-verification-voice-binding.test.ts +0 -1
package/src/__tests__/handlers-user-message-approval-consumption.test.ts +0 -39
package/src/__tests__/heartbeat-service.test.ts +0 -1
package/src/__tests__/host-cu-proxy.test.ts +629 -0
package/src/__tests__/host-shell-tool.test.ts +27 -15
package/src/__tests__/http-user-message-parity.test.ts +1 -0
package/src/__tests__/ingress-url-consistency.test.ts +14 -21
package/src/__tests__/integration-status.test.ts +38 -25
package/src/__tests__/intent-routing.test.ts +0 -1
package/src/__tests__/invite-routes-http.test.ts +10 -9
package/src/__tests__/keychain-broker-client.test.ts +11 -43
package/src/__tests__/managed-proxy-context.test.ts +5 -3
package/src/__tests__/media-generate-image.test.ts +63 -2
package/src/__tests__/media-reuse-story.e2e.test.ts +7 -3
package/src/__tests__/messaging-send-tool.test.ts +4 -6
package/src/__tests__/notification-routing-intent.test.ts +0 -1
package/src/__tests__/oauth-cli.test.ts +373 -14
package/src/__tests__/oauth-provider-profiles.test.ts +9 -9
package/src/__tests__/oauth-scope-policy.test.ts +4 -6
package/src/__tests__/oauth-store.test.ts +756 -0
package/src/__tests__/onboarding-starter-tasks.test.ts +0 -1
package/src/__tests__/provider-error-scenarios.test.ts +0 -1
package/src/__tests__/provider-fail-open-selection.test.ts +3 -1
package/src/__tests__/provider-managed-proxy-integration.test.ts +70 -6
package/src/__tests__/provider-streaming.benchmark.test.ts +0 -1
package/src/__tests__/public-ingress-urls.test.ts +15 -21
package/src/__tests__/recording-handler.test.ts +3 -4
package/src/__tests__/registry.test.ts +2 -2
package/src/__tests__/runtime-events-sse.test.ts +55 -7
package/src/__tests__/schedule-store.test.ts +0 -1
package/src/__tests__/scheduler-recurrence.test.ts +0 -1
package/src/__tests__/schema-transforms.test.ts +226 -0
package/src/__tests__/scoped-approval-grants.test.ts +0 -1
package/src/__tests__/scoped-grant-security-matrix.test.ts +0 -1
package/src/__tests__/script-proxy-injection-runtime.test.ts +23 -13
package/src/__tests__/script-proxy-policy-runtime.test.ts +1 -1
package/src/__tests__/script-proxy-session-manager.test.ts +1 -1
package/src/__tests__/secret-ingress-handler.test.ts +0 -1
package/src/__tests__/secret-onetime-send.test.ts +5 -3
package/src/__tests__/send-endpoint-busy.test.ts +21 -6
package/src/__tests__/sequence-store.test.ts +0 -1
package/src/__tests__/session-init.benchmark.test.ts +4 -5
package/src/__tests__/session-messaging-secret-redirect.test.ts +5 -4
package/src/__tests__/skill-include-graph.test.ts +66 -0
package/src/__tests__/skill-load-feature-flag.test.ts +0 -1
package/src/__tests__/skill-load-tool.test.ts +149 -1
package/src/__tests__/skill-projection-feature-flag.test.ts +0 -1
package/src/__tests__/skills-uninstall.test.ts +3 -3
package/src/__tests__/skills.test.ts +3 -12
package/src/__tests__/slack-channel-config.test.ts +76 -11
package/src/__tests__/slack-share-routes.test.ts +17 -14
package/src/__tests__/system-prompt.test.ts +0 -1
package/src/__tests__/telegram-bot-username-resolution.test.ts +3 -0
package/src/__tests__/telegram-invite-adapter.test.ts +18 -22
package/src/__tests__/terminal-tools.test.ts +4 -3
package/src/__tests__/test-support/computer-use-skill-harness.ts +3 -2
package/src/__tests__/tool-approval-handler.test.ts +0 -1
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +0 -1
package/src/__tests__/tool-executor-lifecycle-events.test.ts +0 -1
package/src/__tests__/tool-executor-shell-integration.test.ts +0 -1
package/src/__tests__/tool-executor.test.ts +0 -1
package/src/__tests__/tool-grant-request-escalation.test.ts +0 -1
package/src/__tests__/trust-store-pattern-matches.test.ts +29 -0
package/src/__tests__/trust-store.test.ts +1 -22
package/src/__tests__/trusted-contact-approval-notifier.test.ts +0 -1
package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +0 -1
package/src/__tests__/twilio-config.test.ts +2 -1
package/src/__tests__/twilio-provider.test.ts +4 -2
package/src/__tests__/twilio-routes.test.ts +5 -20
package/src/__tests__/verification-control-plane-policy.test.ts +0 -1
package/src/__tests__/voice-scoped-grant-consumer.test.ts +0 -1
package/src/agent/ax-tree-compaction.test.ts +235 -0
package/src/agent/loop.ts +76 -130
package/src/calls/call-domain.ts +8 -10
package/src/calls/relay-server.ts +9 -13
package/src/calls/twilio-config.ts +4 -8
package/src/calls/twilio-provider.ts +2 -1
package/src/calls/twilio-rest.ts +2 -1
package/src/calls/twilio-routes.ts +1 -2
package/src/calls/voice-ingress-preflight.ts +1 -1
package/src/cli/commands/browser-relay.ts +46 -15
package/src/cli/commands/completions.ts +0 -3
package/src/cli/commands/credentials.ts +110 -23
package/src/cli/commands/oauth/apps.ts +255 -0
package/src/cli/commands/oauth/connections.ts +299 -0
package/src/cli/commands/oauth/index.ts +52 -0
package/src/cli/commands/oauth/providers.ts +242 -0
package/src/cli/commands/skills.ts +4 -338
package/src/cli/program.ts +1 -5
package/src/cli/reference.ts +1 -3
package/src/cli.ts +3 -2
package/src/config/assistant-feature-flags.ts +0 -3
package/src/config/bundled-skills/_shared/CLI_RETRIEVAL_PATTERN.md +1 -1
package/src/config/bundled-skills/claude-code/TOOLS.json +0 -4
package/src/config/bundled-skills/computer-use/SKILL.md +3 -6
package/src/config/bundled-skills/computer-use/TOOLS.json +22 -4
package/src/config/bundled-skills/contacts/tools/google-contacts.ts +29 -32
package/src/config/bundled-skills/gmail/SKILL.md +4 -4
package/src/config/bundled-skills/gmail/tools/gmail-archive.ts +54 -61
package/src/config/bundled-skills/gmail/tools/gmail-attachments.ts +25 -28
package/src/config/bundled-skills/gmail/tools/gmail-draft.ts +14 -17
package/src/config/bundled-skills/gmail/tools/gmail-filters.ts +39 -44
package/src/config/bundled-skills/gmail/tools/gmail-follow-up.ts +61 -58
package/src/config/bundled-skills/gmail/tools/gmail-forward.ts +50 -49
package/src/config/bundled-skills/gmail/tools/gmail-label.ts +11 -13
package/src/config/bundled-skills/gmail/tools/gmail-outreach-scan.ts +148 -146
package/src/config/bundled-skills/gmail/tools/gmail-send-draft.ts +4 -7
package/src/config/bundled-skills/gmail/tools/gmail-sender-digest.ts +175 -173
package/src/config/bundled-skills/gmail/tools/gmail-trash.ts +4 -7
package/src/config/bundled-skills/gmail/tools/gmail-unsubscribe.ts +71 -76
package/src/config/bundled-skills/gmail/tools/gmail-vacation.ts +32 -38
package/src/config/bundled-skills/google-calendar/SKILL.md +2 -2
package/src/config/bundled-skills/google-calendar/calendar-client.ts +90 -44
package/src/config/bundled-skills/google-calendar/tools/calendar-check-availability.ts +9 -10
package/src/config/bundled-skills/google-calendar/tools/calendar-create-event.ts +5 -6
package/src/config/bundled-skills/google-calendar/tools/calendar-get-event.ts +4 -5
package/src/config/bundled-skills/google-calendar/tools/calendar-list-events.ts +14 -15
package/src/config/bundled-skills/google-calendar/tools/calendar-rsvp.ts +37 -37
package/src/config/bundled-skills/google-calendar/tools/shared.ts +4 -9
package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +24 -3
package/src/config/bundled-skills/messaging/SKILL.md +6 -6
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +62 -63
package/src/config/bundled-skills/messaging/tools/messaging-archive-by-sender.ts +15 -16
package/src/config/bundled-skills/messaging/tools/messaging-auth-test.ts +4 -5
package/src/config/bundled-skills/messaging/tools/messaging-list-conversations.ts +6 -7
package/src/config/bundled-skills/messaging/tools/messaging-mark-read.ts +4 -5
package/src/config/bundled-skills/messaging/tools/messaging-read.ts +14 -15
package/src/config/bundled-skills/messaging/tools/messaging-search.ts +4 -5
package/src/config/bundled-skills/messaging/tools/messaging-send.ts +128 -128
package/src/config/bundled-skills/messaging/tools/messaging-sender-digest.ts +33 -34
package/src/config/bundled-skills/messaging/tools/shared.ts +12 -15
package/src/config/bundled-skills/settings/SKILL.md +1 -1
package/src/config/bundled-skills/settings/TOOLS.json +2 -8
package/src/config/bundled-skills/settings/tools/voice-config-update.ts +5 -33
package/src/config/bundled-skills/slack/tools/shared.ts +4 -10
package/src/config/bundled-skills/slack/tools/slack-add-reaction.ts +4 -5
package/src/config/bundled-skills/slack/tools/slack-channel-details.ts +15 -16
package/src/config/bundled-skills/slack/tools/slack-delete-message.ts +4 -5
package/src/config/bundled-skills/slack/tools/slack-edit-message.ts +4 -5
package/src/config/bundled-skills/slack/tools/slack-leave-channel.ts +4 -5
package/src/config/bundled-skills/slack/tools/slack-scan-digest.ts +95 -92
package/src/config/env-registry.ts +14 -83
package/src/config/env.ts +11 -50
package/src/config/feature-flag-registry.json +16 -16
package/src/config/schema.ts +3 -1
package/src/config/skills.ts +21 -2
package/src/context/image-dimensions.ts +229 -0
package/src/context/token-estimator.ts +75 -12
package/src/context/window-manager.ts +49 -10
package/src/daemon/assistant-attachments.ts +1 -13
package/src/daemon/guardian-action-generators.ts +4 -5
package/src/daemon/handlers/config-ingress.ts +8 -33
package/src/daemon/handlers/config-slack-channel.ts +76 -56
package/src/daemon/handlers/config-telegram.ts +53 -24
package/src/daemon/handlers/sessions.ts +10 -24
package/src/daemon/handlers/shared.ts +0 -130
package/src/daemon/host-cu-proxy.ts +401 -0
package/src/daemon/lifecycle.ts +39 -63
package/src/daemon/message-protocol.ts +3 -0
package/src/daemon/message-types/computer-use.ts +2 -119
package/src/daemon/message-types/host-cu.ts +19 -0
package/src/daemon/message-types/integrations.ts +1 -0
package/src/daemon/message-types/messages.ts +3 -0
package/src/daemon/server.ts +14 -21
package/src/daemon/session-agent-loop-handlers.ts +2 -0
package/src/daemon/session-attachments.ts +1 -2
package/src/daemon/session-messaging.ts +3 -1
package/src/daemon/session-slash.ts +1 -1
package/src/daemon/session-surfaces.ts +40 -28
package/src/daemon/session-tool-setup.ts +20 -11
package/src/daemon/session.ts +139 -16
package/src/daemon/tool-side-effects.ts +2 -8
package/src/daemon/watch-handler.ts +2 -2
package/src/email/providers/index.ts +2 -1
package/src/events/tool-metrics-listener.ts +2 -2
package/src/hooks/manager.ts +1 -4
package/src/inbound/public-ingress-urls.ts +7 -7
package/src/instrument.ts +15 -1
package/src/logfire.ts +16 -5
package/src/media/app-icon-generator.ts +30 -4
package/src/media/avatar-router.ts +26 -3
package/src/media/gemini-image-service.ts +28 -2
package/src/memory/conversation-key-store.ts +21 -0
package/src/memory/db-init.ts +4 -0
package/src/memory/guardian-action-store.ts +1 -1
package/src/memory/migrations/149-oauth-tables.ts +60 -0
package/src/memory/migrations/index.ts +1 -0
package/src/memory/schema/guardian.ts +1 -1
package/src/memory/schema/index.ts +1 -0
package/src/memory/schema/oauth.ts +65 -0
package/src/messaging/provider.ts +19 -13
package/src/messaging/providers/gmail/adapter.ts +40 -23
package/src/messaging/providers/gmail/client.ts +283 -122
package/src/messaging/providers/gmail/people-client.ts +32 -24
package/src/messaging/providers/slack/adapter.ts +29 -19
package/src/messaging/providers/slack/client.ts +265 -78
package/src/messaging/providers/telegram-bot/adapter.ts +19 -18
package/src/messaging/providers/whatsapp/adapter.ts +17 -11
package/src/messaging/registry.ts +2 -31
package/src/notifications/copy-composer.ts +0 -5
package/src/notifications/signal.ts +4 -5
package/src/oauth/byo-connection.test.ts +537 -0
package/src/oauth/byo-connection.ts +128 -0
package/src/oauth/connect-orchestrator.ts +139 -56
package/src/oauth/connect-types.ts +17 -23
package/src/oauth/connection-resolver.ts +58 -0
package/src/oauth/connection.ts +38 -0
package/src/oauth/manual-token-connection.ts +104 -0
package/src/oauth/oauth-store.ts +496 -0
package/src/oauth/platform-connection.test.ts +192 -0
package/src/oauth/platform-connection.ts +111 -0
package/src/oauth/provider-behaviors.ts +124 -0
package/src/oauth/scope-policy.ts +9 -2
package/src/oauth/seed-providers.ts +161 -0
package/src/oauth/token-persistence.ts +74 -78
package/src/permissions/checker.ts +8 -4
package/src/permissions/defaults.ts +0 -1
package/src/permissions/prompter.ts +10 -1
package/src/permissions/trust-store.ts +13 -0
package/src/prompts/__tests__/build-cli-reference-section.test.ts +3 -1
package/src/prompts/system-prompt.ts +70 -45
package/src/providers/anthropic/client.ts +133 -24
package/src/providers/gemini/client.ts +15 -6
package/src/providers/managed-proxy/constants.ts +2 -2
package/src/providers/managed-proxy/context.ts +5 -1
package/src/providers/ratelimit.ts +17 -0
package/src/providers/registry.ts +2 -2
package/src/providers/retry.ts +1 -27
package/src/runtime/AGENTS.md +17 -0
package/src/runtime/auth/route-policy.ts +0 -3
package/src/runtime/channel-invite-transports/telegram.ts +2 -1
package/src/runtime/channel-readiness-service.ts +168 -195
package/src/runtime/channel-readiness-types.ts +4 -0
package/src/runtime/channel-reply-delivery.ts +0 -40
package/src/runtime/gateway-client.ts +0 -7
package/src/runtime/guardian-action-conversation-turn.ts +1 -3
package/src/runtime/guardian-action-followup-executor.ts +1 -1
package/src/runtime/guardian-action-message-composer.ts +3 -23
package/src/runtime/http-server.ts +17 -10
package/src/runtime/http-types.ts +2 -3
package/src/runtime/middleware/rate-limiter.ts +74 -20
package/src/runtime/middleware/twilio-validation.ts +1 -11
package/src/runtime/pending-interactions.ts +14 -12
package/src/runtime/routes/channel-delivery-routes.ts +0 -1
package/src/runtime/routes/channel-readiness-routes.ts +2 -0
package/src/runtime/routes/conversation-routes.ts +73 -19
package/src/runtime/routes/diagnostics-routes.ts +11 -9
package/src/runtime/routes/events-routes.ts +21 -11
package/src/runtime/routes/guardian-approval-interception.ts +20 -5
package/src/runtime/routes/host-cu-routes.ts +97 -0
package/src/runtime/routes/inbound-stages/background-dispatch.ts +12 -111
package/src/runtime/routes/integrations/slack/share.ts +6 -6
package/src/runtime/routes/integrations/twilio.ts +6 -5
package/src/runtime/routes/log-export-routes.ts +126 -8
package/src/runtime/routes/secret-routes.ts +3 -2
package/src/runtime/routes/settings-routes.ts +113 -48
package/src/runtime/routes/surface-action-routes.ts +1 -1
package/src/runtime/routes/watch-routes.ts +128 -0
package/src/schedule/integration-status.ts +10 -8
package/src/security/credential-key.ts +14 -0
package/src/security/keychain-broker-client.ts +5 -6
package/src/security/oauth2.ts +1 -1
package/src/security/token-manager.ts +145 -43
package/src/skills/catalog-install.ts +358 -0
package/src/skills/include-graph.ts +32 -0
package/src/telegram/bot-username.ts +2 -3
package/src/tools/apps/definitions.ts +0 -5
package/src/tools/assets/materialize.ts +0 -5
package/src/tools/assets/search.ts +0 -5
package/src/tools/browser/headless-browser.ts +1 -67
package/src/tools/browser/network-recorder.ts +1 -1
package/src/tools/browser/network-recording-types.ts +1 -1
package/src/tools/claude-code/claude-code.ts +0 -5
package/src/tools/computer-use/definitions.ts +46 -11
package/src/tools/computer-use/registry.ts +4 -5
package/src/tools/credentials/broker.ts +5 -4
package/src/tools/credentials/metadata-store.ts +22 -74
package/src/tools/credentials/resolve.ts +2 -1
package/src/tools/credentials/vault.ts +139 -151
package/src/tools/filesystem/edit.ts +1 -6
package/src/tools/filesystem/read.ts +0 -5
package/src/tools/filesystem/write.ts +1 -6
package/src/tools/host-filesystem/edit.ts +1 -6
package/src/tools/host-filesystem/read.ts +1 -6
package/src/tools/host-filesystem/write.ts +1 -6
package/src/tools/mcp/mcp-tool-factory.ts +18 -1
package/src/tools/memory/definitions.ts +0 -5
package/src/tools/network/web-fetch.ts +0 -5
package/src/tools/network/web-search.ts +0 -5
package/src/tools/registry.ts +2 -7
package/src/tools/schema-transforms.ts +99 -0
package/src/tools/skills/load.ts +62 -8
package/src/tools/swarm/delegate.ts +0 -5
package/src/tools/system/avatar-generator.ts +0 -5
package/src/tools/ui-surface/definitions.ts +0 -15
package/src/tools/watch/screen-watch.ts +0 -5
package/src/tools/watch/watch-state.ts +0 -12
package/src/util/logger.ts +7 -41
package/src/util/platform.ts +9 -28
package/src/version.ts +10 -0
package/src/watcher/providers/github.ts +51 -52
package/src/watcher/providers/gmail.ts +88 -80
package/src/watcher/providers/google-calendar.ts +94 -86
package/src/watcher/providers/linear.ts +87 -93
package/src/__tests__/computer-use-session-compaction.test.ts +0 -143
package/src/__tests__/computer-use-session-lifecycle.test.ts +0 -322
package/src/__tests__/computer-use-session-working-dir.test.ts +0 -166
package/src/__tests__/computer-use-skill-baseline.test.ts +0 -78
package/src/__tests__/computer-use-skill-endstate.test.ts +0 -105
package/src/__tests__/computer-use-skill-lifecycle-cleanup.test.ts +0 -249
package/src/__tests__/ride-shotgun-handler.test.ts +0 -452
package/src/cli/commands/dev.ts +0 -129
package/src/cli/commands/map.ts +0 -391
package/src/cli/commands/oauth.ts +0 -77
package/src/config/bundled-skills/computer-use/tools/computer-use-request-control.ts +0 -16
package/src/daemon/computer-use-session.ts +0 -1020
package/src/daemon/ride-shotgun-handler.ts +0 -567
package/src/oauth/provider-profiles.ts +0 -192
package/src/prompts/computer-use-prompt.ts +0 -98
package/src/runtime/routes/computer-use-routes.ts +0 -641
package/src/runtime/telegram-streaming-delivery.test.ts +0 -597
package/src/runtime/telegram-streaming-delivery.ts +0 -383
package/src/tools/computer-use/request-computer-control.ts +0 -61

package/src/daemon/computer-use-session.ts DELETED

@@ -1,1020 +0,0 @@
-/**
- * Computer-use session orchestrator.
- *
- * Manages the observation -> infer -> action loop for computer-use tasks,
- * bridging the macOS client (which captures screen state and executes actions)
- * with the AgentLoop (which runs inference via the Anthropic API with CU tools).
- */
-import { v4 as uuid } from "uuid";
-import { AgentLoop } from "../agent/loop.js";
-import { getConfig } from "../config/loader.js";
-import { PermissionPrompter } from "../permissions/prompter.js";
-import { SecretPrompter } from "../permissions/secret-prompter.js";
-import type { UserDecision } from "../permissions/types.js";
-import { buildComputerUseSystemPrompt } from "../prompts/computer-use-prompt.js";
-import type {
-  ContentBlock,
-  Message,
-  Provider,
-  ToolDefinition,
-} from "../providers/types.js";
-import { allComputerUseTools } from "../tools/computer-use/definitions.js";
-import { ToolExecutor } from "../tools/executor.js";
-import { getTool, registerSkillTools } from "../tools/registry.js";
-import type { Tool, ToolExecutionResult } from "../tools/types.js";
-import { allUiSurfaceTools } from "../tools/ui-surface/definitions.js";
-import { getLogger } from "../util/logger.js";
-import { getSandboxWorkingDir } from "../util/platform.js";
-import type {
-  CuObservation,
-  ServerMessage,
-  SurfaceData,
-  SurfaceType,
-  UiSurfaceShow,
-} from "./message-protocol.js";
-import { INTERACTIVE_SURFACE_TYPES } from "./message-protocol.js";
-import {
-  projectSkillTools,
-  resetSkillToolProjection,
-  type SkillProjectionCache,
-} from "./session-skill-tools.js";
-const log = getLogger("computer-use-session");
-const MAX_STEPS = 50;
-const SESSION_TIMEOUT_MS = 30 * 60 * 1000; // 30 minutes
-const MAX_HISTORY_ENTRIES = 10;
-const LOOP_DETECTION_WINDOW = 3;
-const CONSECUTIVE_UNCHANGED_WARNING_THRESHOLD = 2;
-/** Number of most-recent AX tree snapshots to keep in conversation history. */
-const MAX_AX_TREES_IN_HISTORY = 2;
-/** Regex that matches the `<ax-tree>…</ax-tree>` markers injected by buildObservationResultContent. */
-const AX_TREE_PATTERN = /<ax-tree>[\s\S]*?<\/ax-tree>/g;
-const AX_TREE_PLACEHOLDER = "<ax_tree_omitted />";
-type SessionState =
-  | "idle"
-  | "awaiting_observation"
-  | "inferring"
-  | "complete"
-  | "error";
-interface ActionRecord {
-  step: number;
-  toolName: string;
-  input: Record<string, unknown>;
-  reasoning?: string;
-  result?: string;
-}
-export class ComputerUseSession {
-  private readonly sessionId: string;
-  private readonly task: string;
-  private readonly screenWidth: number;
-  private readonly screenHeight: number;
-  private readonly provider: Provider;
-  private sendToClient: (msg: ServerMessage) => void;
-  private readonly interactionType: "computer_use" | "text_qa";
-  private readonly onTerminal?: (sessionId: string) => void;
-  private readonly preactivatedSkillIds: string[];
-  private readonly skillProjectionState = new Map<string, string>();
-  private readonly skillProjectionCache: SkillProjectionCache = {};
-  private state: SessionState = "idle";
-  private stepCount = 0;
-  private actionHistory: ActionRecord[] = [];
-  private previousAXTree: string | undefined;
-  private consecutiveUnchangedSteps = 0;
-  private abortController: AbortController | null = null;
-  private sessionTimer: ReturnType<typeof setTimeout> | null = null;
-  private pendingObservation: {
-    resolve: (result: ToolExecutionResult) => void;
-  } | null = null;
-  private pendingSurfaceActions = new Map<
-    string,
-    {
-      resolve: (result: ToolExecutionResult) => void;
-    }
-  >();
-  /** @internal */ surfaceState = new Map<
-    string,
-    { surfaceType: SurfaceType; data: SurfaceData; title?: string }
-  >();
-  private terminalNotified = false;
-  private prompter: PermissionPrompter | null = null;
-  // Tracks the agent loop promise so callers can await session completion
-  private loopPromise: Promise<void> | null = null;
-  constructor(
-    sessionId: string,
-    task: string,
-    screenWidth: number,
-    screenHeight: number,
-    provider: Provider,
-    sendToClient: (msg: ServerMessage) => void,
-    interactionType?: "computer_use" | "text_qa",
-    onTerminal?: (sessionId: string) => void,
-    preactivatedSkillIds?: string[],
-  ) {
-    this.sessionId = sessionId;
-    this.task = task;
-    this.screenWidth = screenWidth;
-    this.screenHeight = screenHeight;
-    this.provider = provider;
-    this.sendToClient = sendToClient;
-    this.interactionType = interactionType ?? "computer_use";
-    this.onTerminal = onTerminal;
-    this.preactivatedSkillIds = preactivatedSkillIds ?? ["computer-use"];
-  }
-  // ---------------------------------------------------------------------------
-  // Public API
-  // ---------------------------------------------------------------------------
-  async handleObservation(obs: CuObservation): Promise<void> {
-    if (this.state === "complete" || this.state === "error") {
-      log.warn(
-        { sessionId: this.sessionId, state: this.state },
-        "Observation received after session ended",
-      );
-      return;
-    }
-    // Track consecutive unchanged steps
-    const hadPreviousAXTree = this.previousAXTree != null;
-    if (this.stepCount > 0) {
-      if (obs.axDiff == null && hadPreviousAXTree && obs.axTree != null) {
-        this.consecutiveUnchangedSteps++;
-      } else if (obs.axDiff != null) {
-        this.consecutiveUnchangedSteps = 0;
-      }
-    }
-    // Capture previous AX tree for next turn
-    if (obs.axTree != null) {
-      this.previousAXTree = obs.axTree;
-    }
-    if (this.state === "awaiting_observation" && this.pendingObservation) {
-      // Resolve the pending proxy tool result with updated screen context
-      const content = this.buildObservationResultContent(
-        obs,
-        hadPreviousAXTree,
-      );
-      const result: ToolExecutionResult = obs.executionError
-        ? {
-            content: `Action failed: ${obs.executionError}\n\n${content}`,
-            isError: true,
-          }
-        : { content, isError: false };
-      this.state = "inferring";
-      this.pendingObservation.resolve(result);
-      this.pendingObservation = null;
-      // The agent loop continues automatically after resolution
-      return;
-    }
-    // First observation — start the agent loop
-    this.state = "inferring";
-    this.abortController = new AbortController();
-    // Safety net: abort the session if it runs longer than SESSION_TIMEOUT_MS
-    this.sessionTimer = setTimeout(() => {
-      log.warn(
-        { sessionId: this.sessionId, timeoutMs: SESSION_TIMEOUT_MS },
-        "Session timeout reached, aborting",
-      );
-      this.abort();
-    }, SESSION_TIMEOUT_MS);
-    const messages = this.buildMessages(obs, hadPreviousAXTree);
-    this.loopPromise = this.runAgentLoop(messages).catch((err) => {
-      // Catches errors from setup code (e.g. skill projection failures) that
-      // occur before runAgentLoop's internal try-catch takes over.
-      const message = err instanceof Error ? err.message : String(err);
-      log.error(
-        { err, sessionId: this.sessionId },
-        "Agent loop startup failed",
-      );
-      if (this.sessionTimer) {
-        clearTimeout(this.sessionTimer);
-        this.sessionTimer = null;
-      }
-      if (this.state !== "complete" && this.state !== "error") {
-        this.state = "error";
-        this.sendToClient({
-          type: "cu_error",
-          sessionId: this.sessionId,
-          message,
-        });
-        this.notifyTerminal();
-      }
-    });
-    await this.loopPromise;
-  }
-  abort(): void {
-    if (this.state === "complete" || this.state === "error") return;
-    log.info({ sessionId: this.sessionId }, "Aborting computer-use session");
-    if (this.sessionTimer) {
-      clearTimeout(this.sessionTimer);
-      this.sessionTimer = null;
-    }
-    this.abortController?.abort();
-    // If waiting for an observation, resolve it as cancelled
-    if (this.pendingObservation) {
-      this.pendingObservation.resolve({
-        content: "Session aborted",
-        isError: true,
-      });
-      this.pendingObservation = null;
-    }
-    // Dispose prompter to clear pending permission timers and reject promises
-    this.prompter?.dispose();
-    // Resolve any pending surface actions
-    for (const [, pending] of this.pendingSurfaceActions) {
-      pending.resolve({ content: "Session aborted", isError: true });
-    }
-    this.pendingSurfaceActions.clear();
-    this.surfaceState.clear();
-    this.state = "error";
-    this.sendToClient({
-      type: "cu_error",
-      sessionId: this.sessionId,
-      message: "Session aborted by user",
-    });
-    this.notifyTerminal();
-  }
-  isComplete(): boolean {
-    return this.state === "complete";
-  }
-  getState(): string {
-    return this.state;
-  }
-  /**
-   * Resolves the CU tool definitions by running skill projection over the
-   * preactivated skill ids and looking each allowed tool name up via
-   * `getTool`.
-   *
-   * @returns The definitions of every allowed tool that `getTool` can find,
-   *   or null (after logging a warning) when no skill ids are configured,
-   *   when projection allows no tools, or when projection throws. A null
-   *   result tells the caller to fall back to the legacy hardcoded CU tools.
-   */
-  private getProjectedCuToolDefinitions(): ToolDefinition[] | null {
-    const skillIds = this.preactivatedSkillIds;
-    if (skillIds.length === 0) {
-      log.warn(
-        "No preactivatedSkillIds configured, falling back to legacy CU tools",
-      );
-      return null;
-    }
-    try {
-      const projected = projectSkillTools([], {
-        preactivatedSkillIds: skillIds,
-        previouslyActiveSkillIds: this.skillProjectionState,
-        cache: this.skillProjectionCache,
-      });
-      if (projected.allowedToolNames.size === 0) {
-        log.warn(
-          { preactivatedSkillIds: skillIds },
-          "Skill projection produced no tool definitions, falling back to legacy CU tools",
-        );
-        return null;
-      }
-      // projectSkillTools no longer hands back definitions (tools are
-      // dispatched via skill_execute), so each allowed name is resolved
-      // through the registry; names without a registered tool are skipped.
-      return Array.from(projected.allowedToolNames).flatMap((toolName) => {
-        const registered = getTool(toolName);
-        return registered ? [registered.getDefinition()] : [];
-      });
-    } catch (err) {
-      log.warn(
-        { err },
-        "Skill projection failed, falling back to legacy CU tools",
-      );
-      return null;
-    }
-  }
-  /**
-   * Delivers a surface action to whoever is waiting on that surface.
-   *
-   * Logs a warning and does nothing when no action is pending for
-   * `surfaceId`. Otherwise the pending entry is removed and resolved with a
-   * JSON payload of `{ actionId, data }` (with `data` defaulting to `{}`),
-   * except for `selection_changed`, which leaves the entry in place.
-   */
-  handleSurfaceAction(
-    surfaceId: string,
-    actionId: string,
-    data?: Record<string, unknown>,
-  ): void {
-    const waiter = this.pendingSurfaceActions.get(surfaceId);
-    if (!waiter) {
-      log.warn({ surfaceId, actionId }, "No pending surface action found");
-      return;
-    }
-    // selection_changed is only a non-terminal state update, so the pending
-    // entry must survive it; the selection itself arrives later in the
-    // action button payload.
-    if (actionId !== "selection_changed") {
-      this.pendingSurfaceActions.delete(surfaceId);
-      const payload = JSON.stringify({ actionId, data: data ?? {} });
-      waiter.resolve({ content: payload, isError: false });
-    }
-  }
-  // ---------------------------------------------------------------------------
-  // Agent loop execution
-  // ---------------------------------------------------------------------------
-  /**
-   * Drives one computer-use session through an AgentLoop.
-   *
-   * Steps, in order:
-   *  1. Build the system prompt from the screen dimensions.
-   *  2. Obtain CU tool definitions from skill projection, or fall back to the
-   *     legacy `allComputerUseTools` registered as skill-origin tools, and
-   *     append the UI surface tool definitions.
-   *  3. Create the permission/secret prompters and a ToolExecutor whose
-   *     proxy resolver forwards surface tools (`ui_show`, `ui_update`,
-   *     `ui_dismiss`) and computer-use actions to the client.
-   *  4. Wrap the provider so history is compacted before every call.
-   *  5. Run the loop, translating loop errors and unexpected exits into
-   *     `cu_error` messages.
-   *
-   * Skill projection state is reset and the session timer is cleared in the
-   * `finally` block regardless of how the loop ends.
-   *
-   * @param messages - Messages handed to `agentLoop.run` as the starting
-   *   conversation.
-   */
-  private async runAgentLoop(messages: Message[]): Promise<void> {
-    const systemPrompt = buildComputerUseSystemPrompt(
-      this.screenWidth,
-      this.screenHeight,
-    );
-    let cuToolDefs = this.getProjectedCuToolDefinitions();
-    if (!cuToolDefs) {
-      // Fallback: register the legacy CU tools as skill-origin tools so
-      // ToolExecutor can resolve them via getTool(), but using the same
-      // ownerSkillId as the bundled computer-use skill. This avoids
-      // core-vs-skill collisions that would permanently block skill
-      // projection recovery on subsequent sessions.
-      const fallbackSkillId = this.preactivatedSkillIds[0] ?? "computer-use";
-      const fallbackTools: Tool[] = allComputerUseTools.map((t) => ({
-        ...t,
-        origin: "skill" as const,
-        ownerSkillId: fallbackSkillId,
-        ownerSkillBundled: true,
-      }));
-      registerSkillTools(fallbackTools);
-      // Track in the session map so resetSkillToolProjection cleans up
-      this.skillProjectionState.set(fallbackSkillId, "fallback");
-      cuToolDefs = allComputerUseTools.map((t) => t.getDefinition());
-    }
-    // The model is offered the CU tools plus every UI surface tool.
-    const toolDefs: ToolDefinition[] = [
-      ...cuToolDefs,
-      ...allUiSurfaceTools.map((t) => t.getDefinition()),
-    ];
-    // The permission prompter is kept on the instance so other methods can
-    // reach it; the secret prompter is local to this run.
-    this.prompter = new PermissionPrompter(this.sendToClient);
-    const prompter = this.prompter;
-    const secretPrompter = new SecretPrompter(this.sendToClient);
-    const executor = new ToolExecutor(prompter);
-    // Passed to the executor as `proxyToolResolver`: surface tools are
-    // handled first, anything else is treated as a computer-use action that
-    // the client must perform.
-    const proxyResolver = async (
-      toolName: string,
-      input: Record<string, unknown>,
-    ): Promise<ToolExecutionResult> => {
-      // ── Surface tool proxying ──────────────────────────────────────
-      if (toolName === "ui_show") {
-        const surfaceId = uuid();
-        const surfaceType = input.surface_type as SurfaceType;
-        const title = typeof input.title === "string" ? input.title : undefined;
-        const data = input.data as SurfaceData;
-        const actions = input.actions as
-          | Array<{ id: string; label: string; style?: string }>
-          | undefined;
-        // Interactive surfaces default to awaiting user action.
-        // Tables and lists only block when explicit action buttons are provided;
-        // selectionMode alone should not gate blocking because selection_changed
-        // fires on every click and would immediately resolve multi-select surfaces.
-        const hasActions = Array.isArray(actions) && actions.length > 0;
-        // card, list and table are interactive only when they carry actions;
-        // every other type defers to INTERACTIVE_SURFACE_TYPES.
-        const isInteractive =
-          surfaceType === "card"
-            ? hasActions
-            : surfaceType === "list"
-              ? hasActions
-              : surfaceType === "table"
-                ? hasActions
-                : INTERACTIVE_SURFACE_TYPES.includes(surfaceType);
-        // An explicit await_action from the model wins over the default.
-        const awaitAction = (input.await_action as boolean) ?? isInteractive;
-        // Track surface state for ui_update merging
-        this.surfaceState.set(surfaceId, { surfaceType, data, title });
-        this.sendToClient({
-          type: "ui_surface_show",
-          sessionId: this.sessionId,
-          surfaceId,
-          surfaceType,
-          title,
-          data,
-          actions: actions?.map((a) => ({
-            id: a.id,
-            label: a.label,
-            style: (a.style ?? "secondary") as
-              | "primary"
-              | "secondary"
-              | "destructive",
-          })),
-        } as unknown as UiSurfaceShow);
-        if (awaitAction) {
-          // Parked until the entry in pendingSurfaceActions is resolved.
-          return new Promise<ToolExecutionResult>((resolve) => {
-            this.pendingSurfaceActions.set(surfaceId, { resolve });
-          });
-        }
-        return { content: JSON.stringify({ surfaceId }), isError: false };
-      }
-      if (toolName === "ui_update") {
-        const surfaceId = input.surface_id as string;
-        const patch = input.data as Record<string, unknown>;
-        // Merge the partial patch into the stored full surface data
-        const stored = this.surfaceState.get(surfaceId);
-        let mergedData: SurfaceData;
-        if (stored) {
-          // Shallow merge: patch keys overwrite stored keys.
-          mergedData = { ...stored.data, ...patch } as SurfaceData;
-          stored.data = mergedData;
-        } else {
-          // Unknown surface: forward the patch as-is.
-          mergedData = patch as unknown as SurfaceData;
-        }
-        this.sendToClient({
-          type: "ui_surface_update",
-          sessionId: this.sessionId,
-          surfaceId,
-          data: mergedData,
-        });
-        return { content: "Surface updated", isError: false };
-      }
-      if (toolName === "ui_dismiss") {
-        const surfaceId = input.surface_id as string;
-        this.sendToClient({
-          type: "ui_surface_dismiss",
-          sessionId: this.sessionId,
-          surfaceId,
-        });
-        // NOTE(review): the pending entry is deleted without being resolved.
-        // If a ui_show call could still be awaiting this surface, its promise
-        // would never settle. Confirm that cannot happen.
-        this.pendingSurfaceActions.delete(surfaceId);
-        this.surfaceState.delete(surfaceId);
-        return { content: "Surface dismissed", isError: false };
-      }
-      // ── Computer-use tool proxying ─────────────────────────────────
-      const reasoning =
-        typeof input.reasoning === "string" ? input.reasoning : undefined;
-      // Record action in history
-      // stepCount is incremented further down, so +1 is the number this
-      // action will carry if it is sent to the client.
-      this.actionHistory.push({
-        step: this.stepCount + 1,
-        toolName,
-        input,
-        reasoning,
-      });
-      // Check for terminal tools
-      if (
-        toolName === "computer_use_done" ||
-        toolName === "computer_use_respond"
-      ) {
-        // done reads `summary`, respond reads `answer`; each has a default.
-        const summary =
-          toolName === "computer_use_done"
-            ? typeof input.summary === "string"
-              ? input.summary
-              : "Task completed"
-            : typeof input.answer === "string"
-              ? input.answer
-              : "No answer provided";
-        this.sendToClient({
-          type: "cu_complete",
-          sessionId: this.sessionId,
-          summary,
-          stepCount: this.stepCount,
-          isResponse: toolName === "computer_use_respond" ? true : undefined,
-        });
-        this.state = "complete";
-        // Stop AgentLoop immediately so terminal tools cannot trigger extra provider calls.
-        this.abortController?.abort();
-        this.notifyTerminal();
-        return { content: "Session complete", isError: false };
-      }
-      this.stepCount++;
-      // Enforce step limit — abort the loop so toolChoice:'any' can't force another turn
-      if (this.stepCount > MAX_STEPS) {
-        this.state = "error";
-        this.sendToClient({
-          type: "cu_error",
-          sessionId: this.sessionId,
-          message: `Step limit (${MAX_STEPS}) exceeded`,
-        });
-        this.abortController?.abort();
-        this.notifyTerminal();
-        return { content: `Step limit (${MAX_STEPS}) exceeded`, isError: true };
-      }
-      // Send action to client for execution
-      this.sendToClient({
-        type: "cu_action",
-        sessionId: this.sessionId,
-        toolName,
-        input,
-        reasoning,
-        stepNumber: this.stepCount,
-      });
-      // Wait for next observation from client
-      this.state = "awaiting_observation";
-      return new Promise<ToolExecutionResult>((resolve) => {
-        this.pendingObservation = { resolve };
-      });
-    };
-    // Build a set of tool names the CU session is allowed to execute.
-    // This prevents tools registered globally (e.g. computer_use_request_control)
-    // but not advertised to the CU model from executing during CU sessions.
-    const allowedToolNames = new Set(toolDefs.map((td) => td.name));
-    // Adapter handed to AgentLoop: every tool call goes through the executor
-    // with this session's context, proxy resolver and allow-list.
-    const toolExecutor = async (
-      name: string,
-      input: Record<string, unknown>,
-    ): Promise<ToolExecutionResult> => {
-      return executor.execute(name, input, {
-        workingDir: getSandboxWorkingDir(),
-        sessionId: this.sessionId,
-        conversationId: this.sessionId,
-        trustClass: "guardian",
-        proxyToolResolver: proxyResolver,
-        allowedToolNames,
-        requestSecret: async (params) => {
-          return secretPrompter.prompt(
-            params.service,
-            params.field,
-            params.label,
-            params.description,
-            params.placeholder,
-            this.sessionId,
-            params.purpose,
-            params.allowedTools,
-            params.allowedDomains,
-          );
-        },
-      });
-    };
-    // Wrap the provider so that old AX tree snapshots are stripped from
-    // conversation history before each API call, keeping only the most recent
-    // MAX_AX_TREES_IN_HISTORY entries.  This prevents TTFT from growing
-    // linearly with step count.
-    const compactingProvider: Provider = {
-      name: this.provider.name,
-      sendMessage: (msgs, tools, sys, opts) => {
-        const compacted = ComputerUseSession.compactHistory(msgs);
-        return this.provider.sendMessage(compacted, tools, sys, opts);
-      },
-    };
-    const cuConfig = getConfig();
-    const agentLoop = new AgentLoop(
-      compactingProvider,
-      systemPrompt,
-      {
-        maxTokens: 4096,
-        maxInputTokens: cuConfig.contextWindow.maxInputTokens,
-        toolChoice: { type: "any" },
-      },
-      toolDefs,
-      toolExecutor,
-    );
-    try {
-      await agentLoop.run(
-        messages,
-        (event) => {
-          switch (event.type) {
-            case "error":
-              log.error(
-                { err: event.error, sessionId: this.sessionId },
-                "Agent loop error",
-              );
-              // A session that already completed is not downgraded to error.
-              if (this.state !== "complete") {
-                this.state = "error";
-                this.sendToClient({
-                  type: "cu_error",
-                  sessionId: this.sessionId,
-                  message: event.error.message,
-                });
-                this.notifyTerminal();
-              }
-              break;
-            case "usage":
-              log.info(
-                {
-                  sessionId: this.sessionId,
-                  inputTokens: event.inputTokens,
-                  outputTokens: event.outputTokens,
-                  model: event.model,
-                },
-                "Usage",
-              );
-              break;
-            // Other events (text_delta, thinking_delta, etc.) are not surfaced to the CU client
-          }
-        },
-        this.abortController?.signal,
-      );
-      // If the loop exits without completing, treat as error
-      if (this.state !== "complete" && this.state !== "error") {
-        this.state = "error";
-        this.sendToClient({
-          type: "cu_error",
-          sessionId: this.sessionId,
-          message: "Agent loop ended unexpectedly",
-        });
-        this.notifyTerminal();
-      }
-    } catch (err) {
-      // Terminal tools and the step limit abort the controller themselves
-      // and have already notified the client, so an aborted signal is logged
-      // and not reported as a failure.
-      if (this.abortController?.signal.aborted) {
-        log.info({ sessionId: this.sessionId }, "Agent loop aborted");
-        return;
-      }
-      const message = err instanceof Error ? err.message : String(err);
-      log.error({ err, sessionId: this.sessionId }, "Agent loop failed");
-      if (this.state !== "complete") {
-        this.state = "error";
-        this.sendToClient({
-          type: "cu_error",
-          sessionId: this.sessionId,
-          message,
-        });
-        this.notifyTerminal();
-      }
-    } finally {
-      // Always clean up skill projection state and session timer
-      resetSkillToolProjection(this.skillProjectionState);
-      if (this.sessionTimer) {
-        clearTimeout(this.sessionTimer);
-        this.sessionTimer = null;
-      }
-    }
-  }
-  /**
-   * Fires the terminal notification at most once per session: marks the
-   * session as notified, resets skill tool projection state, then invokes
-   * the optional `onTerminal` callback with the session id.
-   */
-  private notifyTerminal(): void {
-    if (!this.terminalNotified) {
-      this.terminalNotified = true;
-      resetSkillToolProjection(this.skillProjectionState);
-      this.onTerminal?.(this.sessionId);
-    }
-  }
-  // ---------------------------------------------------------------------------
-  // History compaction — strip old AX tree snapshots from tool results
-  // ---------------------------------------------------------------------------
-  /**
-   * Shrinks the conversation by replacing old `<ax-tree>` snapshots with
-   * `AX_TREE_PLACEHOLDER`, so only the newest `MAX_AX_TREES_IN_HISTORY`
-   * snapshot-carrying user messages keep their full tree.
-   *
-   * The input array and its messages are never mutated. When nothing needs
-   * stripping the original array is returned unchanged; otherwise a new
-   * array is returned in which only the stripped messages are copies.
-   *
-   * @param messages - Conversation history to compact.
-   * @returns The history with stale AX tree snapshots replaced.
-   */
-  static compactHistory(messages: Message[]): Message[] {
-    // Positions of user messages holding at least one string tool_result
-    // that contains an <ax-tree> marker.
-    const axTreePositions: number[] = [];
-    messages.forEach((message, position) => {
-      if (message.role !== "user") return;
-      const carriesAxTree = message.content.some(
-        (block) =>
-          block.type === "tool_result" &&
-          typeof block.content === "string" &&
-          block.content.includes("<ax-tree>"),
-      );
-      if (carriesAxTree) axTreePositions.push(position);
-    });
-    if (axTreePositions.length <= MAX_AX_TREES_IN_HISTORY) {
-      return messages;
-    }
-    // Everything except the trailing MAX_AX_TREES_IN_HISTORY positions is stale.
-    const stale = new Set(axTreePositions.slice(0, -MAX_AX_TREES_IN_HISTORY));
-    return messages.map((message, position) => {
-      if (!stale.has(position)) return message;
-      const strippedContent = message.content.map((block) => {
-        if (
-          block.type !== "tool_result" ||
-          typeof block.content !== "string" ||
-          !block.content.includes("<ax-tree>")
-        ) {
-          return block;
-        }
-        return {
-          ...block,
-          content: block.content.replace(AX_TREE_PATTERN, AX_TREE_PLACEHOLDER),
-        };
-      });
-      return { ...message, content: strippedContent };
-    });
-  }
-  /**
-   * Neutralises literal `</ax-tree>` closing tags (matched case-insensitively)
-   * inside AX tree text by rewriting them as `&lt;/ax-tree&gt;`.
-   *
-   * Without this, a screen showing XML/HTML source that happens to contain
-   * the closing tag would end the non-greedy `AX_TREE_PATTERN` match early
-   * during compaction. No unescape step is needed, because compaction swaps
-   * the whole block for a placeholder.
-   *
-   * @param content - Raw AX tree text.
-   * @returns The text with every closing tag escaped.
-   */
-  static escapeAxTreeContent(content: string): string {
-    const closingTag = /<\/ax-tree>/gi;
-    const escapedClosingTag = "&lt;/ax-tree&gt;";
-    return content.replace(closingTag, escapedClosingTag);
-  }
-  // ---------------------------------------------------------------------------
-  // Build rich tool-result content from an observation so the model sees
-  // updated screen state on each turn (not just "Action executed").
-  // ---------------------------------------------------------------------------
-  /**
-   * Renders an observation as the text of a tool result.
-   *
-   * Sections are emitted in this order when present: user guidance,
-   * execution result, AX diff (or a no-effect notice when there is no diff
-   * but a previous and a current AX tree exist), the current AX tree wrapped
-   * in `<ax-tree>` markers, and screenshot metadata.
-   *
-   * @param obs - Observation to describe.
-   * @param hadPreviousAXTree - Whether an AX tree was available before this
-   *   observation; enables the no-effect notice.
-   * @returns The trimmed text, or "Action executed" when it would be empty.
-   */
-  private buildObservationResultContent(
-    obs: CuObservation,
-    hadPreviousAXTree: boolean,
-  ): string {
-    const lines: string[] = [];
-    // Guidance goes first so it is the first thing the model reads.
-    if (obs.userGuidance) {
-      lines.push(`USER GUIDANCE: ${obs.userGuidance}`, "");
-    }
-    if (obs.executionResult) {
-      lines.push(obs.executionResult, "");
-    }
-    if (obs.axDiff) {
-      lines.push(obs.axDiff, "");
-    } else if (hadPreviousAXTree && obs.axTree != null) {
-      // No diff although both trees exist: the last action changed nothing.
-      const stalledSteps = this.consecutiveUnchangedSteps;
-      const previousTool =
-        this.actionHistory[this.actionHistory.length - 1]?.toolName;
-      if (stalledSteps >= CONSECUTIVE_UNCHANGED_WARNING_THRESHOLD) {
-        lines.push(
-          `WARNING: ${stalledSteps} consecutive actions had NO VISIBLE EFFECT on the UI. You MUST try a completely different approach.`,
-        );
-      } else if (previousTool !== "computer_use_wait") {
-        // A wait is expected to leave the screen unchanged, so it is not flagged.
-        lines.push(
-          "Your last action had NO VISIBLE EFFECT on the UI. Try something different.",
-        );
-      }
-      lines.push("");
-    }
-    // The markers let compactHistory find and strip this snapshot later.
-    if (obs.axTree) {
-      lines.push(
-        "<ax-tree>",
-        "CURRENT SCREEN STATE:",
-        ComputerUseSession.escapeAxTreeContent(obs.axTree),
-        "</ax-tree>",
-      );
-    }
-    const metadataLines = this.formatScreenshotMetadata(obs);
-    if (metadataLines.length > 0) {
-      lines.push("", ...metadataLines);
-    }
-    const rendered = lines.join("\n").trim();
-    return rendered || "Action executed";
-  }
-  // ---------------------------------------------------------------------------
-  // Message building (replicates AnthropicProvider.buildMessages from Swift)
-  // ---------------------------------------------------------------------------
-  /**
-   * Builds a one-element message list: a user message made of an optional
-   * screenshot image block followed by a single text block.
-   *
-   * The text block contains, in order: the task, what changed since the last
-   * action (AX diff or a no-effect notice), the current screen state, the
-   * windowed action history, a loop-detection warning, user guidance, and a
-   * closing prompt for the next action.
-   *
-   * @param obs - Observation supplying the screenshot, AX tree, AX diff,
-   *   secondary windows and user guidance.
-   * @param hadPreviousAXTree - Whether an AX tree was available before this
-   *   observation; enables the no-effect notice when there is no diff.
-   * @returns An array holding exactly one user message.
-   */
-  private buildMessages(
-    obs: CuObservation,
-    hadPreviousAXTree: boolean,
-  ): Message[] {
-    const contentBlocks: ContentBlock[] = [];
-    // Screenshot image block
-    if (obs.screenshot) {
-      contentBlocks.push({
-        type: "image",
-        source: {
-          type: "base64",
-          media_type: "image/jpeg",
-          data: obs.screenshot,
-        },
-      });
-    }
-    // Text block
-    const textParts: string[] = [];
-    const trimmedTask = this.task.trim();
-    if (trimmedTask) {
-      textParts.push(`TASK: ${trimmedTask}`);
-    } else {
-      textParts.push("TASK: No explicit task provided.");
-    }
-    textParts.push("");
-    // AX tree diff (compact summary of what changed)
-    if (obs.axDiff && this.actionHistory.length > 0) {
-      textParts.push(obs.axDiff);
-      textParts.push("");
-    } else if (
-      hadPreviousAXTree &&
-      obs.axTree != null &&
-      this.actionHistory.length > 0
-    ) {
-      // AX tree unchanged — tell the model its action had no effect
-      const lastAction = this.actionHistory[this.actionHistory.length - 1];
-      const wasWait = lastAction?.toolName === "computer_use_wait";
-      textParts.push("CHANGES SINCE LAST ACTION:");
-      if (
-        this.consecutiveUnchangedSteps >=
-        CONSECUTIVE_UNCHANGED_WARNING_THRESHOLD
-      ) {
-        textParts.push(
-          `WARNING: ${this.consecutiveUnchangedSteps} consecutive actions had NO VISIBLE EFFECT on the UI. You MUST try a completely different approach — do not repeat any of your recent actions.`,
-        );
-      } else if (!wasWait) {
-        const actionDesc = lastAction?.toolName ?? "unknown";
-        textParts.push(
-          `Your last action (${actionDesc}) had NO VISIBLE EFFECT on the UI. The screen is identical to the previous step. Do NOT repeat the same action — try something different.`,
-        );
-      } else {
-        // A wait is expected to leave the screen unchanged, so the wording is neutral.
-        textParts.push(
-          "No visible changes detected — the UI is identical to the previous step.",
-        );
-      }
-      textParts.push("");
-    }
-    // Current screen state
-    if (obs.axTree) {
-      textParts.push(
-        "CURRENT SCREEN STATE (accessibility tree of the focused window):",
-      );
-      textParts.push(obs.axTree);
-      textParts.push("");
-      textParts.push(
-        "Use element_id with the [ID] numbers shown above to target elements.",
-      );
-      // Secondary windows for cross-app awareness
-      if (obs.secondaryWindows) {
-        textParts.push("");
-        textParts.push(obs.secondaryWindows);
-        textParts.push("");
-        textParts.push(
-          "Note: The element [ID]s above are from other windows — you can reference them for context but can only interact with the focused window's elements.",
-        );
-      }
-      if (obs.screenshot) {
-        textParts.push("");
-        textParts.push(
-          "A screenshot of the FULL SCREEN is also attached above. Use it to see content outside the focused window (e.g., reference documents, PDFs, other apps visible behind the current window).",
-        );
-        const screenshotMetadata = this.formatScreenshotMetadata(obs);
-        if (screenshotMetadata.length > 0) {
-          textParts.push(...screenshotMetadata);
-        }
-      }
-    } else if (obs.screenshot) {
-      textParts.push("CURRENT SCREEN STATE:");
-      textParts.push(
-        "See the screenshot above. No accessibility tree available — estimate coordinates from the image.",
-      );
-      const screenshotMetadata = this.formatScreenshotMetadata(obs);
-      if (screenshotMetadata.length > 0) {
-        textParts.push(...screenshotMetadata);
-      }
-    } else {
-      textParts.push("CURRENT SCREEN STATE:");
-      textParts.push("No screen data available.");
-    }
-    // Action history, limited to the newest MAX_HISTORY_ENTRIES records
-    if (this.actionHistory.length > 0) {
-      textParts.push("");
-      textParts.push("ACTIONS TAKEN SO FAR:");
-      let windowedHistory: ActionRecord[];
-      if (this.actionHistory.length > MAX_HISTORY_ENTRIES) {
-        textParts.push(
-          `  [... ${this.actionHistory.length - MAX_HISTORY_ENTRIES} earlier actions omitted]`,
-        );
-        windowedHistory = this.actionHistory.slice(-MAX_HISTORY_ENTRIES);
-      } else {
-        windowedHistory = this.actionHistory;
-      }
-      for (const record of windowedHistory) {
-        const result = record.result ?? "executed";
-        textParts.push(`  ${record.step}. ${record.toolName} → ${result}`);
-      }
-    }
-    // Loop detection warning: the last LOOP_DETECTION_WINDOW actions all use
-    // the same tool with the same serialized input.
-    if (this.actionHistory.length >= LOOP_DETECTION_WINDOW) {
-      const recent = this.actionHistory.slice(-LOOP_DETECTION_WINDOW);
-      const reference = recent[0];
-      // Guard against an empty window so the comparison never dereferences
-      // a missing record.
-      if (reference !== undefined) {
-        // Serialize the reference input once, not once per compared record.
-        const referenceInput = JSON.stringify(reference.input);
-        const allIdentical = recent.every(
-          (r) =>
-            r.toolName === reference.toolName &&
-            JSON.stringify(r.input) === referenceInput,
-        );
-        if (allIdentical) {
-          textParts.push("");
-          textParts.push(
-            `WARNING: You have repeated the exact same action (${reference.toolName}) ${LOOP_DETECTION_WINDOW} times in a row. You MUST try a completely different approach or call computer_use_done with an explanation of why you are stuck.`,
-          );
-        }
-      }
-    }
-    // Surface user guidance prominently
-    if (obs.userGuidance) {
-      textParts.push("");
-      textParts.push(`USER GUIDANCE: ${obs.userGuidance}`);
-    }
-    // Prompt for next action
-    textParts.push("");
-    if (this.actionHistory.length === 0) {
-      textParts.push(
-        "This is the first action. Examine the screen state and decide what to do first.",
-      );
-    } else {
-      textParts.push("Decide the next action to take.");
-    }
-    contentBlocks.push({
-      type: "text",
-      text: textParts.join("\n"),
-    });
-    return [{ role: "user", content: contentBlocks }];
-  }
-  /**
-   * Describes the screenshot attached to an observation as a list of text
-   * lines: pixel size, screen size in points, coordinate origin and capture
-   * display id, each included only when the observation provides it.
-   *
-   * @param obs - Observation whose screenshot metadata is rendered.
-   * @returns The metadata lines; empty when there is no screenshot.
-   */
-  private formatScreenshotMetadata(obs: CuObservation): string[] {
-    const metadata: string[] = [];
-    if (!obs.screenshot) return metadata;
-    const {
-      screenshotWidthPx,
-      screenshotHeightPx,
-      screenWidthPt,
-      screenHeightPt,
-      coordinateOrigin,
-      captureDisplayId,
-    } = obs;
-    // Sizes are reported only when both dimensions are known.
-    if (screenshotWidthPx != null && screenshotHeightPx != null) {
-      metadata.push(
-        `Screenshot metadata: ${screenshotWidthPx}x${screenshotHeightPx} px`,
-      );
-    }
-    if (screenWidthPt != null && screenHeightPt != null) {
-      metadata.push(`Screen metadata: ${screenWidthPt}x${screenHeightPt} pt`);
-    }
-    if (coordinateOrigin) {
-      metadata.push(`Coordinate origin: ${coordinateOrigin}`);
-    }
-    if (captureDisplayId != null) {
-      metadata.push(`Capture display ID: ${captureDisplayId}`);
-    }
-    return metadata;
-  }
-  /**
-   * Asks the permission prompter whether `requestId` is still awaiting a
-   * decision; answers false when no prompter exists.
-   */
-  hasPendingConfirmation(requestId: string): boolean {
-    const pending = this.prompter?.hasPendingRequest(requestId);
-    return pending ?? false;
-  }
-  /**
-   * Forwards a confirmation decision, with its optional pattern, scope and
-   * context, to the permission prompter. Does nothing when no prompter
-   * exists.
-   */
-  handleConfirmationResponse(
-    requestId: string,
-    decision: UserDecision,
-    selectedPattern?: string,
-    selectedScope?: string,
-    decisionContext?: string,
-  ): void {
-    const activePrompter = this.prompter;
-    if (activePrompter == null) return;
-    activePrompter.resolveConfirmation(
-      requestId,
-      decision,
-      selectedPattern,
-      selectedScope,
-      decisionContext,
-    );
-  }
-}