npm - @vellumai/assistant - Versions diffs - 0.4.35 → 0.4.37 - Mend

@vellumai/assistant 0.4.35 → 0.4.37

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (239)

package/AGENTS.md +1 -1
package/ARCHITECTURE.md +44 -49
package/README.md +32 -20
package/docs/architecture/keychain-broker.md +186 -0
package/docs/architecture/security.md +110 -116
package/docs/runbook-trusted-contacts.md +2 -2
package/docs/skills.md +25 -25
package/package.json +5 -2
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +11 -2
package/src/__tests__/actor-token-service.test.ts +1 -0
package/src/__tests__/amazon-cdp-integration.test.ts +74 -0
package/src/__tests__/assistant-feature-flags-integration.test.ts +38 -9
package/src/__tests__/assistant-id-boundary-guard.test.ts +29 -0
package/src/__tests__/browser-fill-credential.test.ts +1 -1
package/src/__tests__/bundle-scanner.test.ts +1 -1
package/src/__tests__/channel-guardian.test.ts +102 -102
package/src/__tests__/channel-invite-transport.test.ts +155 -256
package/src/__tests__/channel-readiness-routes.test.ts +336 -0
package/src/__tests__/checker.test.ts +6 -6
package/src/__tests__/chrome-cdp.test.ts +350 -0
package/src/__tests__/computer-use-session-lifecycle.test.ts +3 -3
package/src/__tests__/computer-use-session-working-dir.test.ts +86 -52
package/src/__tests__/computer-use-skill-lifecycle-cleanup.test.ts +1 -1
package/src/__tests__/config-loader-migration.test.ts +85 -0
package/src/__tests__/conversation-pairing.test.ts +370 -5
package/src/__tests__/credential-broker-browser-fill.test.ts +1 -10
package/src/__tests__/credential-broker-server-use.test.ts +1 -10
package/src/__tests__/credential-security-e2e.test.ts +7 -1
package/src/__tests__/credential-security-invariants.test.ts +14 -20
package/src/__tests__/credential-vault-unit.test.ts +1 -11
package/src/__tests__/credential-vault.test.ts +5 -19
package/src/__tests__/credentials-cli.test.ts +814 -0
package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +23 -4
package/src/__tests__/email-invite-adapter.test.ts +78 -0
package/src/__tests__/email-service-config-fallback.test.ts +102 -0
package/src/__tests__/encrypted-store.test.ts +6 -6
package/src/__tests__/ephemeral-permissions.test.ts +3 -3
package/src/__tests__/gateway-only-enforcement.test.ts +5 -1
package/src/__tests__/guardian-actions-endpoint.test.ts +70 -12
package/src/__tests__/guardian-outbound-http.test.ts +53 -47
package/src/__tests__/handle-user-message-secret-resume.test.ts +23 -0
package/src/__tests__/handlers-add-trust-rule-metadata.test.ts +32 -23
package/src/__tests__/handlers-telegram-config.test.ts +8 -2
package/src/__tests__/handlers-twitter-config.test.ts +2 -2
package/src/__tests__/handlers-user-message-approval-consumption.test.ts +108 -7
package/src/__tests__/ingress-reconcile.test.ts +6 -0
package/src/__tests__/intent-routing.test.ts +23 -4
package/src/__tests__/invite-routes-http.test.ts +12 -0
package/src/__tests__/ipc-snapshot.test.ts +8 -2
package/src/__tests__/keychain-broker-client.test.ts +543 -0
package/src/__tests__/llm-usage-store.test.ts +344 -0
package/src/__tests__/mcp-client-auth.test.ts +2 -2
package/src/__tests__/media-reuse-story.e2e.test.ts +1 -1
package/src/__tests__/migration-transport.test.ts +49 -0
package/src/__tests__/notification-broadcaster.test.ts +205 -5
package/src/__tests__/notification-deep-link.test.ts +365 -1
package/src/__tests__/oauth-connect-handler.test.ts +2 -2
package/src/__tests__/onboarding-starter-tasks.test.ts +17 -4
package/src/__tests__/proxy-approval-callback.test.ts +1 -1
package/src/__tests__/recording-handler.test.ts +1 -1
package/src/__tests__/recording-intent-handler.test.ts +6 -1
package/src/__tests__/recording-state-machine.test.ts +1 -1
package/src/__tests__/relay-server.test.ts +9 -1
package/src/__tests__/ride-shotgun-handler.test.ts +499 -0
package/src/__tests__/runtime-attachment-metadata.test.ts +160 -1
package/src/__tests__/script-proxy-injection-runtime.test.ts +299 -2
package/src/__tests__/script-proxy-profile-template-fallback.test.ts +1 -1
package/src/__tests__/secret-onetime-send.test.ts +8 -2
package/src/__tests__/secure-keys.test.ts +175 -216
package/src/__tests__/session-confirmation-signals.test.ts +1 -1
package/src/__tests__/session-messaging-secret-redirect.test.ts +1 -1
package/src/__tests__/session-queue.test.ts +2 -1
package/src/__tests__/session-tool-setup-app-refresh.test.ts +2 -2
package/src/__tests__/skill-feature-flags-integration.test.ts +29 -4
package/src/__tests__/skill-feature-flags.test.ts +12 -9
package/src/__tests__/skill-load-feature-flag.test.ts +26 -5
package/src/__tests__/skill-projection.benchmark.test.ts +0 -1
package/src/__tests__/skills.test.ts +34 -4
package/src/__tests__/slack-channel-config.test.ts +2 -2
package/src/__tests__/system-prompt.test.ts +26 -4
package/src/__tests__/telegram-bot-username-resolution.test.ts +212 -0
package/src/__tests__/telegram-invite-adapter.test.ts +164 -0
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +1 -1
package/src/__tests__/tool-permission-simulate-handler.test.ts +8 -2
package/src/__tests__/trusted-contact-approval-notifier.test.ts +9 -1
package/src/__tests__/twitter-auth-handler.test.ts +2 -2
package/src/__tests__/twitter-oauth-client.test.ts +1 -1
package/src/__tests__/usage-routes.test.ts +339 -0
package/src/__tests__/whatsapp-invite-adapter.test.ts +94 -0
package/src/agent/loop.ts +3 -0
package/src/amazon/checkout.ts +0 -1
package/src/approvals/guardian-request-resolvers.ts +9 -1
package/src/bundler/app-bundler.ts +28 -12
package/src/bundler/bundle-scanner.ts +1 -1
package/src/bundler/bundle-signer.ts +3 -3
package/src/bundler/manifest.ts +1 -1
package/src/bundler/signature-verifier.ts +3 -3
package/src/channels/config.ts +1 -1
package/src/cli/AGENTS.md +63 -0
package/src/cli/__tests__/notifications.test.ts +470 -0
package/src/cli/amazon.ts +344 -167
package/src/cli/audit.ts +85 -0
package/src/cli/autonomy.ts +369 -0
package/src/cli/channels.ts +51 -0
package/src/cli/completions.ts +208 -0
package/src/cli/config.ts +220 -0
package/src/cli/contacts.ts +471 -0
package/src/cli/credentials.ts +564 -0
package/src/cli/default-action.ts +14 -0
package/src/cli/dev.ts +131 -0
package/src/cli/doctor.ts +398 -0
package/src/cli/email.ts +494 -0
package/src/cli/influencer.ts +72 -0
package/src/cli/integrations.ts +248 -57
package/src/cli/keys.ts +114 -0
package/src/cli/map.ts +46 -54
package/src/cli/mcp.ts +111 -3
package/src/cli/{config-commands.ts → memory.ts} +134 -245
package/src/cli/notifications.ts +407 -0
package/src/cli/program.ts +65 -0
package/src/cli/reference.ts +48 -0
package/src/cli/sequence.ts +154 -0
package/src/cli/sessions.ts +262 -0
package/src/cli/trust.ts +175 -0
package/src/cli/twitter.ts +323 -106
package/src/config/__tests__/build-cli-reference-section.test.ts +49 -0
package/src/config/bundled-skills/amazon/SKILL.md +2 -2
package/src/config/bundled-skills/app-builder/TOOLS.json +26 -0
package/src/config/bundled-skills/app-builder/tools/app-generate-icon.ts +13 -0
package/src/config/bundled-skills/contacts/SKILL.md +178 -10
package/src/config/bundled-skills/doordash/doordash-cli.ts +23 -168
package/src/config/bundled-skills/google-oauth-setup/SKILL.md +135 -34
package/src/config/bundled-skills/messaging/tools/shared.ts +4 -1
package/src/config/bundled-skills/twilio-setup/SKILL.md +70 -17
package/src/config/bundled-tool-registry.ts +2 -0
package/src/config/core-schema.ts +7 -0
package/src/config/feature-flag-registry.json +16 -0
package/src/config/loader.ts +26 -0
package/src/config/schema.ts +4 -0
package/src/config/skill-state.ts +0 -13
package/src/config/system-prompt.ts +27 -0
package/src/contacts/contact-store.ts +25 -0
package/src/daemon/computer-use-session.ts +1 -1
package/src/daemon/handlers/apps.ts +1 -0
package/src/daemon/handlers/config-channels.ts +3 -3
package/src/daemon/handlers/config-dispatch.ts +29 -0
package/src/daemon/handlers/config-inbox.ts +4 -3
package/src/daemon/handlers/config.ts +3 -43
package/src/daemon/handlers/contacts.ts +34 -0
package/src/daemon/handlers/index.ts +17 -3
package/src/daemon/handlers/session-user-message.ts +7 -0
package/src/daemon/handlers/sessions.ts +21 -2
package/src/daemon/handlers/shared.ts +17 -0
package/src/daemon/ipc-contract/apps.ts +2 -0
package/src/daemon/ipc-contract/computer-use.ts +9 -0
package/src/daemon/ipc-contract/contacts.ts +3 -3
package/src/daemon/ipc-contract/inbox.ts +2 -0
package/src/daemon/ipc-contract/messages.ts +4 -0
package/src/daemon/ipc-contract/sessions.ts +8 -0
package/src/daemon/ipc-contract-inventory.json +1 -0
package/src/daemon/lifecycle.ts +0 -5
package/src/daemon/ride-shotgun-handler.ts +139 -25
package/src/daemon/session-agent-loop-handlers.ts +100 -0
package/src/daemon/session-agent-loop.ts +72 -0
package/src/daemon/session-tool-setup.ts +7 -0
package/src/daemon/session.ts +23 -1
package/src/daemon/tool-side-effects.ts +39 -1
package/src/email/service.ts +59 -2
package/src/index.ts +2 -60
package/src/mcp/mcp-oauth-provider.ts +90 -8
package/src/media/app-icon-generator.ts +86 -0
package/src/memory/db-init.ts +11 -0
package/src/memory/llm-usage-store.ts +186 -0
package/src/memory/migrations/137-usage-dashboard-indexes.ts +26 -0
package/src/memory/migrations/139-drop-usage-composite-indexes.ts +30 -0
package/src/memory/migrations/index.ts +2 -0
package/src/memory/schema-migration.ts +1 -0
package/src/memory/shared-app-links-store.ts +1 -1
package/src/messaging/registry.ts +27 -0
package/src/notifications/README.md +79 -70
package/src/notifications/broadcaster.ts +2 -1
package/src/notifications/conversation-pairing.ts +147 -13
package/src/notifications/copy-composer.ts +7 -3
package/src/notifications/destination-resolver.ts +14 -1
package/src/notifications/emit-signal.ts +3 -2
package/src/notifications/signal.ts +105 -1
package/src/notifications/types.ts +16 -0
package/src/permissions/checker.ts +29 -3
package/src/permissions/prompter.ts +11 -3
package/src/runtime/access-request-helper.ts +2 -1
package/src/runtime/auth/route-policy.ts +7 -1
package/src/runtime/channel-invite-transport.ts +40 -63
package/src/runtime/channel-invite-transports/email.ts +13 -39
package/src/runtime/channel-invite-transports/slack.ts +5 -34
package/src/runtime/channel-invite-transports/sms.ts +8 -29
package/src/runtime/channel-invite-transports/telegram.ts +69 -28
package/src/runtime/channel-invite-transports/voice.ts +0 -7
package/src/runtime/channel-invite-transports/whatsapp.ts +43 -0
package/src/runtime/channel-readiness-service.ts +202 -45
package/src/runtime/confirmation-request-guardian-bridge.ts +2 -1
package/src/runtime/guardian-outbound-actions.ts +8 -5
package/src/runtime/http-server.ts +2 -0
package/src/runtime/invite-instruction-generator.ts +178 -0
package/src/runtime/invite-service.ts +22 -25
package/src/runtime/migrations/migration-transport.ts +13 -0
package/src/runtime/routes/app-routes.ts +1 -1
package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +8 -7
package/src/runtime/routes/channel-readiness-routes.ts +30 -11
package/src/runtime/routes/contact-routes.ts +54 -26
package/src/runtime/routes/inbound-stages/bootstrap-intercept.ts +1 -1
package/src/runtime/routes/inbound-stages/escalation-intercept.ts +2 -1
package/src/runtime/routes/inbound-stages/verification-intercept.ts +2 -1
package/src/runtime/routes/integration-routes.ts +1 -1
package/src/runtime/routes/invite-routes.ts +1 -1
package/src/runtime/routes/secret-routes.ts +31 -7
package/src/runtime/routes/twilio-routes.ts +32 -1
package/src/runtime/routes/usage-routes.ts +114 -0
package/src/runtime/tool-grant-request-helper.ts +2 -1
package/src/security/encrypted-store.ts +9 -5
package/src/security/keychain-broker-client.ts +393 -0
package/src/security/secure-keys.ts +106 -321
package/src/tools/apps/executors.ts +73 -0
package/src/tools/browser/auto-navigate.ts +15 -6
package/src/tools/browser/chrome-cdp.ts +211 -0
package/src/tools/browser/network-recorder.test.ts +83 -0
package/src/tools/browser/network-recorder.ts +8 -7
package/src/tools/browser/x-auto-navigate.ts +12 -6
package/src/tools/credentials/policy-types.ts +24 -0
package/src/tools/credentials/vault.ts +22 -27
package/src/tools/network/script-proxy/session-manager.ts +47 -3
package/src/tools/permission-checker.ts +1 -0
package/src/tools/types.ts +2 -0
package/src/tools/ui-surface/definitions.ts +1 -2
package/src/tools/watch/watch-state.ts +2 -0
package/src/__tests__/key-migration.test.ts +0 -240
package/src/__tests__/keychain.test.ts +0 -286
package/src/cli/core-commands.ts +0 -899
package/src/security/keychain-to-encrypted-migration.ts +0 -66
package/src/security/keychain.ts +0 -490

package/src/cli/twitter.ts (changed)

@@ -118,12 +118,57 @@ export function registerTwitterCommand(program: Command): void {
     )
     .option("--json", "Machine-readable JSON output");
+  tw.addHelpText(
+    "after",
+    `
+Twitter (X) uses a dual-path architecture for interacting with the platform:
+  1. OAuth (official API) — uses an authenticated Twitter OAuth application for
+     posting and replying. Requires a connected OAuth credential.
+  2. Browser session (Ride Shotgun) — uses cookies captured from a real Chrome
+     session to call Twitter's internal GraphQL API. Supports all read operations
+     and posting as a fallback.
+The strategy system controls which path is used for operations that support both:
+  oauth    — always use the OAuth API; fail if unavailable
+  browser  — always use the browser session; fail if unavailable
+  auto     — try OAuth first, fall back to browser session (default)
+Session management:
+  - "login" imports cookies from a Ride Shotgun recording file
+  - "refresh" launches Chrome with CDP, navigates to x.com/login, and runs a
+    Ride Shotgun learn session to capture fresh cookies automatically
+  - "status" shows whether browser session and OAuth are active
+  - "logout" clears the saved browser session cookies
+Examples:
+  $ vellum x status
+  $ vellum x post "Hello world"
+  $ vellum x timeline elonmusk --count 10
+  $ vellum x search "from:vaborsh AI agents" --product Latest
+  $ vellum x strategy set oauth`,
+  );
   // =========================================================================
   // login — import session from a recording
   // =========================================================================
   tw.command("login")
     .description("Import a Twitter session from a Ride Shotgun recording")
     .requiredOption("--recording <path>", "Path to the recording JSON file")
+    .addHelpText(
+      "after",
+      `
+Imports cookies from a Ride Shotgun recording file to establish a browser
+session. The recording file is a JSON file produced by a Ride Shotgun learn
+session that contains captured cookies for x.com.
+After import, all browser-path commands (timeline, search, bookmarks, etc.)
+will use these cookies for authentication.
+Examples:
+  $ vellum x login --recording /tmp/ride-shotgun/recording-abc123.json
+  $ vellum x login --recording ~/recordings/twitter-session.json`,
+    )
     .action(async (opts: { recording: string }, cmd: Command) => {
       await run(cmd, async () => {
         const session = importFromRecording(opts.recording);
@@ -140,6 +185,16 @@ export function registerTwitterCommand(program: Command): void {
   // =========================================================================
   tw.command("logout")
     .description("Clear the saved Twitter session")
+    .addHelpText(
+      "after",
+      `
+Deletes all saved browser session cookies. After logout, browser-path commands
+will fail until a new session is imported via "login" or captured via "refresh".
+OAuth credentials are not affected.
+Examples:
+  $ vellum x logout`,
+    )
     .action((_opts: unknown, cmd: Command) => {
       clearSession();
       output({ ok: true, message: "Session cleared" }, getJson(cmd));
@@ -155,6 +210,24 @@ export function registerTwitterCommand(program: Command): void {
         "NOTE: Chrome will restart with debugging enabled; your tabs will be restored.",
     )
     .option("--duration <seconds>", "Recording duration in seconds", "180")
+    .addHelpText(
+      "after",
+      `
+Restarts Chrome with CDP (Chrome DevTools Protocol) enabled, navigates to
+x.com/login, and runs a Ride Shotgun learn session to capture fresh cookies.
+Sign in when Chrome opens — the session will be recorded automatically.
+The --duration flag sets how long (in seconds) the recording runs before
+stopping. Default is 180 seconds (3 minutes). After the recording completes,
+cookies are imported automatically and Chrome is minimized.
+Requires the assistant to be running (Ride Shotgun runs via the assistant).
+Examples:
+  $ vellum x refresh
+  $ vellum x refresh --duration 120
+  $ vellum x refresh --duration 300`,
+    )
     .action(async (opts: { duration: string }, cmd: Command) => {
       const json = getJson(cmd);
       const duration = parseInt(opts.duration, 10);
@@ -166,7 +239,7 @@ export function registerTwitterCommand(program: Command): void {
           // Hide Chrome after capturing session
           try {
-            await minimizeChromeWindow();
+            await minimizeChromeWindow(); // uses default CDP port
           } catch {
             /* best-effort */
           }
@@ -201,6 +274,22 @@ export function registerTwitterCommand(program: Command): void {
   // =========================================================================
   tw.command("status")
     .description("Check Twitter session, OAuth, and strategy status")
+    .addHelpText(
+      "after",
+      `
+Shows the current state of both authentication paths:
+  Browser session — whether cookies are loaded, cookie count, import timestamp,
+    and the recording ID they came from.
+  OAuth — whether an OAuth credential is connected, the linked account, the
+    current strategy setting, and whether a strategy has been explicitly configured.
+If the assistant is not running, OAuth fields will be reported as undefined.
+Examples:
+  $ vellum x status
+  $ vellum x status --json`,
+    )
     .action(async (_opts: unknown, cmd: Command) => {
       const session = loadSession();
       const browserInfo: Record<string, unknown> = session
@@ -258,6 +347,26 @@ export function registerTwitterCommand(program: Command): void {
     .description(
       "Get or set the Twitter operation strategy (oauth, browser, auto)",
     )
+    .addHelpText(
+      "after",
+      `
+The strategy controls which authentication path is used for operations that
+support both OAuth and browser session:
+  oauth    — always use the official Twitter OAuth API. Fails if no OAuth
+             credential is connected. Best for reliable posting.
+  browser  — always use the browser session (captured cookies). Fails if no
+             session is loaded. Required for read-only endpoints not available
+             via OAuth (bookmarks, notifications, search).
+  auto     — try OAuth first, fall back to browser session. This is the default.
+Run without a subcommand to display the current strategy. Use "set" to change it.
+Examples:
+  $ vellum x strategy
+  $ vellum x strategy set oauth
+  $ vellum x strategy set auto`,
+    )
     .action(async (_opts: unknown, cmd: Command) => {
       const json = getJson(cmd);
       try {
@@ -279,6 +388,21 @@ export function registerTwitterCommand(program: Command): void {
     .command("set")
     .description("Set the Twitter operation strategy")
     .argument("<value>", "Strategy value: oauth, browser, or auto")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  value   Strategy to use: "oauth", "browser", or "auto"
+Sets the preferred strategy for Twitter operations that support dual-path
+routing. The setting is persisted by the assistant and applies to all subsequent
+operations until changed.
+Examples:
+  $ vellum x strategy set oauth
+  $ vellum x strategy set browser
+  $ vellum x strategy set auto`,
+    )
     .action(async (value: string, _opts: unknown, cmd: Command) => {
       const json = getJson(cmd);
       try {
@@ -311,6 +435,20 @@ export function registerTwitterCommand(program: Command): void {
   tw.command("post")
     .description("Post a tweet")
     .argument("<text>", "Tweet text")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  text   The tweet text to post (max 280 characters)
+Posts a new tweet using the routed dual-path system. The path used (oauth or
+browser) depends on the current strategy setting. The response includes the
+tweet ID, URL, and which path was used.
+Examples:
+  $ vellum x post "Hello world"
+  $ vellum x post "Check out this thread on AI agents" --json`,
+    )
     .action(async (text: string, _opts: unknown, cmd: Command) => {
       await run(cmd, async () => {
         const { result, pathUsed } = await routedPostTweet(text);
@@ -330,6 +468,21 @@ export function registerTwitterCommand(program: Command): void {
     .description("Reply to a tweet")
     .argument("<tweetUrl>", "Tweet URL or tweet ID")
     .argument("<text>", "Reply text")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  tweetUrl   Full tweet URL (e.g. https://x.com/user/status/123456) or a bare tweet ID
+  text       The reply text to post (max 280 characters)
+Posts a reply to the specified tweet. Accepts either a full tweet URL or a bare
+numeric tweet ID. The tweet ID is extracted from the last numeric segment of the
+URL. Uses the routed dual-path system based on the current strategy.
+Examples:
+  $ vellum x reply https://x.com/elonmusk/status/1234567890 "Great point!"
+  $ vellum x reply 1234567890 "Interesting thread"`,
+    )
     .action(
       async (tweetUrl: string, text: string, _opts: unknown, cmd: Command) => {
         await run(cmd, async () => {
@@ -359,6 +512,21 @@ export function registerTwitterCommand(program: Command): void {
     .description("Fetch a user's recent tweets")
     .argument("<screenName>", "Twitter screen name (without @)")
     .option("--count <n>", "Number of tweets to fetch", "20")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  screenName   Twitter screen name without the @ prefix (e.g. "elonmusk", not "@elonmusk")
+Fetches a user's recent tweets via the browser session. Resolves the screen name
+to a user ID first, then retrieves their tweet timeline. The --count flag controls
+how many tweets to return (default: 20).
+Examples:
+  $ vellum x timeline elonmusk
+  $ vellum x timeline vaborsh --count 50
+  $ vellum x timeline openai --count 10 --json`,
+    )
     .action(
       async (screenName: string, opts: { count: string }, cmd: Command) => {
         await run(cmd, async () => {
@@ -378,6 +546,22 @@ export function registerTwitterCommand(program: Command): void {
   tw.command("tweet")
     .description("Fetch a tweet and its reply thread")
     .argument("<tweetIdOrUrl>", "Tweet ID or URL")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  tweetIdOrUrl   A bare tweet ID (e.g. 1234567890) or a full tweet URL
+                 (e.g. https://x.com/user/status/1234567890)
+Fetches a single tweet and its reply thread via the browser session. The tweet
+ID is extracted from the last numeric segment of the input. Returns an array of
+tweets representing the conversation thread.
+Examples:
+  $ vellum x tweet 1234567890
+  $ vellum x tweet https://x.com/elonmusk/status/1234567890
+  $ vellum x tweet https://x.com/openai/status/9876543210 --json`,
+    )
     .action(async (tweetIdOrUrl: string, _opts: unknown, cmd: Command) => {
       await run(cmd, async () => {
         const idMatch = tweetIdOrUrl.match(/(\d+)\s*$/);
@@ -395,6 +579,26 @@ export function registerTwitterCommand(program: Command): void {
     .description("Search tweets")
     .argument("<query>", "Search query")
     .option("--product <type>", "Top, Latest, People, or Media", "Top")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  query   Twitter search query string. Supports Twitter search operators
+          (e.g. "from:user", "to:user", "min_faves:100", quoted phrases)
+The --product flag selects the search result type:
+  Top      — most relevant tweets (default)
+  Latest   — most recent tweets, reverse chronological
+  People   — user accounts matching the query
+  Media    — tweets containing images or video
+Uses the browser session path. Requires an active browser session.
+Examples:
+  $ vellum x search "AI agents"
+  $ vellum x search "from:elonmusk SpaceX" --product Latest
+  $ vellum x search "machine learning" --product Media --json`,
+    )
     .action(async (query: string, opts: { product: string }, cmd: Command) => {
       await run(cmd, async () => {
         const tweets = await searchTweets(
@@ -411,6 +615,20 @@ export function registerTwitterCommand(program: Command): void {
   tw.command("bookmarks")
     .description("Fetch your bookmarks")
     .option("--count <n>", "Number of bookmarks", "20")
+    .addHelpText(
+      "after",
+      `
+Fetches the authenticated user's bookmarked tweets via the browser session.
+The --count flag controls how many bookmarks to return (default: 20).
+Requires an active browser session. Bookmarks are private and only available
+for the logged-in account.
+Examples:
+  $ vellum x bookmarks
+  $ vellum x bookmarks --count 50
+  $ vellum x bookmarks --json`,
+    )
     .action(async (opts: { count: string }, cmd: Command) => {
       await run(cmd, async () => {
         const tweets = await getBookmarks(parseInt(opts.count, 10));
@@ -424,6 +642,19 @@ export function registerTwitterCommand(program: Command): void {
   tw.command("home")
     .description("Fetch your home timeline")
     .option("--count <n>", "Number of tweets", "20")
+    .addHelpText(
+      "after",
+      `
+Fetches the authenticated user's home timeline (the "For You" feed) via the
+browser session. The --count flag controls how many tweets to return (default: 20).
+Requires an active browser session.
+Examples:
+  $ vellum x home
+  $ vellum x home --count 50
+  $ vellum x home --json`,
+    )
     .action(async (opts: { count: string }, cmd: Command) => {
       await run(cmd, async () => {
         const tweets = await getHomeTimeline(parseInt(opts.count, 10));
@@ -437,6 +668,20 @@ export function registerTwitterCommand(program: Command): void {
   tw.command("notifications")
     .description("Fetch your notifications")
     .option("--count <n>", "Number of notifications", "20")
+    .addHelpText(
+      "after",
+      `
+Fetches the authenticated user's Twitter notifications (mentions, likes,
+retweets, follows, etc.) via the browser session. The --count flag controls
+how many notifications to return (default: 20).
+Requires an active browser session.
+Examples:
+  $ vellum x notifications
+  $ vellum x notifications --count 50
+  $ vellum x notifications --json`,
+    )
     .action(async (opts: { count: string }, cmd: Command) => {
       await run(cmd, async () => {
         const notifications = await getNotifications(parseInt(opts.count, 10));
@@ -451,6 +696,21 @@ export function registerTwitterCommand(program: Command): void {
     .description("Fetch a user's liked tweets")
     .argument("<screenName>", "Twitter screen name (without @)")
     .option("--count <n>", "Number of likes", "20")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  screenName   Twitter screen name without the @ prefix (e.g. "elonmusk", not "@elonmusk")
+Fetches tweets liked by the specified user via the browser session. Resolves the
+screen name to a user ID first. The --count flag controls how many liked tweets
+to return (default: 20).
+Examples:
+  $ vellum x likes elonmusk
+  $ vellum x likes vaborsh --count 50
+  $ vellum x likes openai --json`,
+    )
     .action(
       async (screenName: string, opts: { count: string }, cmd: Command) => {
         await run(cmd, async () => {
@@ -467,6 +727,19 @@ export function registerTwitterCommand(program: Command): void {
   tw.command("followers")
     .description("Fetch a user's followers")
     .argument("<screenName>", "Twitter screen name (without @)")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  screenName   Twitter screen name without the @ prefix (e.g. "elonmusk", not "@elonmusk")
+Fetches the list of accounts following the specified user via the browser session.
+Resolves the screen name to a user ID first.
+Examples:
+  $ vellum x followers elonmusk
+  $ vellum x followers vaborsh --json`,
+    )
     .action(async (screenName: string, _opts: unknown, cmd: Command) => {
       await run(cmd, async () => {
         const cleanName = screenName.replace(/^@/, "");
@@ -483,6 +756,21 @@ export function registerTwitterCommand(program: Command): void {
     .description("Fetch who a user follows")
     .argument("<screenName>", "Twitter screen name (without @)")
     .option("--count <n>", "Number of following", "20")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  screenName   Twitter screen name without the @ prefix (e.g. "elonmusk", not "@elonmusk")
+Fetches the list of accounts the specified user follows via the browser session.
+Resolves the screen name to a user ID first. The --count flag controls how many
+results to return (default: 20).
+Examples:
+  $ vellum x following elonmusk
+  $ vellum x following vaborsh --count 100
+  $ vellum x following openai --json`,
+    )
     .action(
       async (screenName: string, opts: { count: string }, cmd: Command) => {
         await run(cmd, async () => {
@@ -503,6 +791,21 @@ export function registerTwitterCommand(program: Command): void {
     .description("Fetch a user's media tweets")
     .argument("<screenName>", "Twitter screen name (without @)")
     .option("--count <n>", "Number of media tweets", "20")
+    .addHelpText(
+      "after",
+      `
+Arguments:
+  screenName   Twitter screen name without the @ prefix (e.g. "elonmusk", not "@elonmusk")
+Fetches tweets containing images or video from the specified user via the browser
+session. Resolves the screen name to a user ID first. The --count flag controls
+how many media tweets to return (default: 20).
+Examples:
+  $ vellum x media elonmusk
+  $ vellum x media nasa --count 50
+  $ vellum x media openai --json`,
+    )
     .action(
       async (screenName: string, opts: { count: string }, cmd: Command) => {
         await run(cmd, async () => {
@@ -613,108 +916,13 @@ function sendDaemonMessage(
 }
 // ---------------------------------------------------------------------------
-// Chrome CDP restart helper
+// Chrome CDP helpers (shared)
 // ---------------------------------------------------------------------------
-import { spawn as spawnChild } from "node:child_process";
-import { homedir } from "node:os";
-import { join as pathJoin } from "node:path";
-const CDP_BASE = "http://localhost:9222";
-const CHROME_DATA_DIR = pathJoin(
-  homedir(),
-  "Library/Application Support/Google/Chrome-CDP",
-);
-async function isCdpReady(): Promise<boolean> {
-  try {
-    const res = await fetch(`${CDP_BASE}/json/version`);
-    return res.ok;
-  } catch {
-    return false;
-  }
-}
-async function ensureChromeWithCDP(): Promise<void> {
-  // Already running with CDP?
-  if (await isCdpReady()) return;
-  // Launch a separate Chrome instance with CDP flags alongside any existing Chrome.
-  // Using a dedicated --user-data-dir allows coexistence without killing the user's browser.
-  const chromeApp =
-    "/Applications/Google Chrome.app/Contents/MacOS/Google Chrome";
-  spawnChild(
-    chromeApp,
-    [
-      `--remote-debugging-port=9222`,
-      `--force-renderer-accessibility`,
-      `--user-data-dir=${CHROME_DATA_DIR}`,
-      "https://x.com/login",
-    ],
-    {
-      detached: true,
-      stdio: "ignore",
-    },
-  ).unref();
-  // Wait for CDP to be ready
-  for (let i = 0; i < 30; i++) {
-    await new Promise((r) => setTimeout(r, 500));
-    if (await isCdpReady()) return;
-  }
-  throw new Error("Chrome started but CDP endpoint not responding after 15s");
-}
-async function minimizeChromeWindow(): Promise<void> {
-  const res = await fetch(`${CDP_BASE}/json/list`);
-  const targets = (await res.json()) as Array<{
-    type: string;
-    webSocketDebuggerUrl: string;
-  }>;
-  const pageTarget = targets.find((t) => t.type === "page");
-  if (!pageTarget) return;
-  const ws = new WebSocket(pageTarget.webSocketDebuggerUrl);
-  await new Promise<void>((resolve, reject) => {
-    const timeout = setTimeout(() => {
-      ws.close();
-      reject(new Error("CDP minimize timed out"));
-    }, 5000);
-    ws.addEventListener("open", () => {
-      ws.send(JSON.stringify({ id: 1, method: "Browser.getWindowForTarget" }));
-    });
-    ws.addEventListener("message", (event) => {
-      const msg = JSON.parse(String(event.data)) as {
-        id: number;
-        result?: { windowId: number };
-      };
-      if (msg.id === 1 && msg.result) {
-        ws.send(
-          JSON.stringify({
-            id: 2,
-            method: "Browser.setWindowBounds",
-            params: {
-              windowId: msg.result.windowId,
-              bounds: { windowState: "minimized" },
-            },
-          }),
-        );
-      } else if (msg.id === 2) {
-        clearTimeout(timeout);
-        ws.close();
-        resolve();
-      }
-    });
-    ws.addEventListener("error", (err) => {
-      clearTimeout(timeout);
-      reject(err);
-    });
-  });
-}
+import {
+  ensureChromeWithCdp,
+  minimizeChromeWindow,
+} from "../tools/browser/chrome-cdp.js";
 // ---------------------------------------------------------------------------
 // Ride Shotgun learn session helper
@@ -725,9 +933,9 @@ interface LearnResult {
   recordingPath?: string;
 }
-async function navigateToX(): Promise<void> {
+async function navigateToX(cdpBase: string): Promise<void> {
   try {
-    const res = await fetch(`${CDP_BASE}/json/list`);
+    const res = await fetch(`${cdpBase}/json/list`);
     if (!res.ok) return;
     const targets = (await res.json()) as Array<{
       id: string;
@@ -737,7 +945,7 @@ async function navigateToX(): Promise<void> {
     const tab = targets.find((t) => t.type === "page");
     if (!tab) return;
     await fetch(
-      `${CDP_BASE}/json/navigate?url=${encodeURIComponent(
+      `${cdpBase}/json/navigate?url=${encodeURIComponent(
         "https://x.com/login",
       )}&id=${tab.id}`,
       { method: "PUT" },
@@ -750,8 +958,10 @@ async function navigateToX(): Promise<void> {
 async function startLearnSession(
   durationSeconds: number,
 ): Promise<LearnResult> {
-  await ensureChromeWithCDP();
-  await navigateToX();
+  const cdpSession = await ensureChromeWithCdp({
+    startUrl: "https://x.com/login",
+  });
+  await navigateToX(cdpSession.baseUrl);
   return new Promise((resolve, reject) => {
     const socketPath = getSocketPath();
@@ -813,6 +1023,13 @@ async function startLearnSession(
           continue;
         }
+        if (m.type === "ride_shotgun_error") {
+          clearTimeout(timeoutHandle);
+          socket.destroy();
+          reject(new Error((m as { message: string }).message));
+          continue;
+        }
         if (m.type === "ride_shotgun_result") {
           clearTimeout(timeoutHandle);
           socket.destroy();

package/src/config/__tests__/build-cli-reference-section.test.ts ADDED Viewed

@@ -0,0 +1,49 @@
+/**
+ * Tests for buildCliReferenceSection — verifies the CLI reference section
+ * included in the system prompt has the expected structure and caching behaviour.
+ */
+import { beforeEach, describe, expect, test } from "bun:test";
+import {
+  _resetCliHelpCache,
+  buildCliReferenceSection,
+} from "../system-prompt.js";
+describe("buildCliReferenceSection", () => {
+  beforeEach(() => {
+    _resetCliHelpCache();
+  });
+  test("includes the Assistant CLI heading", () => {
+    const result = buildCliReferenceSection();
+    expect(result).toContain("## Assistant CLI");
+  });
+  test("includes CLI help text with command listings", () => {
+    const result = buildCliReferenceSection();
+    // The reference is a side-effect-free snapshot of the top-level CLI help.
+    expect(result).toContain("Usage:");
+    expect(result).toContain("Commands:");
+  });
+  test("mentions bash as the way to invoke the CLI", () => {
+    const result = buildCliReferenceSection();
+    expect(result).toContain("available via `bash`");
+  });
+  test("result is cached — calling twice returns the same string", () => {
+    const first = buildCliReferenceSection();
+    const second = buildCliReferenceSection();
+    expect(first).toBe(second);
+  });
+  test("cache is reset by _resetCliHelpCache", () => {
+    const first = buildCliReferenceSection();
+    _resetCliHelpCache();
+    const second = buildCliReferenceSection();
+    // Content should be identical even after reset (same CLI program),
+    // but they should be independently computed strings.
+    expect(first).toEqual(second);
+  });
+});

package/src/config/bundled-skills/amazon/SKILL.md CHANGED Viewed

@@ -2,7 +2,7 @@
 name: "Amazon"
 description: "Shop on Amazon and Amazon Fresh using the built-in CLI integration"
 user-invocable: true
-metadata: {"vellum": {"emoji": "\uD83D\uDCE6"}}
+metadata: { "vellum": { "emoji": "\uD83D\uDCE6" } }
 ---
 You can shop on Amazon (and Amazon Fresh for groceries) for the user using the `vellum amazon` CLI.
@@ -92,7 +92,7 @@ vellum amazon fresh select-slot --slot-id <id> --json
 vellum amazon payment-methods --json
 vellum amazon checkout --json
-vellum amazon order place [--payment-method-id <id>] [--slot-id <id>] --json
+vellum amazon order place [--payment-method-id <id>] --json
 ```
 ## Example Interactions

package/src/config/bundled-skills/app-builder/TOOLS.json CHANGED Viewed

@@ -326,6 +326,32 @@
       },
       "executor": "tools/app-file-write.ts",
       "execution_target": "host"
+    },
+    {
+      "name": "app_generate_icon",
+      "description": "Generate or regenerate an AI-designed icon for an app. Uses Gemini to create a professional app icon. Call this when the user wants a new or different icon for their app.",
+      "category": "apps",
+      "risk": "low",
+      "input_schema": {
+        "type": "object",
+        "properties": {
+          "app_id": {
+            "type": "string",
+            "description": "The ID of the app to generate an icon for"
+          },
+          "description": {
+            "type": "string",
+            "description": "Optional description to guide icon generation (e.g. 'a blue calendar with a checkmark'). If omitted, the app name and description are used."
+          },
+          "reason": {
+            "type": "string",
+            "description": "Brief non-technical explanation of why this tool is being called"
+          }
+        },
+        "required": ["app_id"]
+      },
+      "executor": "tools/app-generate-icon.ts",
+      "execution_target": "host"
     }
   ]
 }