npm - @steipete/oracle - Versions diffs - 0.12.0 → 0.13.0 - Mend

@steipete/oracle 0.12.0 → 0.13.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (25)

package/README.md +54 -54
package/dist/bin/oracle-cli.js +15 -6
package/dist/bin/oracle-mcp.js +0 -0
package/dist/src/browser/actions/modelSelection.js +126 -25
package/dist/src/browser/actions/navigation.js +89 -27
package/dist/src/browser/actions/promptComposer.js +196 -46
package/dist/src/browser/actions/thinkingTime.js +111 -12
package/dist/src/browser/config.js +2 -0
package/dist/src/browser/index.js +43 -4
package/dist/src/browser/providers/chatgptDomProvider.js +2 -0
package/dist/src/browser/reattachability.js +22 -0
package/dist/src/browser/sessionRunner.js +1 -0
package/dist/src/cli/bridge/doctor.js +7 -2
package/dist/src/cli/browserConfig.js +9 -1
package/dist/src/cli/browserDefaults.js +3 -0
package/dist/src/cli/engine.js +6 -2
package/dist/src/cli/options.js +4 -0
package/dist/src/cli/runOptions.js +9 -20
package/dist/src/cli/sessionDisplay.js +8 -0
package/dist/src/cli/sessionRunner.js +49 -5
package/dist/src/config.js +164 -9
package/dist/src/oracle/providerRoutePlan.js +29 -2
package/dist/src/oracle/run.js +50 -156
package/dist/src/sessionManager.js +38 -22
package/package.json +14 -13

package/README.md CHANGED

@@ -272,55 +272,55 @@ Browser automation can open or control Chrome, so dry-runs and live runs print a
 ## Flags you’ll actually use
-| Flag                                                            | Purpose                                                                                                                                                                                                                                                                                                                                   |
-| --------------------------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `-p, --prompt <text>`                                           | Required prompt.                                                                                                                                                                                                                                                                                                                          |
-| `-f, --file <paths...>`                                         | Attach files/dirs (globs + `!` excludes).                                                                                                                                                                                                                                                                                                 |
-| `-e, --engine <api\|browser>`                                   | Choose API or browser (browser is experimental).                                                                                                                                                                                                                                                                                          |
-| `-m, --model <name>`                                            | Built-ins (`gpt-5.5-pro` default, `gpt-5.5`, `gpt-5.4-pro`, `gpt-5.4`, `gpt-5.1-pro`, `gpt-5-pro`, `gpt-5.1`, `gpt-5.1-codex`, `gpt-5.2`, `gpt-5.2-instant`, `gpt-5.2-pro`, `gemini-3.1-pro` API-only, `gemini-3-pro`, `claude-4.6-sonnet`, `claude-4.1-opus`) plus any OpenRouter id (e.g., `minimax/minimax-m2`, `openai/gpt-4o-mini`). |
-| `--models <list>`                                               | Comma-separated API models (mix built-ins and OpenRouter ids) for multi-model runs.                                                                                                                                                                                                                                                       |
-| `--followup <sessionId\|responseId>`                            | Continue an OpenAI/Azure Responses API run from a stored oracle session or `resp_...` response id.                                                                                                                                                                                                                                        |
-| `--followup-model <model>`                                      | For multi-model OpenAI/Azure parent sessions, choose which model response to continue from.                                                                                                                                                                                                                                               |
-| `--base-url <url>`                                              | Point API runs at LiteLLM/Azure/OpenRouter/etc.                                                                                                                                                                                                                                                                                           |
-| `--chatgpt-url <url>`                                           | Target a ChatGPT workspace/folder or Temporary Chat URL (browser).                                                                                                                                                                                                                                                                        |
-| `--browser-model-strategy <select\|current\|ignore>`            | Control ChatGPT model selection in browser mode (current keeps the active model; ignore skips the picker).                                                                                                                                                                                                                                |
-| `--browser-manual-login`                                        | Skip cookie copy; reuse a persistent automation profile and wait for manual ChatGPT login.                                                                                                                                                                                                                                                |
-| `--browser-attach-running`                                      | Reuse your current local browser session through local `DevToolsActivePort` discovery; Oracle opens a dedicated tab instead of launching Chrome (defaults to `127.0.0.1:9222`, or combine with `--remote-chrome <host:port>` to hint a different local endpoint).                                                                         |
-| `--browser-tab <ref>`                                           | Reuse an existing ChatGPT tab by `current`, target id, URL, or title substring instead of opening a new tab.                                                                                                                                                                                                                              |
-| `--browser-thinking-time <light\|standard\|extended\|heavy>`    | Set ChatGPT thinking-time intensity (browser; Thinking/Pro models only).                                                                                                                                                                                                                                                                  |
-| `--browser-research deep`                                       | Activate ChatGPT Deep Research for broad web research and cited reports (browser only).                                                                                                                                                                                                                                                   |
-| `--browser-follow-up <prompt>`                                  | Browser-only multi-turn consult: submit an additional prompt in the same ChatGPT conversation after the initial answer. Repeat for challenge/revision/final-decision passes. Not supported with Deep Research mode.                                                                                                                       |
-| `--browser-archive <auto\|always\|never>`                       | Archive completed ChatGPT browser conversations after local artifacts are saved. `auto` archives successful one-shot chats only, and skips project, Deep Research, multi-turn, failed, and incomplete sessions.                                                                                                                           |
-| `--browser-attachments <auto\|never\|always>`                   | Control browser file delivery: `auto` pastes small text files inline and uploads larger bundles, `never` always pastes inline, and `always` uploads files as ChatGPT attachments.                                                                                                                                                         |
-| `--browser-bundle-files`, `--browser-bundle-format <text\|zip>` | Bundle browser uploads into one attachment. `text` keeps the existing single Markdown-style text bundle; `zip` preserves individual file names inside one ZIP upload.                                                                                                                                                                     |
-| `--browser-port <port>`                                         | Pin the Chrome DevTools port (WSL/Windows firewall helper).                                                                                                                                                                                                                                                                               |
-| `--browser-inline-cookies[(-file)] <payload \| path>`           | Supply cookies without Chrome/Keychain (browser).                                                                                                                                                                                                                                                                                         |
-| `--browser-timeout`, `--browser-input-timeout`                  | Control overall/browser input timeouts (supports h/m/s/ms).                                                                                                                                                                                                                                                                               |
-| `--browser-recheck-delay`, `--browser-recheck-timeout`          | Delayed recheck for long Pro runs: wait then retry capture after timeout (supports h/m/s/ms).                                                                                                                                                                                                                                             |
-| `--heartbeat <seconds>`                                         | Emit API and browser progress heartbeats. Browser mode reports ChatGPT Thinking/Reasoning sidecar liveness metadata when available, without logging reasoning text.                                                                                                                                                                       |
-| `--browser-reuse-wait`                                          | Wait for a shared Chrome profile before launching (parallel browser runs).                                                                                                                                                                                                                                                                |
-| `--browser-profile-lock-timeout`                                | Wait for the shared manual-login profile lock before sending (serializes parallel runs).                                                                                                                                                                                                                                                  |
-| `--browser-max-concurrent-tabs`                                 | Soft limit for simultaneous ChatGPT tabs sharing one manual-login profile (default 3).                                                                                                                                                                                                                                                    |
-| `--render`, `--copy`                                            | Print and/or copy the assembled markdown bundle.                                                                                                                                                                                                                                                                                          |
-| `--wait`                                                        | Block for background API runs (e.g., GPT‑5.1 Pro) instead of detaching.                                                                                                                                                                                                                                                                   |
-| `--timeout <seconds\|duration\|auto>`                           | Overall API deadline (auto = 60m for pro, 120s otherwise; durations like `10m` derive HTTP/stale-session timeouts unless overridden).                                                                                                                                                                                                     |
-| `--background`, `--no-background`                               | Force Responses API background mode (create + retrieve) for API runs.                                                                                                                                                                                                                                                                     |
-| `--http-timeout <ms\|s\|m\|h>`                                  | Override the HTTP client timeout; if omitted, explicit `--timeout` values are reused for transport.                                                                                                                                                                                                                                       |
-| `--zombie-timeout <ms\|s\|m\|h>`                                | Override stale-session cutoff used by `oracle status`.                                                                                                                                                                                                                                                                                    |
-| `--zombie-last-activity`                                        | Use last log activity to detect stale sessions.                                                                                                                                                                                                                                                                                           |
-| `--write-output <path>`                                         | Save only the final answer (multi-model adds `.<model>` and writes `<stem>.oracle.json`). Browser sessions also save transcripts and generated artifacts under `~/.oracle/sessions/<id>/artifacts/`.                                                                                                                                      |
-| `--allow-partial`, `--partial <fail\|ok>`                       | Multi-model failure policy. Default `fail` exits 1 after printing a structured partial summary; `ok` exits 0 when at least one model succeeds.                                                                                                                                                                                            |
-| `--preflight`                                                   | Check redacted provider readiness for requested API model(s), then exit without creating a session.                                                                                                                                                                                                                                       |
-| `--perf-trace`, `--perf-trace-path <path>`                      | Write startup/first-output timing trace JSON; also accepts `--perf-trace=/tmp/oracle.json`, `ORACLE_PERF_TRACE=1`, or `ORACLE_PERF_TRACE=/tmp/oracle.json`.                                                                                                                                                                               |
-| `--files-report`                                                | Print per-file token usage.                                                                                                                                                                                                                                                                                                               |
-| `--dry-run [summary\|json\|full]`                               | Preview without sending.                                                                                                                                                                                                                                                                                                                  |
-| `--remote-host`, `--remote-token`                               | Use a remote `oracle serve` host (browser).                                                                                                                                                                                                                                                                                               |
-| `--remote-chrome <host:port>`                                   | Attach to an existing remote Chrome session (browser), or when combined with `--browser-attach-running` use this host:port as the local attach hint.                                                                                                                                                                                      |
-| `--youtube <url>`                                               | YouTube video URL to analyze (Gemini browser mode).                                                                                                                                                                                                                                                                                       |
-| `--generate-image <file>`                                       | Generate image and save to file (Gemini browser mode; ChatGPT browser mode saves downloadable image artifacts when present). Extra ChatGPT images save as numbered siblings.                                                                                                                                                              |
-| `--edit-image <file>`                                           | Edit existing image with `--output` (Gemini browser mode). For ChatGPT browser mode, attach source images with `--file` and use `--generate-image` for the output path.                                                                                                                                                                   |
-| `--provider openai\|azure\|auto`, `--no-azure`, `--route`       | Choose or inspect API provider routing; `openai` / `--no-azure` ignores Azure env/config for the run.                                                                                                                                                                                                                                     |
-| `--azure-endpoint`, `--azure-deployment`, `--azure-api-version` | Target Azure OpenAI endpoints (picks Azure client automatically).                                                                                                                                                                                                                                                                         |
+| Flag                                                                           | Purpose                                                                                                                                                                                                                                                                                                                                   |
+| ------------------------------------------------------------------------------ | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `-p, --prompt <text>`                                                          | Required prompt.                                                                                                                                                                                                                                                                                                                          |
+| `-f, --file <paths...>`                                                        | Attach files/dirs (globs + `!` excludes).                                                                                                                                                                                                                                                                                                 |
+| `-e, --engine <api\|browser>`                                                  | Choose API or browser (browser is experimental).                                                                                                                                                                                                                                                                                          |
+| `-m, --model <name>`                                                           | Built-ins (`gpt-5.5-pro` default, `gpt-5.5`, `gpt-5.4-pro`, `gpt-5.4`, `gpt-5.1-pro`, `gpt-5-pro`, `gpt-5.1`, `gpt-5.1-codex`, `gpt-5.2`, `gpt-5.2-instant`, `gpt-5.2-pro`, `gemini-3.1-pro` API-only, `gemini-3-pro`, `claude-4.6-sonnet`, `claude-4.1-opus`) plus any OpenRouter id (e.g., `minimax/minimax-m2`, `openai/gpt-4o-mini`). |
+| `--models <list>`                                                              | Comma-separated API models (mix built-ins and OpenRouter ids) for multi-model runs.                                                                                                                                                                                                                                                       |
+| `--followup <sessionId\|responseId>`                                           | Continue an OpenAI/Azure Responses API run from a stored oracle session or `resp_...` response id.                                                                                                                                                                                                                                        |
+| `--followup-model <model>`                                                     | For multi-model OpenAI/Azure parent sessions, choose which model response to continue from.                                                                                                                                                                                                                                               |
+| `--base-url <url>`                                                             | Point API runs at LiteLLM/Azure/OpenRouter/etc.                                                                                                                                                                                                                                                                                           |
+| `--chatgpt-url <url>`                                                          | Target a ChatGPT workspace/folder or Temporary Chat URL (browser).                                                                                                                                                                                                                                                                        |
+| `--browser-model-strategy <select\|current\|ignore>`                           | Control ChatGPT model selection in browser mode (current keeps the active model; ignore skips the picker).                                                                                                                                                                                                                                |
+| `--browser-manual-login`                                                       | Skip cookie copy; reuse a persistent automation profile and wait for manual ChatGPT login.                                                                                                                                                                                                                                                |
+| `--browser-attach-running`                                                     | Reuse your current local browser session through local `DevToolsActivePort` discovery; Oracle opens a dedicated tab instead of launching Chrome (defaults to `127.0.0.1:9222`, or combine with `--remote-chrome <host:port>` to hint a different local endpoint).                                                                         |
+| `--browser-tab <ref>`                                                          | Reuse an existing ChatGPT tab by `current`, target id, URL, or title substring instead of opening a new tab.                                                                                                                                                                                                                              |
+| `--browser-thinking-time <light\|standard\|extended\|heavy>`                   | Set ChatGPT thinking-time intensity (browser; Thinking/Pro models only).                                                                                                                                                                                                                                                                  |
+| `--browser-research deep`                                                      | Activate ChatGPT Deep Research for broad web research and cited reports (browser only).                                                                                                                                                                                                                                                   |
+| `--browser-follow-up <prompt>`                                                 | Browser-only multi-turn consult: submit an additional prompt in the same ChatGPT conversation after the initial answer. Repeat for challenge/revision/final-decision passes. Not supported with Deep Research mode.                                                                                                                       |
+| `--browser-archive <auto\|always\|never>`                                      | Archive completed ChatGPT browser conversations after local artifacts are saved. `auto` archives successful one-shot chats only, and skips project, Deep Research, multi-turn, failed, and incomplete sessions.                                                                                                                           |
+| `--browser-attachments <auto\|never\|always>`                                  | Control browser file delivery: `auto` pastes small text files inline and uploads larger bundles, `never` always pastes inline, and `always` uploads files as ChatGPT attachments.                                                                                                                                                         |
+| `--browser-bundle-files`, `--browser-bundle-format <text\|zip>`                | Bundle browser uploads into one attachment. `text` keeps the existing single Markdown-style text bundle; `zip` preserves individual file names inside one ZIP upload.                                                                                                                                                                     |
+| `--browser-port <port>`                                                        | Pin the Chrome DevTools port (WSL/Windows firewall helper).                                                                                                                                                                                                                                                                               |
+| `--browser-inline-cookies[(-file)] <payload \| path>`                          | Supply cookies without Chrome/Keychain (browser).                                                                                                                                                                                                                                                                                         |
+| `--browser-timeout`, `--browser-input-timeout`, `--browser-attachment-timeout` | Control overall/browser input/attachment readiness timeouts (supports h/m/s/ms).                                                                                                                                                                                                                                                          |
+| `--browser-recheck-delay`, `--browser-recheck-timeout`                         | Delayed recheck for long Pro runs: wait then retry capture after timeout (supports h/m/s/ms).                                                                                                                                                                                                                                             |
+| `--heartbeat <seconds>`                                                        | Emit API and browser progress heartbeats. Browser mode reports ChatGPT Thinking/Reasoning sidecar liveness metadata when available, without logging reasoning text.                                                                                                                                                                       |
+| `--browser-reuse-wait`                                                         | Wait for a shared Chrome profile before launching (parallel browser runs).                                                                                                                                                                                                                                                                |
+| `--browser-profile-lock-timeout`                                               | Wait for the shared manual-login profile lock before sending (serializes parallel runs).                                                                                                                                                                                                                                                  |
+| `--browser-max-concurrent-tabs`                                                | Soft limit for simultaneous ChatGPT tabs sharing one manual-login profile (default 3).                                                                                                                                                                                                                                                    |
+| `--render`, `--copy`                                                           | Print and/or copy the assembled markdown bundle.                                                                                                                                                                                                                                                                                          |
+| `--wait`                                                                       | Block for background API runs (e.g., GPT‑5.1 Pro) instead of detaching.                                                                                                                                                                                                                                                                   |
+| `--timeout <seconds\|duration\|auto>`                                          | Overall API deadline (auto = 60m for pro, 120s otherwise; durations like `10m` derive HTTP/stale-session timeouts unless overridden).                                                                                                                                                                                                     |
+| `--background`, `--no-background`                                              | Force Responses API background mode (create + retrieve) for API runs.                                                                                                                                                                                                                                                                     |
+| `--http-timeout <ms\|s\|m\|h>`                                                 | Override the HTTP client timeout; if omitted, explicit `--timeout` values are reused for transport.                                                                                                                                                                                                                                       |
+| `--zombie-timeout <ms\|s\|m\|h>`                                               | Override stale-session cutoff used by `oracle status`.                                                                                                                                                                                                                                                                                    |
+| `--zombie-last-activity`                                                       | Use last log activity to detect stale sessions.                                                                                                                                                                                                                                                                                           |
+| `--write-output <path>`                                                        | Save only the final answer (multi-model adds `.<model>` and writes `<stem>.oracle.json`). Browser sessions also save transcripts and generated artifacts under `~/.oracle/sessions/<id>/artifacts/`.                                                                                                                                      |
+| `--allow-partial`, `--partial <fail\|ok>`                                      | Multi-model failure policy. Default `fail` exits 1 after printing a structured partial summary; `ok` exits 0 when at least one model succeeds.                                                                                                                                                                                            |
+| `--preflight`                                                                  | Check redacted provider readiness for requested API model(s), then exit without creating a session.                                                                                                                                                                                                                                       |
+| `--perf-trace`, `--perf-trace-path <path>`                                     | Write startup/first-output timing trace JSON; also accepts `--perf-trace=/tmp/oracle.json`, `ORACLE_PERF_TRACE=1`, or `ORACLE_PERF_TRACE=/tmp/oracle.json`.                                                                                                                                                                               |
+| `--files-report`                                                               | Print per-file token usage.                                                                                                                                                                                                                                                                                                               |
+| `--dry-run [summary\|json\|full]`                                              | Preview without sending.                                                                                                                                                                                                                                                                                                                  |
+| `--remote-host`, `--remote-token`                                              | Use a remote `oracle serve` host (browser).                                                                                                                                                                                                                                                                                               |
+| `--remote-chrome <host:port>`                                                  | Attach to an existing remote Chrome session (browser), or when combined with `--browser-attach-running` use this host:port as the local attach hint.                                                                                                                                                                                      |
+| `--youtube <url>`                                                              | YouTube video URL to analyze (Gemini browser mode).                                                                                                                                                                                                                                                                                       |
+| `--generate-image <file>`                                                      | Generate image and save to file (Gemini browser mode; ChatGPT browser mode saves downloadable image artifacts when present). Extra ChatGPT images save as numbered siblings.                                                                                                                                                              |
+| `--edit-image <file>`                                                          | Edit existing image with `--output` (Gemini browser mode). For ChatGPT browser mode, attach source images with `--file` and use `--generate-image` for the output path.                                                                                                                                                                   |
+| `--provider openai\|azure\|auto`, `--no-azure`, `--route`                      | Choose or inspect API provider routing; `openai` / `--no-azure` ignores Azure env/config for the run.                                                                                                                                                                                                                                     |
+| `--azure-endpoint`, `--azure-deployment`, `--azure-api-version`                | Target Azure OpenAI endpoints (picks Azure client automatically).                                                                                                                                                                                                                                                                         |
 ## Configuration
@@ -345,11 +345,11 @@ When several agents share one manual-login ChatGPT profile, Oracle coordinates b
 Advanced flags
-| Area         | Flags                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                       |
-| ------------ | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| Browser      | `--browser-manual-login`, `--browser-attach-running`, `--browser-thinking-time`, `--browser-research`, `--browser-follow-up`, `--browser-archive`, `--browser-timeout`, `--browser-input-timeout`, `--browser-recheck-delay`, `--browser-recheck-timeout`, `--browser-reuse-wait`, `--browser-profile-lock-timeout`, `--browser-max-concurrent-tabs`, `--browser-auto-reattach-delay`, `--browser-auto-reattach-interval`, `--browser-auto-reattach-timeout`, `--browser-cookie-wait`, `--browser-inline-cookies[(-file)]`, `--browser-attachments`, `--browser-inline-files`, `--browser-bundle-files`, `--browser-bundle-format`, `--browser-keep-browser`, `--browser-headless`, `--browser-hide-window`, `--browser-no-cookie-sync`, `--browser-allow-cookie-errors`, `--browser-chrome-path`, `--browser-cookie-path`, `--chatgpt-url` |
-| Run control  | `--background`, `--no-background`, `--http-timeout`, `--zombie-timeout`, `--zombie-last-activity`                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                           |
-| Azure/OpenAI | `--azure-endpoint`, `--azure-deployment`, `--azure-api-version`, `--base-url`                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                               |
+| Area         | Flags                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                       |
+| ------------ | --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| Browser      | `--browser-manual-login`, `--browser-attach-running`, `--browser-thinking-time`, `--browser-research`, `--browser-follow-up`, `--browser-archive`, `--browser-timeout`, `--browser-input-timeout`, `--browser-attachment-timeout`, `--browser-recheck-delay`, `--browser-recheck-timeout`, `--browser-reuse-wait`, `--browser-profile-lock-timeout`, `--browser-max-concurrent-tabs`, `--browser-auto-reattach-delay`, `--browser-auto-reattach-interval`, `--browser-auto-reattach-timeout`, `--browser-cookie-wait`, `--browser-inline-cookies[(-file)]`, `--browser-attachments`, `--browser-inline-files`, `--browser-bundle-files`, `--browser-bundle-format`, `--browser-keep-browser`, `--browser-headless`, `--browser-hide-window`, `--browser-no-cookie-sync`, `--browser-allow-cookie-errors`, `--browser-chrome-path`, `--browser-cookie-path`, `--chatgpt-url` |
+| Run control  | `--background`, `--no-background`, `--http-timeout`, `--zombie-timeout`, `--zombie-last-activity`                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                           |
+| Azure/OpenAI | `--azure-endpoint`, `--azure-deployment`, `--azure-api-version`, `--base-url`                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                               |
 Remote browser example

package/dist/bin/oracle-cli.js CHANGED Viewed

@@ -304,6 +304,7 @@ program
     .addOption(new Option("--browser-url <url>", `Alias for --chatgpt-url (default ${CHATGPT_URL}).`).hideHelp())
     .addOption(new Option("--browser-timeout <ms|s|m>", "Maximum time to wait for an answer (default 1200s / 20m).").hideHelp())
     .addOption(new Option("--browser-input-timeout <ms|s|m>", "Maximum time to wait for the prompt textarea (default 60s).").hideHelp())
+    .addOption(new Option("--browser-attachment-timeout <ms|s|m>", "Maximum time to wait for attachment upload/readiness before clicking send (default 45s).").hideHelp())
     .addOption(new Option("--browser-recheck-delay <ms|s|m|h>", "After an assistant timeout, wait this long then revisit the conversation to retry capture.").hideHelp())
     .addOption(new Option("--browser-recheck-timeout <ms|s|m|h>", "Time budget for the delayed recheck attempt (default 120s).").hideHelp())
     .addOption(new Option("--browser-reuse-wait <ms|s|m|h>", "Wait for a shared Chrome profile to appear before launching a new one (helps parallel runs).").hideHelp())
@@ -1096,19 +1097,21 @@ async function runRootCommand(options) {
         Boolean(options.azureEndpoint?.trim()) &&
         engineModels.some((model) => isAzureOpenAICandidateModel(model));
     const explicitApiProviderRequested = providerMode !== "auto" || hasExplicitAzureOption(optionUsesDefault);
-    const preferredEngine = options.engine ?? (explicitApiProviderRequested ? undefined : userConfig.engine);
+    const envEnginePreference = (process.env.ORACLE_ENGINE ?? "").trim().toLowerCase();
+    const explicitApiEngineRequested = options.engine === "api" || (!options.engine && envEnginePreference === "api");
+    const configBrowserEngineRequested = userConfig.engine === "browser" && !explicitApiEngineRequested && !explicitApiProviderRequested;
     let engine = resolveEngine({
-        engine: preferredEngine,
+        engine: options.engine,
+        configEngine: userConfig.engine,
         browserFlag: options.browser,
         apiProviderRequested: explicitApiProviderRequested,
         env: process.env,
     });
-    const envEnginePreference = (process.env.ORACLE_ENGINE ?? "").trim().toLowerCase();
     const browserEngineRequested = options.browser ||
         options.engine === "browser" ||
         Boolean(remoteHost) ||
-        (!explicitApiProviderRequested &&
-            (userConfig.engine === "browser" || envEnginePreference === "browser"));
+        configBrowserEngineRequested ||
+        (!options.engine && !explicitApiProviderRequested && envEnginePreference === "browser");
     if (azureAutoApiRequested && engine === "browser" && !browserEngineRequested) {
         engine = "api";
     }
@@ -1165,7 +1168,7 @@ async function runRootCommand(options) {
     }
     const resolvedModel = normalizedMultiModels[0] ?? (isGemini ? resolveApiModel(cliModelArg) : resolvedModelCandidate);
     const includesGeminiApiOnly = (normalizedMultiModels.length > 0 ? normalizedMultiModels : [resolvedModel]).some((model) => model === "gemini-3.1-pro");
-    if ((userForcedBrowser || userConfig.engine === "browser") && includesGeminiApiOnly) {
+    if (browserExplicitlyRequested && includesGeminiApiOnly) {
         throw new Error("gemini-3.1-pro is API-only today. Use --engine api or switch to gemini-3-pro for Gemini web.");
     }
     if (engine === "browser" && includesGeminiApiOnly) {
@@ -1271,6 +1274,12 @@ async function runRootCommand(options) {
     const getSource = (key) => program.getOptionValueSource?.(key) ?? undefined;
     const { applyBrowserDefaultsFromConfig } = await import("../src/cli/browserDefaults.js");
     applyBrowserDefaultsFromConfig(options, userConfig, getSource);
+    const attachmentTimeoutEnv = process.env.ORACLE_BROWSER_ATTACHMENT_TIMEOUT?.trim();
+    if (attachmentTimeoutEnv &&
+        (getSource("browserAttachmentTimeout") === undefined ||
+            getSource("browserAttachmentTimeout") === "default")) {
+        options.browserAttachmentTimeout = attachmentTimeoutEnv;
+    }
     const sessionMode = engine === "browser" ? "browser" : "api";
     const browserConfig = await (async () => {
         if (sessionMode !== "browser")

package/dist/bin/oracle-mcp.js CHANGED Viewed

File without changes

package/dist/src/browser/actions/modelSelection.js CHANGED Viewed

@@ -59,7 +59,7 @@ function assertResolvedModelSelection(desiredModel, resolvedLabel) {
     }
     if (!hasCurrentProSignal(resolved) ||
         hasLegacyProVersionLabel(resolved) ||
-        (resolved.includes("thinking") && !resolved.includes("pro"))) {
+        resolved.includes("thinking")) {
         throw new Error(`Model picker selected "${resolvedLabel}" while "${desiredModel}" requires GPT-5.5 Pro. Use model "gpt-5.5" with browser thinking time for the Thinking variant.`);
     }
 }
@@ -70,12 +70,7 @@ function normalizeResolvedModelLabel(value) {
         .trim();
 }
 function hasCurrentProSignal(resolved) {
-    return (resolved.includes(" pro") ||
-        resolved.endsWith("pro") ||
-        resolved.includes("pro ") ||
-        resolved.includes("extended") ||
-        resolved.includes("gpt-5.5-pro") ||
-        resolved.includes("gpt 5 5 pro"));
+    return normalizeResolvedModelLabel(resolved).split(" ").includes("pro");
 }
 function hasLegacyProVersionLabel(resolved) {
     const normalized = normalizeResolvedModelLabel(resolved);
@@ -128,6 +123,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
         .replace(/\\s+/g, ' ')
         .trim();
     };
+    const hasToken = (value, token) => normalizeText(value).split(' ').includes(token);
     // Normalize every candidate token to keep fuzzy matching deterministic.
     const normalizedTarget = normalizeText(PRIMARY_LABEL);
     const normalizedTokens = Array.from(new Set([normalizedTarget, ...LABEL_TOKENS]))
@@ -173,10 +169,43 @@ function buildModelSelectionExpression(targetModel, strategy) {
       return false;
     };
     const hasProComposerPill = () => Boolean(
-      document.querySelector('button.__composer-pill, button[aria-label="Pro, click to remove"]')
+      Array.from(document.querySelectorAll('button.__composer-pill, button[aria-label]'))
+        .filter((node) => {
+          const label = normalizeText(node.getAttribute?.('aria-label') ?? '');
+          return node.matches?.('button.__composer-pill') || label.includes('click to remove');
+        })
+        .some((node) => {
+          const label = normalizeText(
+            (node.getAttribute?.('aria-label') ?? '') + ' ' + (node.textContent ?? '')
+          );
+          return hasToken(label, 'pro') && !hasToken(label, 'thinking');
+        })
     );
-    const button = document.querySelector(BUTTON_SELECTOR);
+    const isVisibleElement = (node) => {
+      if (!(node instanceof HTMLElement)) return false;
+      const rect = node.getBoundingClientRect();
+      const style = window.getComputedStyle(node);
+      return rect.width > 0 && rect.height > 0 && style.display !== 'none' && style.visibility !== 'hidden';
+    };
+    const looksLikeModelPill = (node) => {
+      if (!(node instanceof HTMLElement) || !node.matches('button.__composer-pill')) return false;
+      if (!isVisibleElement(node)) return false;
+      const label = normalizeText(
+        (node.textContent ?? '') + ' ' + (node.getAttribute('aria-label') ?? '') + ' ' + (node.getAttribute('title') ?? '')
+      );
+      if (!label) return false;
+      if (label.includes('click to remove')) return false;
+      const modelTokens = ['chatgpt', 'gpt', 'instant', 'thinking', 'pro', 'extended', 'standard', 'heavy', 'light'];
+      return modelTokens.some((token) => hasToken(label, token));
+    };
+    const findModelButton = () => {
+      const explicit = document.querySelector(BUTTON_SELECTOR);
+      if (explicit) return explicit;
+      return Array.from(document.querySelectorAll('button.__composer-pill')).find(looksLikeModelPill) ?? null;
+    };
+    const button = findModelButton();
     if (!button) {
       return { status: 'button-missing' };
     }
@@ -209,11 +238,15 @@ function buildModelSelectionExpression(targetModel, strategy) {
       const resolved = label || '';
       if (!wantsPro || !hasProComposerPill()) return resolved;
       const normalized = normalizeText(resolved);
-      if (!normalized || normalized.includes('pro')) return resolved;
+      if (!normalized) return resolved;
+      if (normalized.includes('thinking')) return 'Pro';
+      if (normalized.includes('pro')) return resolved;
       return resolved + ' + Pro';
     };
     const getResolvedLabel = (fallback) =>
       withProPillSignal(getComposerModelLabel() || getButtonLabel() || fallback);
+    const isThinkingEffortLabel = (label) =>
+      label === 'extended' || label === 'standard' || label === 'heavy' || label === 'light';
     if (MODEL_STRATEGY === 'current') {
       const currentLabel = getResolvedLabel(PRIMARY_LABEL);
       return {
@@ -225,7 +258,24 @@ function buildModelSelectionExpression(targetModel, strategy) {
       const normalizedLabel = normalizeText(getButtonLabel());
       if (!normalizedLabel) return false;
       if (isTargetGpt55VisibleAlias(normalizedLabel)) return true;
-      if (wantsPro && normalizedLabel === 'chatgpt' && hasProComposerPill()) {
+      if (
+        wantsThinking &&
+        desiredVersion === '5-5' &&
+        !hasProComposerPill() &&
+        isThinkingEffortLabel(normalizedLabel) &&
+        isTargetGpt55VisibleAlias(readComposerModelSignal())
+      ) {
+        return true;
+      }
+      if (
+        wantsPro &&
+        hasProComposerPill() &&
+        (normalizedLabel === 'chatgpt' ||
+          normalizedLabel === 'extended' ||
+          normalizedLabel === 'standard' ||
+          normalizedLabel === 'heavy' ||
+          normalizedLabel === 'light')
+      ) {
         return true;
       }
       if (desiredVersion) {
@@ -238,6 +288,14 @@ function buildModelSelectionExpression(targetModel, strategy) {
       if (wantsPro && labelHasLegacyProVersion(normalizedLabel)) return false;
       if (wantsPro && !labelHasProWord(normalizedLabel)) return false;
       if (wantsInstant && !normalizedLabel.includes('instant')) return false;
+      if (
+        wantsThinking &&
+        desiredVersion === '5-4' &&
+        !normalizedLabel.includes('pro') &&
+        !normalizedLabel.includes('instant')
+      ) {
+        return true;
+      }
       if (wantsThinking && !normalizedLabel.includes('thinking')) return false;
       // Also reject if button has variants we DON'T want
       if (!wantsPro && normalizedLabel.includes(' pro')) return false;
@@ -319,9 +377,6 @@ function buildModelSelectionExpression(targetModel, strategy) {
       if (dataSelected === 'true' || selectedStates.includes(dataState)) {
         return true;
       }
-      if (node.querySelector('[data-testid*="check"], [role="img"][data-icon="check"], svg[data-icon="check"], .trailing svg')) {
-        return true;
-      }
       return false;
     };
@@ -332,6 +387,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
       }
       let score = 0;
       const normalizedTestId = (testid ?? '').toLowerCase();
+      let exactTestIdMatch = false;
       if (normalizedTestId) {
         if (desiredVersion) {
           // data-testid strings have been observed with both dotted and dashed versions (e.g. gpt-5.2-pro vs gpt-5-2-pro).
@@ -378,6 +434,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
         // Exact testid matches take priority over substring matches
         const exactMatch = TEST_IDS.find((id) => id && normalizedTestId === id);
         if (exactMatch) {
+          exactTestIdMatch = true;
           score += 1500;
           if (exactMatch.startsWith('model-switcher-')) score += 200;
         } else {
@@ -394,17 +451,22 @@ function buildModelSelectionExpression(targetModel, strategy) {
       }
       const candidateGpt55VisibleAlias = isTargetGpt55VisibleAlias(normalizedText);
       const candidateHasThinking =
-        normalizedText.includes('thinking') || normalizedTestId.includes('thinking');
+        normalizedText.includes('thinking') ||
+        normalizedTestId.includes('thinking') ||
+        (wantsThinking && desiredVersion === '5-4' && exactTestIdMatch);
       const candidateHasLegacyProVersion = labelHasLegacyProVersion(normalizedText);
       const candidateHasPro =
-        candidateGpt55VisibleAlias ||
         labelHasProWord(normalizedText) ||
         normalizedText.includes('proresearch') ||
         normalizedTestId.includes('pro');
+      const candidateHasInstant =
+        normalizedText.includes('instant') || normalizedTestId.includes('instant');
       if (wantsPro && candidateHasThinking) return 0;
       if (wantsPro && candidateHasLegacyProVersion) return 0;
       if (wantsPro && !candidateHasPro) return 0;
+      if (wantsInstant && !candidateHasInstant) return 0;
       if (wantsThinking && candidateHasPro) return 0;
+      if (wantsThinking && !candidateHasThinking) return 0;
       if (desiredVersion === '5-5' && normalizedText && !candidateGpt55VisibleAlias) {
         const candidateHasVersion =
           normalizedText.includes('5 5') ||
@@ -470,10 +532,35 @@ function buildModelSelectionExpression(targetModel, strategy) {
       return Math.max(score, 0);
     };
+    const hasModelSwitcherItem = (node) =>
+      Boolean(node?.querySelector?.('[data-testid^="model-switcher-"]'));
+    const hasModelLikeMenuText = (node) => {
+      const text = normalizeText(node?.textContent ?? '');
+      return (
+        text.includes('instant') ||
+        text.includes('thinking') ||
+        labelHasProWord(text) ||
+        text.includes('5 5') ||
+        text.includes('5 4') ||
+        text.includes('5 2') ||
+        text.includes('gpt 5') ||
+        text.includes('gpt5')
+      );
+    };
+    const queryPickerMenus = () => {
+      const menus = Array.from(document.querySelectorAll(${menuContainerLiteral}));
+      const pickerMenus = menus.filter(hasModelSwitcherItem);
+      if (pickerMenus.length === 0) return menus;
+      const textFallbackMenus = menus.filter(
+        (menu) => !pickerMenus.includes(menu) && hasModelLikeMenuText(menu),
+      );
+      return pickerMenus.concat(textFallbackMenus);
+    };
     const findBestOption = () => {
       // Walk through every menu item and keep whichever earns the highest score.
       let bestMatch = null;
-      const menus = Array.from(document.querySelectorAll(${menuContainerLiteral}));
+      const menus = queryPickerMenus();
       for (const menu of menus) {
         const buttons = Array.from(menu.querySelectorAll(${menuItemLiteral}));
         for (const option of buttons) {
@@ -502,6 +589,16 @@ function buildModelSelectionExpression(targetModel, strategy) {
           resolve('target');
           return;
         }
+        const currentButtonLabel = normalizeText(getButtonLabel());
+        if (
+          wantsInstant &&
+          desiredVersion === '5-5' &&
+          currentButtonLabel === 'instant' &&
+          currentButtonLabel !== previousButtonLabel
+        ) {
+          resolve('target');
+          return;
+        }
         if (selectionStateChanged(previousButtonLabel, previousComposerSignal)) {
           resolve('changed');
           return;
@@ -529,10 +626,8 @@ function buildModelSelectionExpression(targetModel, strategy) {
         return body.includes('temporary chat');
       };
       const collectAvailableOptions = () => {
-        const menuRoots = Array.from(document.querySelectorAll(${menuContainerLiteral}));
-        const nodes = menuRoots.length > 0
-          ? menuRoots.flatMap((root) => Array.from(root.querySelectorAll(${menuItemLiteral})))
-          : Array.from(document.querySelectorAll(${menuItemLiteral}));
+        const menuRoots = queryPickerMenus();
+        const nodes = menuRoots.flatMap((root) => Array.from(root.querySelectorAll(${menuItemLiteral})));
         const labels = nodes
           .map((node) => (node?.textContent ?? '').trim())
           .filter(Boolean)
@@ -540,7 +635,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
         return labels.slice(0, 12);
       };
       const ensureMenuOpen = () => {
-        const menuOpen = document.querySelector('[role="menu"], [data-radix-collection-root]');
+        const menuOpen = queryPickerMenus().length > 0;
         if (!menuOpen && performance.now() - lastPointerClick > REOPEN_INTERVAL_MS) {
           pointerClick();
         }
@@ -558,7 +653,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
         ensureMenuOpen();
         const match = findBestOption();
         if (match) {
-          if (activeSelectionMatchesTarget()) {
+          if (optionIsSelected(match.node) || activeSelectionMatchesTarget()) {
             closeMenu();
             resolve({ status: 'already-selected', label: getResolvedLabel(match.label) });
             return;
@@ -614,7 +709,7 @@ function buildComposerSignalMatchers(targetModel) {
         return { includesAny: ["thinking"], excludesAny: ["pro"], allowBlank: false };
     }
     if (normalized.includes("instant")) {
-        return { includesAny: [], excludesAny: ["thinking", "pro"], allowBlank: true };
+        return { includesAny: ["instant"], excludesAny: ["thinking", "pro"], allowBlank: false };
     }
     return { includesAny: [], excludesAny: ["thinking", "pro"], allowBlank: true };
 }
@@ -657,7 +752,13 @@ function buildModelMatchersLiteral(targetModel) {
             testIdTokens.add("gpt-5-5-thinking");
             testIdTokens.add("gpt-5.5-thinking");
         }
-        if (!base.includes("pro") && !base.includes("thinking")) {
+        if (base.includes("instant")) {
+            push("instant", labelTokens);
+            testIdTokens.add("model-switcher-gpt-5-5-instant");
+            testIdTokens.add("gpt-5-5-instant");
+            testIdTokens.add("gpt-5.5-instant");
+        }
+        if (!base.includes("pro") && !base.includes("thinking") && !base.includes("instant")) {
             testIdTokens.add("model-switcher-gpt-5-5");
         }
         testIdTokens.add("gpt-5-5");