npm - @steipete/oracle - Versions diffs - 0.8.6 → 0.9.0 - Mend

@steipete/oracle 0.8.6 → 0.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

package/README.md +76 -4
package/dist/bin/oracle-cli.js +188 -7
package/dist/src/browser/actions/modelSelection.js +60 -8
package/dist/src/browser/actions/navigation.js +2 -1
package/dist/src/browser/constants.js +1 -1
package/dist/src/browser/index.js +73 -19
package/dist/src/browser/providerDomFlow.js +17 -0
package/dist/src/browser/providers/chatgptDomProvider.js +49 -0
package/dist/src/browser/providers/geminiDeepThinkDomProvider.js +245 -0
package/dist/src/browser/providers/index.js +2 -0
package/dist/src/cli/browserConfig.js +12 -6
package/dist/src/cli/detach.js +5 -2
package/dist/src/cli/fileSize.js +11 -0
package/dist/src/cli/help.js +3 -3
package/dist/src/cli/markdownBundle.js +5 -1
package/dist/src/cli/options.js +40 -3
package/dist/src/cli/runOptions.js +11 -3
package/dist/src/cli/sessionDisplay.js +91 -2
package/dist/src/cli/sessionLineage.js +56 -0
package/dist/src/cli/sessionRunner.js +20 -2
package/dist/src/cli/sessionTable.js +2 -1
package/dist/src/cli/tui/index.js +2 -0
package/dist/src/gemini-web/browserSessionManager.js +76 -0
package/dist/src/gemini-web/client.js +16 -5
package/dist/src/gemini-web/executionClients.js +1 -0
package/dist/src/gemini-web/executionMode.js +18 -0
package/dist/src/gemini-web/executor.js +273 -120
package/dist/src/mcp/tools/consult.js +34 -21
package/dist/src/oracle/client.js +42 -13
package/dist/src/oracle/config.js +43 -7
package/dist/src/oracle/errors.js +2 -2
package/dist/src/oracle/files.js +20 -5
package/dist/src/oracle/gemini.js +3 -0
package/dist/src/oracle/request.js +7 -2
package/dist/src/oracle/run.js +22 -12
package/dist/src/sessionManager.js +4 -0
package/dist/vendor/oracle-notifier/OracleNotifier.app/Contents/CodeResources +0 -0
package/dist/vendor/oracle-notifier/OracleNotifier.app/Contents/MacOS/OracleNotifier +0 -0
package/package.json +18 -18
package/vendor/oracle-notifier/OracleNotifier.app/Contents/CodeResources +0 -0
package/vendor/oracle-notifier/OracleNotifier.app/Contents/MacOS/OracleNotifier +0 -0

package/README.md CHANGED Viewed

@@ -11,7 +11,39 @@
   <a href="LICENSE"><img src="https://img.shields.io/badge/license-MIT-green?style=for-the-badge" alt="MIT License"></a>
 </p>
-Oracle bundles your prompt and files so another AI can answer with real context. It speaks GPT-5.1 Pro (default alias to GPT-5.2 Pro on the API), GPT-5.1 Codex (API-only), GPT-5.1, GPT-5.2, Gemini 3 Pro, Claude Sonnet 4.5, Claude Opus 4.1, and more—and it can ask one or multiple models in a single run. Browser automation is available; use `--browser-model-strategy current` to keep the active ChatGPT model (or `ignore` to skip the picker). API remains the most reliable path, and `--copy` is an easy manual fallback.
+Oracle bundles your prompt and files so another AI can answer with real context. It speaks GPT-5.4 Pro (default), GPT-5.4, GPT-5.1 Pro, GPT-5.1 Codex (API-only), GPT-5.1, GPT-5.2, Gemini 3.1 Pro (API-only), Gemini 3 Pro, Claude Sonnet 4.5, Claude Opus 4.1, and more—and it can ask one or multiple models in a single run. Browser automation is available; use `--browser-model-strategy current` to keep the active ChatGPT model (or `ignore` to skip the picker). API remains the most reliable path, and `--copy` is an easy manual fallback.
+## Setting up (macOS Browser Mode)
+Browser mode lets you use GPT-5.2 Pro without any API keys — it automates your Chrome browser directly.
+### First-time login
+Run this once to create an automation profile and log in to ChatGPT. The browser stays open so you can complete the login:
+```bash
+oracle --engine browser --browser-manual-login \
+  --browser-keep-browser --browser-input-timeout 120000 \
+  -p "HI"
+```
+### Subsequent runs
+Once logged in, the automation profile is saved. Use this for all future runs:
+```bash
+oracle --engine browser --browser-manual-login \
+  --browser-auto-reattach-delay 5s \
+  --browser-auto-reattach-interval 3s \
+  --browser-auto-reattach-timeout 60s \
+  -p "your prompt"
+```
+> **Why these flags?**
+> - `--browser-manual-login` — Skips macOS Keychain cookie access (avoids repeated permission popups)
+> - `--browser-auto-reattach-*` — Reconnects when ChatGPT redirects mid-page-load (fixes "Inspected target navigated or closed" error)
+> - `--browser-keep-browser` — Keeps browser open for first-time login (not needed after)
+> - `--browser-input-timeout 120000` — Gives you 2 minutes to log in on first run
 ## Quick start
@@ -30,6 +62,12 @@ npx -y @steipete/oracle -p "Write a concise architecture note for the storage ad
 # Multi-model API run
 npx -y @steipete/oracle -p "Cross-check the data layer assumptions" --models gpt-5.1-pro,gemini-3-pro --file "src/**/*.ts"
+# Follow up from an existing OpenAI/Azure session id
+npx -y @steipete/oracle --engine api --model gpt-5.2-pro --followup release-readiness-audit --followup-model gpt-5.2-pro -p "Re-evaluate with this new context" --file "src/**/*.ts"
+# Follow up directly from an OpenAI Responses API id
+npx -y @steipete/oracle --engine api --model gpt-5.2-pro --followup resp_abc1234567890 -p "Continue from this response" --file docs/notes.md
 # Preview without spending tokens
 npx -y @steipete/oracle --dry-run summary -p "Check release notes" --file docs/release-notes.md
@@ -53,7 +91,7 @@ Engine auto-picks API when `OPENAI_API_KEY` is set, otherwise browser; browser i
 ## Integration
 **CLI**
-- API mode expects API keys in your environment: `OPENAI_API_KEY` (GPT-5.x), `GEMINI_API_KEY` (Gemini 3 Pro), `ANTHROPIC_API_KEY` (Claude Sonnet 4.5 / Opus 4.1).
+- API mode expects API keys in your environment: `OPENAI_API_KEY` (GPT-5.x), `GEMINI_API_KEY` (Gemini 3.1 Pro / Gemini 3 Pro), `ANTHROPIC_API_KEY` (Claude Sonnet 4.5 / Opus 4.1).
 - Gemini browser mode uses Chrome cookies instead of an API key—just be logged into `gemini.google.com` in Chrome (no Python/venv required).
 - If your Gemini account can’t access “Pro”, Oracle auto-falls back to a supported model for web runs (and logs the fallback in verbose mode).
 - Prefer API mode or `--copy` + manual paste; browser automation is experimental.
@@ -96,11 +134,43 @@ npx -y @steipete/oracle oracle-mcp
 - Multi-model API runs with aggregated cost/usage, including OpenRouter IDs alongside first-party models.
 - Render/copy bundles for manual paste into ChatGPT when automation is blocked.
 - GPT‑5 Pro API runs detach by default; reattach via `oracle session <id>` / `oracle status` or block with `--wait`.
+- OpenAI/Azure follow-up API runs can continue from `--followup <sessionId|responseId>`; for multi-model parents, add `--followup-model <model>`.
 - Azure endpoints supported via `--azure-endpoint/--azure-deployment/--azure-api-version` or `AZURE_OPENAI_*` envs.
 - File safety: globs/excludes, size guards, `--files-report`.
 - Sessions you can replay (`oracle status`, `oracle session <id> --render`).
 - Session logs and bundles live in `~/.oracle/sessions` (override with `ORACLE_HOME_DIR`).
+## Follow-up and lineage
+Use `--followup` to continue an existing OpenAI/Azure Responses API run with additional context/files:
+```bash
+oracle \
+  --engine api \
+  --model gpt-5.2-pro \
+  --followup <existing-session-id-or-resp_id> \
+  --followup-model gpt-5.2-pro \
+  --slug "my-followup-run" \
+  --wait \
+  -p "Follow-up: re-evaluate the previous recommendation with the attached files." \
+  --file "server/src/strategy/plan.ts" \
+  --file "server/src/strategy/executor.ts"
+```
+When the parent session used `--models`, `--followup-model` picks which model's response id to chain from.
+Custom `--base-url` providers and Gemini/Claude API runs are not supported with `--followup`, because Oracle does not chain `previous_response_id` for them.
+`oracle status` shows parent/child lineage in tree form:
+```text
+Recent Sessions
+Status    Model         Mode    Timestamp           Chars    Cost  Slug
+completed gpt-5.2-pro   api     03/01/2026 09:00 AM  1800  $2.110  architecture-review-parent
+completed gpt-5.2-pro   api     03/01/2026 09:14 AM  2200  $2.980  ├─ architecture-review-followup
+running   gpt-5.2-pro   api     03/01/2026 09:22 AM  1400       -  │  └─ architecture-review-implementation-pass
+pending   gpt-5.2-pro   api     03/01/2026 09:25 AM   900       -  └─ architecture-review-risk-check
+```
 ## Browser auto-reattach (long Pro runs)
 When browser runs time out (common with long GPT‑5.x Pro responses), Oracle can keep polling the existing ChatGPT tab and capture the final answer without manual `oracle session <id>` commands.
@@ -126,8 +196,10 @@ oracle --engine browser \
 | `-p, --prompt <text>` | Required prompt. |
 | `-f, --file <paths...>` | Attach files/dirs (globs + `!` excludes). |
 | `-e, --engine <api\|browser>` | Choose API or browser (browser is experimental). |
-| `-m, --model <name>` | Built-ins (`gpt-5.1-pro` default, `gpt-5-pro`, `gpt-5.1`, `gpt-5.1-codex`, `gpt-5.2`, `gpt-5.2-instant`, `gpt-5.2-pro`, `gemini-3-pro`, `claude-4.5-sonnet`, `claude-4.1-opus`) plus any OpenRouter id (e.g., `minimax/minimax-m2`, `openai/gpt-4o-mini`). |
+| `-m, --model <name>` | Built-ins (`gpt-5.4-pro` default, `gpt-5.4`, `gpt-5.1-pro`, `gpt-5-pro`, `gpt-5.1`, `gpt-5.1-codex`, `gpt-5.2`, `gpt-5.2-instant`, `gpt-5.2-pro`, `gemini-3.1-pro` API-only, `gemini-3-pro`, `claude-4.5-sonnet`, `claude-4.1-opus`) plus any OpenRouter id (e.g., `minimax/minimax-m2`, `openai/gpt-4o-mini`). |
 | `--models <list>` | Comma-separated API models (mix built-ins and OpenRouter ids) for multi-model runs. |
+| `--followup <sessionId\|responseId>` | Continue an OpenAI/Azure Responses API run from a stored oracle session or `resp_...` response id. |
+| `--followup-model <model>` | For multi-model OpenAI/Azure parent sessions, choose which model response to continue from. |
 | `--base-url <url>` | Point API runs at LiteLLM/Azure/OpenRouter/etc. |
 | `--chatgpt-url <url>` | Target a ChatGPT workspace/folder (browser). |
 | `--browser-model-strategy <select\|current\|ignore>` | Control ChatGPT model selection in browser mode (current keeps the active model; ignore skips the picker). |
@@ -161,7 +233,7 @@ oracle --engine browser \
 Put defaults in `~/.oracle/config.json` (JSON5). Example:
 ```json5
 {
-  model: "gpt-5.1-pro",
+  model: "gpt-5.4-pro",
   engine: "api",
   filesReport: true,
   browser: {

package/dist/bin/oracle-cli.js CHANGED Viewed

@@ -47,6 +47,7 @@ import { loadUserConfig } from '../src/config.js';
 import { applyBrowserDefaultsFromConfig } from '../src/cli/browserDefaults.js';
 import { shouldBlockDuplicatePrompt } from '../src/cli/duplicatePromptGuard.js';
 import { resolveRemoteServiceConfig } from '../src/remote/remoteServiceConfig.js';
+import { resolveConfiguredMaxFileSizeBytes } from '../src/cli/fileSize.js';
 const VERSION = getCliVersion();
 const CLI_ENTRYPOINT = fileURLToPath(import.meta.url);
 const LEGACY_FLAG_ALIASES = new Map([
@@ -98,12 +99,14 @@ program.hook('preAction', (thisCommand) => {
 });
 program
     .name('oracle')
-    .description('One-shot GPT-5.2 Pro / GPT-5.2 / GPT-5.1 Codex tool for hard questions that benefit from large file context and server-side search.')
+    .description('One-shot GPT-5.4 Pro / GPT-5.4 / GPT-5.1 Codex tool for hard questions that benefit from large file context and server-side search.')
     .version(VERSION)
     .argument('[prompt]', 'Prompt text (shorthand for --prompt).')
     .option('-p, --prompt <text>', 'User prompt to send to the model.')
     .addOption(new Option('--message <text>', 'Alias for --prompt.').hideHelp())
-    .option('-f, --file <paths...>', 'Files/directories or glob patterns to attach (prefix with !pattern to exclude). Files larger than 1 MB are rejected automatically.', collectPaths, [])
+    .option('--followup <sessionId|responseId>', 'Continue an OpenAI/Azure Responses API run from a stored response id (resp_...) or from a stored oracle session id.')
+    .option('--followup-model <model>', 'When following up a multi-model session, choose which model response to continue from.')
+    .option('-f, --file <paths...>', 'Files/directories or glob patterns to attach (prefix with !pattern to exclude). Oversized files are rejected automatically (default cap: 1 MB; configurable via ORACLE_MAX_FILE_SIZE_BYTES or config.maxFileSizeBytes).', collectPaths, [])
     .addOption(new Option('--include <paths...>', 'Alias for --file.')
     .argParser(collectPaths)
     .default([])
@@ -123,8 +126,8 @@ program
     .addOption(new Option('--copy-markdown', 'Copy the assembled markdown bundle to the clipboard; pair with --render to print it too.').default(false))
     .addOption(new Option('--copy').hideHelp().default(false))
     .option('-s, --slug <words>', 'Custom session slug (3-5 words).')
-    .option('-m, --model <model>', 'Model to target (gpt-5.2-pro default; also supports gpt-5.1-pro alias). Also gpt-5-pro, gpt-5.1, gpt-5.1-codex API-only, gpt-5.2, gpt-5.2-instant, gpt-5.2-pro, gemini-3-pro, claude-4.5-sonnet, claude-4.1-opus, or ChatGPT labels like "5.2 Thinking" for browser runs).', normalizeModelOption)
-    .addOption(new Option('--models <models>', 'Comma-separated API model list to query in parallel (e.g., "gpt-5.2-pro,gemini-3-pro").')
+    .option('-m, --model <model>', 'Model to target (gpt-5.4-pro default). Also gpt-5.4, gpt-5.1-pro, gpt-5-pro, gpt-5.1, gpt-5.1-codex API-only, gpt-5.2, gpt-5.2-instant, gpt-5.2-pro, gemini-3.1-pro API-only, gemini-3-pro, claude-4.5-sonnet, claude-4.1-opus, or ChatGPT labels like "5.2 Thinking" for browser runs).', normalizeModelOption)
+    .addOption(new Option('--models <models>', 'Comma-separated API model list to query in parallel (e.g., "gpt-5.4-pro,gemini-3-pro").')
     .argParser(collectModelList)
     .default([]))
     .addOption(new Option('-e, --engine <mode>', 'Execution engine (api | browser). Browser engine: GPT models automate ChatGPT; Gemini models use a cookie-based client for gemini.google.com. If omitted, oracle picks api when OPENAI_API_KEY is set, otherwise browser.').choices(['api', 'browser']))
@@ -135,7 +138,7 @@ program
     .addOption(new Option('--no-notify', 'Disable desktop notifications.').default(undefined))
     .addOption(new Option('--notify-sound', 'Play a notification sound on completion (default off).').default(undefined))
     .addOption(new Option('--no-notify-sound', 'Disable notification sounds.').default(undefined))
-    .addOption(new Option('--timeout <seconds|auto>', 'Overall timeout before aborting the API call (auto = 60m for gpt-5.2-pro, 120s otherwise).')
+    .addOption(new Option('--timeout <seconds|auto>', 'Overall timeout before aborting the API call (auto = 60m for gpt-5.4-pro, 120s otherwise).')
     .argParser(parseTimeoutOption)
     .default('auto'))
     .addOption(new Option('--background', 'Use Responses API background mode (create + retrieve) for API runs.').default(undefined))
@@ -413,8 +416,10 @@ function buildRunOptions(options, overrides = {}) {
         prompt: options.prompt,
         model: options.model,
         models: overrides.models ?? options.models,
+        previousResponseId: overrides.previousResponseId ?? options.previousResponseId,
         effectiveModelId: overrides.effectiveModelId ?? options.effectiveModelId ?? options.model,
         file: overrides.file ?? options.file ?? [],
+        maxFileSizeBytes: overrides.maxFileSizeBytes ?? options.maxFileSizeBytes,
         slug: overrides.slug ?? options.slug,
         filesReport: overrides.filesReport ?? options.filesReport,
         maxInput: overrides.maxInput ?? options.maxInput,
@@ -454,14 +459,141 @@ function resolveHeartbeatIntervalMs(seconds) {
     }
     return Math.round(seconds * 1000);
 }
+function assertFollowupSupported({ engine, model, baseUrl, azureEndpoint, }) { // Guard for --followup: throws an Error unless engine, model and endpoint all allow chaining from a previous response; returns nothing.
+    if (engine !== 'api') { // Follow-ups are rejected for any engine other than api.
+        throw new Error('--followup requires --engine api.');
+    }
+    if (model.startsWith('gemini') || model.startsWith('claude')) { // Provider is detected purely by model-name prefix.
+        throw new Error(`--followup is only supported for OpenAI Responses API runs. Model ${model} uses a provider client without previous_response_id support.`);
+    }
+    if (baseUrl && !azureEndpoint) { // A base URL is tolerated only when an Azure endpoint is also set.
+        throw new Error('--followup is only supported for the default OpenAI Responses API or Azure OpenAI Responses. Custom --base-url providers are not supported.');
+    }
+}
+function levenshteinDistance(a, b) { // Edit distance between a and b (insert, delete, substitute each cost 1), computed with two rolling rows.
+    if (a === b) // Identical inputs need no edits.
+        return 0;
+    if (a.length === 0) // Everything in b must be inserted.
+        return b.length;
+    if (b.length === 0) // Everything in a must be deleted.
+        return a.length;
+    const previous = new Array(b.length + 1); // Row for the prefix of a that is one element shorter.
+    const current = new Array(b.length + 1); // Row being filled for the current prefix of a.
+    for (let j = 0; j <= b.length; j += 1) { // Base row: turning an empty prefix into the first j elements of b costs j.
+        previous[j] = j;
+    }
+    for (let i = 1; i <= a.length; i += 1) {
+        current[0] = i; // Reducing the first i elements of a to nothing costs i deletions.
+        for (let j = 1; j <= b.length; j += 1) {
+            const substitutionCost = a[i - 1] === b[j - 1] ? 0 : 1; // Compared by index, i.e. per UTF-16 code unit for strings.
+            current[j] = Math.min(previous[j] + 1, current[j - 1] + 1, previous[j - 1] + substitutionCost); // Cheapest of deletion, insertion, substitution or match.
+        }
+        for (let j = 0; j <= b.length; j += 1) { // Copy the finished row so it becomes the previous row of the next iteration.
+            previous[j] = current[j];
+        }
+    }
+    return previous[b.length]; // After the final copy, previous holds the last row.
+}
+function scoreSessionSimilarity(input, candidate) { // Similarity score between 0 and 1: fixed tiers for exact, prefix and substring matches, otherwise a normalized edit distance.
+    if (input === candidate) // Exact match gets the top score.
+        return 1;
+    if (candidate.startsWith(input) || input.startsWith(candidate)) // Either string is a prefix of the other.
+        return 0.95;
+    if (candidate.includes(input) || input.includes(candidate)) // Either string occurs anywhere inside the other.
+        return 0.8;
+    const distance = levenshteinDistance(input, candidate);
+    const maxLength = Math.max(input.length, candidate.length);
+    if (maxLength === 0) // Division guard; for string inputs two empty strings already returned 1 above, so this looks unreachable.
+        return 0;
+    return Math.max(0, 1 - distance / maxLength); // Fraction of positions that did not need an edit, clamped at 0.
+}
+async function suggestFollowupSessionIds(input, limit = 3) { // Resolves to at most limit stored session ids that most resemble input, best match first.
+    const normalizedInput = input.trim().toLowerCase(); // Matching is case-insensitive and ignores surrounding whitespace.
+    if (!normalizedInput)
+        return [];
+    const sessions = await sessionStore.listSessions().catch(() => []); // Best effort: a failed listing simply yields no suggestions.
+    const seen = new Set(); // Ids already emitted, used to drop duplicates below.
+    const ranked = sessions
+        .map((meta) => meta.id)
+        .filter((id) => typeof id === 'string' && id.length > 0) // Skip entries without a usable id.
+        .filter((id) => {
+        if (seen.has(id))
+            return false;
+        seen.add(id);
+        return true;
+    })
+        .map((id) => ({ id, score: scoreSessionSimilarity(normalizedInput, id.toLowerCase()) }))
+        .filter((entry) => entry.score >= 0.45) // Minimum similarity for an id to count as a suggestion.
+        .sort((a, b) => b.score - a.score) // Highest score first.
+        .slice(0, limit);
+    return ranked.map((entry) => entry.id); // Ids are returned in their stored casing.
+}
+async function resolveFollowupReference(value, followupModel) { // Resolves the --followup value to an object with responseId and, when it came from a stored session, sessionId; throws when nothing usable is found.
+    const trimmed = value.trim();
+    if (trimmed.length === 0) {
+        throw new Error('--followup requires a session id or response id.');
+    }
+    if (trimmed.startsWith('resp_')) { // A value with the resp_ prefix is used as the response id directly, with no session lookup.
+        return { responseId: trimmed };
+    }
+    // Anything else is treated as an oracle session id (slug) and looked up in the session store.
+    const meta = await sessionStore.readSession(trimmed);
+    if (!meta) {
+        const suggestions = await suggestFollowupSessionIds(trimmed); // Near-miss ids to include in the error message.
+        const suggestionText = suggestions.length > 0 ? ` Did you mean: ${suggestions.map((id) => `"${id}"`).join(', ')}?` : '';
+        throw new Error(`No session found with ID ${trimmed}.${suggestionText} Run "oracle status --hours 72 --limit 20" to list recent sessions.`);
+    }
+    const fromMetadata = extractResponseIdFromSession(meta, followupModel); // May throw when the model choice is ambiguous or unknown.
+    if (fromMetadata) {
+        return { responseId: fromMetadata, sessionId: meta.id };
+    }
+    // Fallback: scrape the session log for a response id (covers older sessions / edge cases).
+    const logText = await sessionStore.readLog(trimmed).catch(() => ''); // An unreadable log is treated as empty.
+    const matches = logText.match(/resp_[A-Za-z0-9]+/g) ?? [];
+    const last = matches.length > 0 ? matches[matches.length - 1] : null; // The last id in the log wins; NOTE(review): followupModel is not consulted here.
+    if (last) {
+        return { responseId: last, sessionId: meta.id };
+    }
+    throw new Error(`Session ${trimmed} does not contain a stored response id. Ensure the original run produced a Responses API response id (background/store helps).`);
+}
+function extractResponseIdFromSession(meta, followupModel) { // Returns a stored resp_ id from session metadata, or null when none is stored; throws when the per-model run cannot be chosen.
+    // Single-model sessions store response metadata at the session root.
+    const rootResponse = meta.response ?? null;
+    const rootResponseId = rootResponse?.responseId ?? rootResponse?.id; // Either field name is accepted.
+    if (rootResponseId && rootResponseId.startsWith('resp_')) { // A root-level id is returned first, even when followupModel is given.
+        return rootResponseId;
+    }
+    const runs = Array.isArray(meta.models) ? meta.models : []; // Per-model run entries, if the session has any.
+    if (runs.length === 0) {
+        return null;
+    }
+    const pickRun = () => { // Chooses the run to chain from, or null when the choice is impossible or ambiguous.
+        if (followupModel) {
+            return runs.find((r) => r.model === followupModel) ?? null; // Exact match on the run model name.
+        }
+        return runs.length === 1 ? runs[0] : null; // Without an explicit model only a single run is unambiguous.
+    };
+    const chosen = pickRun();
+    if (!chosen) {
+        const models = runs.map((r) => r.model).join(', '); // Listed in the error so the user can pick one.
+        throw new Error(followupModel
+            ? `Session ${meta.id} has no model named ${followupModel}. Available: ${models}`
+            : `Session ${meta.id} has multiple model runs. Re-run with --followup-model. Available: ${models}`);
+    }
+    const runResponse = chosen.response ?? null;
+    const runResponseId = runResponse?.responseId ?? runResponse?.id;
+    return runResponseId && runResponseId.startsWith('resp_') ? runResponseId : null; // Only ids with the resp_ prefix are accepted.
+}
 function buildRunOptionsFromMetadata(metadata) {
     const stored = metadata.options ?? {};
     return {
         prompt: stored.prompt ?? '',
         model: stored.model ?? DEFAULT_MODEL,
         models: stored.models,
+        previousResponseId: stored.previousResponseId,
         effectiveModelId: stored.effectiveModelId ?? stored.model,
         file: stored.file ?? [],
+        maxFileSizeBytes: stored.maxFileSizeBytes,
         slug: stored.slug,
         filesReport: stored.filesReport,
         maxInput: stored.maxInput,
@@ -664,6 +796,14 @@ async function runRootCommand(options) {
         throw new Error('--remote-host does not support --models yet. Use API engine locally instead.');
     }
     const resolvedModel = normalizedMultiModels[0] ?? (isGemini ? resolveApiModel(cliModelArg) : resolvedModelCandidate);
+    const includesGeminiApiOnly = (normalizedMultiModels.length > 0 ? normalizedMultiModels : [resolvedModel]).some((model) => model === 'gemini-3.1-pro');
+    if ((userForcedBrowser || userConfig.engine === 'browser') && includesGeminiApiOnly) {
+        throw new Error('gemini-3.1-pro is API-only today. Use --engine api or switch to gemini-3-pro for Gemini web.');
+    }
+    if (engine === 'browser' && includesGeminiApiOnly) {
+        console.log(chalk.dim('gemini-3.1-pro is API-only today; switching to API.'));
+        engine = 'api';
+    }
     const effectiveModelId = resolvedModel.startsWith('gemini')
         ? resolveGeminiModelId(resolvedModel)
         : isKnownModel(resolvedModel)
@@ -672,6 +812,7 @@ async function runRootCommand(options) {
     const resolvedBaseUrl = normalizeBaseUrl(options.baseUrl ?? (isClaude ? process.env.ANTHROPIC_BASE_URL : process.env.OPENAI_BASE_URL));
     const { models: _rawModels, ...optionsWithoutModels } = options;
     const resolvedOptions = { ...optionsWithoutModels, model: resolvedModel };
+    resolvedOptions.maxFileSizeBytes = resolveConfiguredMaxFileSizeBytes(userConfig, process.env);
     if (normalizedMultiModels.length > 0) {
         resolvedOptions.models = normalizedMultiModels;
     }
@@ -746,6 +887,21 @@ async function runRootCommand(options) {
             options.prompt = `${options.prompt.trim()}\n${userConfig.promptSuffix}`;
         }
         resolvedOptions.prompt = options.prompt;
+        if (options.followup) {
+            assertFollowupSupported({
+                engine,
+                model: resolvedModel,
+                baseUrl: resolvedBaseUrl,
+                azureEndpoint: resolvedOptions.azure?.endpoint,
+            });
+            if (normalizedMultiModels.length > 0) {
+                throw new Error('--followup cannot be combined with --models.');
+            }
+            const followup = await resolveFollowupReference(options.followup, options.followupModel);
+            resolvedOptions.previousResponseId = followup.responseId;
+            resolvedOptions.followupSessionId = followup.sessionId;
+            resolvedOptions.followupModel = options.followupModel;
+        }
         const runOptions = buildRunOptions(resolvedOptions, { preview: true, previewMode, baseUrl: resolvedBaseUrl });
         if (engine === 'browser') {
             await runBrowserPreview({
@@ -784,6 +940,21 @@ async function runRootCommand(options) {
         options.prompt = `${options.prompt.trim()}\n${userConfig.promptSuffix}`;
     }
     resolvedOptions.prompt = options.prompt;
+    if (options.followup) {
+        assertFollowupSupported({
+            engine,
+            model: resolvedModel,
+            baseUrl: resolvedBaseUrl,
+            azureEndpoint: resolvedOptions.azure?.endpoint,
+        });
+        if (normalizedMultiModels.length > 0) {
+            throw new Error('--followup cannot be combined with --models.');
+        }
+        const followup = await resolveFollowupReference(options.followup, options.followupModel);
+        resolvedOptions.previousResponseId = followup.responseId;
+        resolvedOptions.followupSessionId = followup.sessionId;
+        resolvedOptions.followupModel = options.followupModel;
+    }
     const duplicateBlocked = await shouldBlockDuplicatePrompt({
         prompt: resolvedOptions.prompt,
         force: options.force,
@@ -798,7 +969,10 @@ async function runRootCommand(options) {
         const isBrowserMode = engine === 'browser' || userForcedBrowser;
         const filesToValidate = isBrowserMode ? options.file.filter((f) => !isMediaFile(f)) : options.file;
         if (filesToValidate.length > 0) {
-            await readFiles(filesToValidate, { cwd: process.cwd() });
+            await readFiles(filesToValidate, {
+                cwd: process.cwd(),
+                maxFileSizeBytes: resolvedOptions.maxFileSizeBytes,
+            });
         }
     }
     const getSource = (key) => program.getOptionValueSource?.(key) ?? undefined;
@@ -874,6 +1048,8 @@ async function runRootCommand(options) {
         ...baseRunOptions,
         mode: sessionMode,
         browserConfig,
+        followupSessionId: resolvedOptions.followupSessionId,
+        followupModel: resolvedOptions.followupModel,
         waitPreference,
         youtube: options.youtube,
         generateImage: options.generateImage,
@@ -1022,7 +1198,10 @@ async function restartSession(sessionId, options) {
         const isBrowserMode = engine === 'browser';
         const filesToValidate = isBrowserMode ? runOptions.file.filter((f) => !isMediaFile(f)) : runOptions.file;
         if (filesToValidate.length > 0) {
-            await readFiles(filesToValidate, { cwd });
+            await readFiles(filesToValidate, {
+                cwd,
+                maxFileSizeBytes: runOptions.maxFileSizeBytes,
+            });
         }
     }
     enforceBrowserSearchFlag(runOptions, sessionMode, console.log);
@@ -1080,6 +1259,8 @@ async function restartSession(sessionId, options) {
         ...runOptions,
         mode: sessionMode,
         browserConfig,
+        followupSessionId: storedOptions.followupSessionId,
+        followupModel: storedOptions.followupModel,
         waitPreference,
         youtube: storedOptions.youtube,
         generateImage: storedOptions.generateImage,

package/dist/src/browser/actions/modelSelection.js CHANGED Viewed

@@ -71,13 +71,15 @@ function buildModelSelectionExpression(targetModel, strategy) {
       .map((token) => normalizeText(token))
       .filter(Boolean);
     const targetWords = normalizedTarget.split(' ').filter(Boolean);
-    const desiredVersion = normalizedTarget.includes('5 2')
-      ? '5-2'
-      : normalizedTarget.includes('5 1')
-        ? '5-1'
-        : normalizedTarget.includes('5 0')
-          ? '5-0'
-          : null;
+    const desiredVersion = normalizedTarget.includes('5 4')
+      ? '5-4'
+      : normalizedTarget.includes('5 2')
+        ? '5-2'
+        : normalizedTarget.includes('5 1')
+          ? '5-1'
+          : normalizedTarget.includes('5 0')
+            ? '5-0'
+            : null;
     const wantsPro = normalizedTarget.includes(' pro') || normalizedTarget.endsWith(' pro') || normalizedTokens.includes('pro');
     const wantsInstant = normalizedTarget.includes('instant');
     const wantsThinking = normalizedTarget.includes('thinking');
@@ -87,6 +89,26 @@ function buildModelSelectionExpression(targetModel, strategy) {
       return { status: 'button-missing' };
     }
+    const closeMenu = () => { // Tries a click sequence on the button first, then falls back to an Escape keydown; named for closing the menu.
+      try {
+        if (dispatchClickSequence(button)) { // A truthy result is treated as a successful click.
+          lastPointerClick = performance.now(); // Record when the click was dispatched.
+          return;
+        }
+      } catch {} // Best effort: a failed click falls through to the Escape fallback.
+      try {
+        document.dispatchEvent(
+          new KeyboardEvent('keydown', {
+            key: 'Escape',
+            code: 'Escape',
+            keyCode: 27, // Legacy numeric fields are set alongside key and code.
+            which: 27,
+            bubbles: true,
+          }),
+        );
+      } catch {} // Errors from the fallback are ignored as well.
+    };
     const getButtonLabel = () => (button.textContent ?? '').trim();
     if (MODEL_STRATEGY === 'current') {
       return { status: 'already-selected', label: getButtonLabel() };
@@ -95,6 +117,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
       const normalizedLabel = normalizeText(getButtonLabel());
       if (!normalizedLabel) return false;
       if (desiredVersion) {
+        if (desiredVersion === '5-4' && !normalizedLabel.includes('5 4')) return false;
         if (desiredVersion === '5-2' && !normalizedLabel.includes('5 2')) return false;
         if (desiredVersion === '5-1' && !normalizedLabel.includes('5 1')) return false;
         if (desiredVersion === '5-0' && !normalizedLabel.includes('5 0')) return false;
@@ -159,6 +182,12 @@ function buildModelSelectionExpression(targetModel, strategy) {
             normalizedTestId.includes('gpt-5-2') ||
             normalizedTestId.includes('gpt-5.2') ||
             normalizedTestId.includes('gpt52');
+          const has54 =
+            normalizedTestId.includes('5-4') ||
+            normalizedTestId.includes('5.4') ||
+            normalizedTestId.includes('gpt-5-4') ||
+            normalizedTestId.includes('gpt-5.4') ||
+            normalizedTestId.includes('gpt54');
           const has51 =
             normalizedTestId.includes('5-1') ||
             normalizedTestId.includes('5.1') ||
@@ -171,7 +200,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
             normalizedTestId.includes('gpt-5-0') ||
             normalizedTestId.includes('gpt-5.0') ||
             normalizedTestId.includes('gpt50');
-          const candidateVersion = has52 ? '5-2' : has51 ? '5-1' : has50 ? '5-0' : null;
+          const candidateVersion = has54 ? '5-4' : has52 ? '5-2' : has51 ? '5-1' : has50 ? '5-0' : null;
           // If a candidate advertises a different version, ignore it entirely.
           if (candidateVersion && candidateVersion !== desiredVersion) {
             return 0;
@@ -317,6 +346,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
         const match = findBestOption();
         if (match) {
           if (optionIsSelected(match.node)) {
+            closeMenu();
             resolve({ status: 'already-selected', label: getButtonLabel() || match.label });
             return;
           }
@@ -331,6 +361,7 @@ function buildModelSelectionExpression(targetModel, strategy) {
           // Wait for the top bar label to reflect the requested model; otherwise keep scanning.
           setTimeout(() => {
             if (buttonMatchesTarget()) {
+              closeMenu();
               resolve({ status: 'switched', label: getButtonLabel() || match.label });
               return;
             }
@@ -374,6 +405,22 @@ function buildModelMatchersLiteral(targetModel) {
     push(`chatgpt ${dotless}`, labelTokens);
     push(`gpt ${base}`, labelTokens);
     push(`gpt ${dotless}`, labelTokens);
+    // Numeric variations (5.4 ↔ 54 ↔ gpt-5-4)
+    if (base.includes('5.4') || base.includes('5-4') || base.includes('54')) {
+        push('5.4', labelTokens);
+        push('gpt-5.4', labelTokens);
+        push('gpt5.4', labelTokens);
+        push('gpt-5-4', labelTokens);
+        push('gpt5-4', labelTokens);
+        push('gpt54', labelTokens);
+        push('chatgpt 5.4', labelTokens);
+        if (!base.includes('pro')) {
+            testIdTokens.add('model-switcher-gpt-5-4');
+        }
+        testIdTokens.add('gpt-5-4');
+        testIdTokens.add('gpt5-4');
+        testIdTokens.add('gpt54');
+    }
     // Numeric variations (5.1 ↔ 51 ↔ gpt-5-1)
     if (base.includes('5.1') || base.includes('5-1') || base.includes('51')) {
         push('5.1', labelTokens);
@@ -436,6 +483,11 @@ function buildModelMatchersLiteral(targetModel) {
         push('proresearch', labelTokens);
         push('research grade', labelTokens);
         push('advanced reasoning', labelTokens);
+        if (base.includes('5.4') || base.includes('5-4') || base.includes('54')) {
+            testIdTokens.add('gpt-5.4-pro');
+            testIdTokens.add('gpt-5-4-pro');
+            testIdTokens.add('gpt54pro');
+        }
         if (base.includes('5.1') || base.includes('5-1') || base.includes('51')) {
             testIdTokens.add('gpt-5.1-pro');
             testIdTokens.add('gpt-5-1-pro');

package/dist/src/browser/actions/navigation.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { CLOUDFLARE_SCRIPT_SELECTOR, CLOUDFLARE_TITLE, INPUT_SELECTORS, } from '../constants.js';
 import { delay } from '../utils.js';
 import { logDomFailure } from '../domDebug.js';
+import { BrowserAutomationError } from '../../oracle/errors.js';
 export function installJavaScriptDialogAutoDismissal(Page, logger) {
     const pageAny = Page;
     if (typeof pageAny.on !== 'function' || typeof pageAny.handleJavaScriptDialog !== 'function') {
@@ -127,7 +128,7 @@ export async function ensureNotBlocked(Runtime, headless, logger) {
             ? 'Cloudflare challenge detected in headless mode. Re-run with --headful so you can solve the challenge.'
             : 'Cloudflare challenge detected. Complete the “Just a moment…” check in the open browser, then rerun.';
         logger('Cloudflare anti-bot page detected');
-        throw new Error(message);
+        throw new BrowserAutomationError(message, { stage: 'cloudflare-challenge', headless });
     }
 }
 const LOGIN_CHECK_TIMEOUT_MS = 5_000;

package/dist/src/browser/constants.js CHANGED Viewed

@@ -1,5 +1,5 @@
 export const CHATGPT_URL = 'https://chatgpt.com/';
-export const DEFAULT_MODEL_TARGET = 'GPT-5.2 Pro';
+export const DEFAULT_MODEL_TARGET = 'GPT-5.4 Pro';
 export const DEFAULT_MODEL_STRATEGY = 'select';
 export const COOKIE_URLS = ['https://chatgpt.com', 'https://chat.openai.com', 'https://atlas.openai.com'];
 export const INPUT_SELECTORS = [