npm - @ax-llm/ax - Versions diffs - 21.0.3 → 21.0.5 - Mend

@ax-llm/ax 21.0.3 → 21.0.5

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those package versions as they appear in their respective public registries.

Files changed (19) hide show

package/index.cjs +184 -181
package/index.cjs.map +1 -1
package/index.d.cts +42 -15
package/index.d.ts +42 -15
package/index.global.js +108 -105
package/index.global.js.map +1 -1
package/index.js +186 -183
package/index.js.map +1 -1
package/package.json +1 -1
package/skills/ax-agent-optimize.md +1 -1
package/skills/ax-agent.md +4 -4
package/skills/ax-ai.md +1 -1
package/skills/ax-audio.md +1 -1
package/skills/ax-flow.md +1 -1
package/skills/ax-gen.md +1 -1
package/skills/ax-gepa.md +1 -1
package/skills/ax-learn.md +1 -1
package/skills/ax-llm.md +1 -1
package/skills/ax-signature.md +1 -1

package/index.d.cts CHANGED Viewed

@@ -2427,6 +2427,7 @@ declare class AxBaseAI<TModel, TEmbedModel, TChatRequest, TEmbedRequest, TChatRe
     private calculatePercentile;
     private updateLatencyMetrics;
     private updateErrorMetrics;
+    private recordEstimatedCost;
     private recordTokenUsage;
     private calculateRequestSize;
     private calculateResponseSize;
@@ -2535,6 +2536,9 @@ type AxModelInfo = {
     maxTokens?: number;
     isExpensive?: boolean;
     contextWindow?: number;
+    isDeprecated?: boolean;
+    /** ISO date (YYYY-MM-DD) the upstream provider will stop serving this model. */
+    deprecatedOn?: string;
 };
 type AxTokenUsage = {
     promptTokens: number;
@@ -2755,6 +2759,10 @@ type AxCitation = {
     license?: string;
     publicationDate?: string;
     snippet?: string;
+    /** File Search multimodal (Gemini, May 2026): media chunk id. */
+    mediaId?: string;
+    /** File Search multimodal (Gemini, May 2026): page numbers cited within the source. */
+    pageNumbers?: number[];
 };
 type AxModelUsage = {
     ai: string;
@@ -4305,9 +4313,9 @@ declare class AxSignature<_TInput extends Record<string, any> = Record<string, a
 declare const promptTemplates: {
     readonly 'dsp/dspy.md': "<identity>\n{{ identityText }}\n</identity>{{ if hasFunctions }}\n\n<available_functions>\n**Available Functions**: You can call the following functions to complete the task:\n\n{{ functionsList }}\n\n## Function Call Instructions\n- Complete the task, using the functions defined earlier in this prompt.\n- Output fields should only be generated after all functions have been called.\n- Use the function results to generate the output fields.\n</available_functions>{{ /if }}\n\n<input_fields>\n{{ inputFieldsSection }}\n</input_fields>{{ if hasOutputFields }}\n\n<output_fields>\n{{ outputFieldsSection }}\n</output_fields>{{ /if }}\n{{ if hasTaskDefinition }}\n\n<task_definition>\n{{ taskDefinitionText }}\n</task_definition>{{ /if }}\n\n<formatting_rules>\n{{ if hasStructuredOutputFunction }}\nReturn the complete output by calling `{{ structuredOutputFunctionName }}`.\n{{ else }}{{ if hasComplexFields }}\nReturn valid JSON matching <output_fields>.\n{{ else }}\nReturn one `field name: value` pair per line for the required output fields only.\n{{ /if }}{{ /if }}Above rules override later instructions.\n\n</formatting_rules>\n{{ if hasExampleDemonstrations }}\n\n## Example Demonstrations\nThe following User/Assistant turns are examples only until --- END OF EXAMPLES ---, not context for the current task.\n{{ /if }}\n";
     readonly 'dsp/example-separator.md': "--- END OF EXAMPLES ---\nThe examples above were for training purposes only. Please ignore any specific entities or facts mentioned in them.\n\nREAL USER QUERY:\n";
-    readonly 'rlm/distiller.md': "## Distiller\n\nYou (`distiller`) read the available context and forward an actionable request to the downstream **executor** stage (which has the tools — shell, file system, agent functions, etc.). You do not execute the task yourself.\n\nCall `final(request, evidence)` to forward. Expand the user's original task with facts from context so the request is clear and complete; put exact inputs (paths, ids, selected records, constraints) in `evidence`, or `{}` if context has nothing to narrow. Resolve follow-ups against prior conversation. Never refuse with \"I have no tools\" — forwarding *is* the response. Use `askClarification` only when genuinely blocked by ambiguity.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Context Fields\n\nContext fields are available as globals (in the REPL) on the `inputs` object:\n{{ contextVarList }}\n\n### Available Functions\n\n{{ primitivesList }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded. Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn (and forwarded to the executor).\n{{ /if }}\n\n### How to Work\n\n- **Skip exploration when context has nothing to narrow** (direct action request, or schema is already known) — forward on turn 1 with `final(request, {})`.\n- **When narrowing**: probe shape, narrow with JS, extract. Don't dump raw data. Don't repeat probes already in the Action Log.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret a narrowed slice — never pass raw `inputs.*` to it.\n- `console.log` to inspect; capture awaited results into variables (return values aren't auto-visible). 
Multiple `console.log`s per turn is fine.\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst interpretation = await llmQuery([{\n  query: 'Classify each as billing_dispute | unauthorized_charge | other. JSON list.',\n  context: { emails: narrowed }\n}]);\nconsole.log(interpretation);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nValid completion turns:\n\n```js\nawait final(\"Use the matched emails to answer the user's question\", { matchedEmails });\n```\n\n```js\n// Passthrough — user asked for an action and there's nothing in context to narrow.\nawait final(\"Run the shell command `ls -la` and return its output verbatim\", {});\n```\n\n```js\nawait askClarification(\"Which context should I inspect?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
-    readonly 'rlm/executor.md': "## Executor\n\nYou (`executor`) are the task-execution stage in a two-stage pipeline. Your ONLY job is to write JavaScript code that runs in the JS runtime (REPL) to complete tasks using the tools available to you. A separate (`responder`) agent downstream synthesizes the final answer.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Executor Request & Distilled Context\n\nThe prior distiller stage produced two extra inputs:\n\n- `inputs.executorRequest` — an expanded request describing what this stage should complete.\n- `inputs.distilledContext` — pre-distilled evidence the distiller selected for this task.\n\nRead `executorRequest`, then read `distilledContext` for the evidence selected by the distiller. Raw context fields are not available in this stage. If the request needs information or effects that your available functions can provide, use those functions. If the distilled evidence is sufficient, finish directly with `final(...)`. Call `askClarification(...)` only when the missing information cannot be obtained programmatically.\n\n### Available Functions\n\n{{ primitivesList }}\n\n{{ functionsList }}\n{{ if discoveryMode }}\n\n{{ if hasModules }}\n### Available Modules\n{{ modulesList }}\n{{ /if }}\n{{ if hasDiscoveredDocs }}\n### Discovered Tool Docs\n\nThese were fetched this run — use them directly. Only re-run discovery for modules/functions not listed here.\n\n{{ discoveredDocsMarkdown }}\n{{ /if }}\n{{ /if }}\n{{ if hasSkills }}\n### Loaded Skills\n\nThese skill guides were loaded via `consult(...)` — apply them directly. 
Call `consult([...])` to load additional skills as needed.\n\n{{ skillsMarkdown }}\n{{ /if }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded (including any the distiller forwarded). Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn.\n{{ /if }}\n\n### How to Work\n\n- Start from `inputs.executorRequest`, `inputs.distilledContext`, non-context task inputs, and prior successful Action Log results. Don't repeat probes already in the Action Log.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret narrowed text — never pass raw `inputs.*` to it.\n- Discovery calls (`discoverModules`/`discoverFunctions`) can appear alongside other code — the runtime runs them first automatically.\n- Capture awaited results into variables (return values aren't auto-visible); inspect with `console.log(result)` or finish with `await final(\"...\", { result })`. Multiple `console.log`s per turn is fine.\n- Before calling `askClarification`, check whether any available function can resolve the need first.\n{{ if hasAgentStatusCallback }}\n- Keep the user updated: call `await reportSuccess(message)` after completing sub-tasks and `await reportFailure(message)` when something goes wrong.\n{{ /if }}\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst plan = await llmQuery([{\n  query: 'Determine which messages require a refund response and draft a compact action plan.',\n  context: { emails: narrowed }\n}]);\nconsole.log(plan);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. 
Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nWhen done, call `await final(task, evidence)`:\n\n- `task` — a one-line instruction the **responder** will follow when writing the user-facing output fields (e.g. \"Answer the user's question using the matched emails\").\n- `evidence` — the curated data the responder will read to follow `task`. Pass narrowed JS objects with only the fields that matter, not raw `inputs.*`. Use plain keys (`{ matchedEmails: [...] }`) — don't wrap under the output field name.\n\nDo not pre-format the answer; the responder writes the output fields.\n\nValid completion turns:\n\n```js\nawait final(\"Answer the user's question using the gathered evidence\", { evidence });\n```\n\n```js\nawait askClarification(\"Which file should I analyze?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
-    readonly 'rlm/responder.md': "## Answer Synthesis Agent\n\nYou synthesize the final answer from the evidence the actor gathered. You do not run code, call tools, or invoke agents — you read input fields and write the output fields.\n\n### Reading the actor's payload\n\n`Context Data` has two keys:\n\n- `task` — a one-line instruction telling you what to write into the output fields.\n- `evidence` — the data the actor curated for you to follow that instruction.\n\n### Rules\n\n1. Follow `Context Data.task` using `Context Data.evidence` and any other input fields provided.\n2. When emitting a JSON output field, write the value flat — do **not** wrap it under a key matching the field's title. The field is already named.\n3. If `evidence` lacks sufficient information, give the best possible answer from what's available across all input fields.\n\n### Context variables that were analyzed (metadata only)\n{{ contextVarSummary }}\n{{ if hasAgentIdentity }}\n\n### Agent Identity\n\nUser-facing identity:\n{{ agentIdentityText }}\n{{ /if }}\n";
+    readonly 'rlm/distiller.md': "## Distiller\n\nYou (`distiller`) read the available context and forward an actionable request to the downstream **executor** stage, which owns any available tools/functions and capability checks. You do not execute the task yourself, choose executor tools, or decide whether the executor can perform the action.\n\nCall `final(request, evidence)` to forward. Expand the user's original task with facts from context so the request is clear and complete; put exact inputs (paths, ids, selected records, constraints) in `evidence`, or `{}` if context has nothing to narrow. Resolve follow-ups against prior conversation. Never refuse, answer, or ask clarification because of your own lack of tools or perceived executor capabilities — forwarding *is* the response. Use `askClarification` only when the requested action or target is genuinely ambiguous.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Context Fields\n\nContext fields are available as globals (in the REPL) on the `inputs` object:\n{{ contextVarList }}\n\n### Available Functions\n\n{{ primitivesList }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded. Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn (and forwarded to the executor).\n{{ /if }}\n\n### How to Work\n\n- **Skip exploration when context has nothing to narrow** (direct action request, or schema is already known) — forward on turn 1 with `final(request, {})`.\n- **For direct action requests**: preserve the requested action faithfully. 
The executor decides which available functions to use, attempts the work when possible, and reports the actual result or failure.\n- **When narrowing**: probe shape, narrow with JS, extract. Don't dump raw data. Don't repeat probes already in the Action Log.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret a narrowed slice — never pass raw `inputs.*` to it.\n- `console.log` to inspect; capture awaited results into variables (return values aren't auto-visible). Multiple `console.log`s per turn is fine.\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst interpretation = await llmQuery([{\n  query: 'Classify each as billing_dispute | unauthorized_charge | other. JSON list.',\n  context: { emails: narrowed }\n}]);\nconsole.log(interpretation);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nValid completion turns:\n\n```js\nawait final(\"Use the matched emails to answer the user's question\", { matchedEmails });\n```\n\n```js\n// Passthrough — user asked for an action and there's nothing in context to narrow.\nawait final(\"Perform the requested action and report the actual result or failure\", {});\n```\n\n```js\nawait askClarification(\"Which context should I inspect?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
+    readonly 'rlm/executor.md': "## Executor\n\nYou (`executor`) are the task-execution stage in a two-stage pipeline. Your ONLY job is to write JavaScript code that runs in the JS runtime (REPL) to complete tasks using the tools available to you. A separate (`responder`) agent downstream synthesizes the final answer.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Executor Request & Distilled Context\n\nThe prior distiller stage produced two extra inputs:\n\n- `inputs.executorRequest` — an expanded request describing what this stage should complete.\n- `inputs.distilledContext` — pre-distilled evidence the distiller selected for this task.\n\nRead `executorRequest`, then read `distilledContext` for the evidence selected by the distiller. Raw context fields are not available in this stage. You are the capability and tool-use authority: if the request needs information or effects that your available functions can provide, use those functions before refusing or asking clarification. If the distilled evidence is sufficient, finish directly with `final(...)`. Call `askClarification(...)` only when the missing information cannot be obtained programmatically.\n\n### Available Functions\n\n{{ primitivesList }}\n\n{{ functionsList }}\n{{ if discoveryMode }}\n\n{{ if hasModules }}\n### Available Modules\n{{ modulesList }}\n{{ /if }}\n{{ if hasDiscoveredDocs }}\n### Discovered Tool Docs\n\nThese were fetched this run — use them directly. Only re-run discovery for modules/functions not listed here.\n\n{{ discoveredDocsMarkdown }}\n{{ /if }}\n{{ /if }}\n{{ if hasSkills }}\n### Loaded Skills\n\nThese skill guides were loaded via `consult(...)` — apply them directly. 
Call `consult([...])` to load additional skills as needed.\n\n{{ skillsMarkdown }}\n{{ /if }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded (including any the distiller forwarded). Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn.\n{{ /if }}\n\n### How to Work\n\n- Start from `inputs.executorRequest`, `inputs.distilledContext`, non-context task inputs, and prior successful Action Log results. Don't repeat probes already in the Action Log.\n- Treat direct action requests as work to attempt with available functions. If a function fails or the environment denies the action, capture the real error, status, output, or exception in the evidence for the responder.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret narrowed text — never pass raw `inputs.*` to it.\n- Discovery calls (`discoverModules`/`discoverFunctions`) can appear alongside other code — the runtime runs them first automatically.\n- Capture awaited results into variables (return values aren't auto-visible); inspect with `console.log(result)` or finish with `await final(\"...\", { result })`. 
Multiple `console.log`s per turn is fine.\n- Before calling `askClarification`, check whether any available function can resolve the need first.\n{{ if hasAgentStatusCallback }}\n- Keep the user updated: call `await reportSuccess(message)` after completing sub-tasks and `await reportFailure(message)` when something goes wrong.\n{{ /if }}\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst plan = await llmQuery([{\n  query: 'Determine which messages require a refund response and draft a compact action plan.',\n  context: { emails: narrowed }\n}]);\nconsole.log(plan);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nWhen done, call `await final(task, evidence)`:\n\n- `task` — a one-line instruction the **responder** will follow when writing the user-facing output fields (e.g. \"Answer the user's question using the matched emails\").\n- `evidence` — the curated data the responder will read to follow `task`. Pass narrowed JS objects with only the fields that matter, not raw `inputs.*`. Use plain keys (`{ matchedEmails: [...] }`) — don't wrap under the output field name.\n\nDo not pre-format the answer; the responder writes the output fields.\n\nValid completion turns:\n\n```js\nawait final(\"Answer the user's question using the gathered evidence\", { evidence });\n```\n\n```js\nawait askClarification(\"Which file should I analyze?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
+    readonly 'rlm/responder.md': "## Answer Synthesis Agent\n\nYou synthesize the final answer from the evidence the actor gathered. You do not run code, call tools, or invoke agents — you read input fields and write the output fields.\n\n### Reading the actor's payload\n\n`Context Data` has two keys:\n\n- `task` — a one-line instruction telling you what to write into the output fields.\n- `evidence` — the data the actor curated for you to follow that instruction.\n\n### Rules\n\n1. Follow `Context Data.task` using `Context Data.evidence` and any other input fields provided.\n2. When emitting a JSON output field, write the value flat — do **not** wrap it under a key matching the field's title. The field is already named.\n3. If `evidence` lacks sufficient information, give the best possible answer from what's available across all input fields.\n4. Do not contradict actor evidence. If evidence contains a tool result, failure, status, output, or exception, report that result rather than inventing a capability limit.\n\n### Context variables that were analyzed (metadata only)\n{{ contextVarSummary }}\n{{ if hasAgentIdentity }}\n\n### Agent Identity\n\nUser-facing identity:\n{{ agentIdentityText }}\n{{ /if }}\n";
 };
 type TemplateId = keyof typeof promptTemplates;
@@ -5709,6 +5717,10 @@ type AxAIAnthropicThinkingWire = {
 type AxAIAnthropicEffortLevel = 'low' | 'medium' | 'high' | 'max';
 type AxAIAnthropicOutputConfig = {
     effort?: AxAIAnthropicEffortLevel;
+    format?: {
+        type: 'json_schema';
+        schema: object;
+    };
 };
 type AxAIAnthropicEffortLevelMapping = {
     minimal?: AxAIAnthropicEffortLevel;
@@ -5771,7 +5783,7 @@ type AxAIAnthropicChatRequest = {
                 media_type: string;
                 data: string;
             };
-        } & AxAIAnthropicChatRequestCacheParam) | {
+        } & AxAIAnthropicChatRequestCacheParam) | ({
             type: 'tool_result';
             is_error?: boolean;
             tool_use_id: string;
@@ -5786,7 +5798,7 @@ type AxAIAnthropicChatRequest = {
                     data: string;
                 };
             } & AxAIAnthropicChatRequestCacheParam))[];
-        })[];
+        } & AxAIAnthropicChatRequestCacheParam))[];
     } | {
         role: 'assistant';
         content: string | (({
@@ -5826,10 +5838,6 @@ type AxAIAnthropicChatRequest = {
     top_k?: number;
     thinking?: AxAIAnthropicThinkingWire;
     output_config?: AxAIAnthropicOutputConfig;
-    output_format?: {
-        type: 'json_schema';
-        schema: object;
-    };
     metadata?: {
         user_id: string;
     };
@@ -6003,8 +6011,11 @@ declare enum AxAIOpenAIModel {
     GPT4OMini = "gpt-4o-mini",
     GPTAudio = "gpt-audio",
     GPTAudioMini = "gpt-audio-mini",
+    GPTAudio15 = "gpt-audio-1.5",
+    GPTRealtime15 = "gpt-realtime-1.5",
     GPTRealtime2 = "gpt-realtime-2",
     GPTRealtimeWhisper = "gpt-realtime-whisper",
+    GPTRealtimeTranslate = "gpt-realtime-translate",
     GPT4ChatGPT4O = "chatgpt-4o-latest",
     GPT4Turbo = "gpt-4-turbo",
     GPT35Turbo = "gpt-3.5-turbo",
@@ -6031,6 +6042,8 @@ declare enum AxAIOpenAIModel {
     GPT54 = "gpt-5.4",
     GPT54Mini = "gpt-5.4-mini",
     GPT54Nano = "gpt-5.4-nano",
+    GPT55 = "gpt-5.5",
+    GPT55Pro = "gpt-5.5-pro",
     O1 = "o1",
     O1Mini = "o1-mini",
     O3 = "o3",
@@ -6063,7 +6076,7 @@ type AxAIOpenAIConfig<TModel, TEmbedModel> = Omit<AxModelConfig, 'topK'> & {
     logprobs?: number;
     echo?: boolean;
     dimensions?: number;
-    reasoningEffort?: 'minimal' | 'low' | 'medium' | 'high';
+    reasoningEffort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
     store?: boolean;
     serviceTier?: 'auto' | 'default' | 'flex';
     webSearchOptions?: {
@@ -6111,7 +6124,7 @@ interface AxAIOpenAIResponseDelta<T> {
 }
 type AxAIOpenAIChatRequest<TModel> = {
     model: TModel;
-    reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high';
+    reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
     store?: boolean;
     modalities?: readonly ('text' | 'audio')[];
     audio?: {
@@ -6946,6 +6959,10 @@ declare enum AxAIGoogleGeminiModel {
     Gemini3Flash = "gemini-3-flash-preview",
     Gemini3Pro = "gemini-3.1-pro-preview",
     Gemini3ProImage = "gemini-3-pro-image-preview",
+    Gemini31FlashImage = "gemini-3.1-flash-image-preview",
+    Gemini31FlashTTS = "gemini-3.1-flash-tts-preview",
+    NanoBanana2 = "nano-banana-2",
+    GeminiRoboticsER16 = "gemini-robotics-er-1.6-preview",
     Gemini25Pro = "gemini-2.5-pro",
     Gemini25Flash = "gemini-2.5-flash",
     Gemini25FlashNativeAudio = "gemini-2.5-flash-native-audio-preview-12-2025",
@@ -6967,7 +6984,6 @@ declare enum AxAIGoogleGeminiEmbedModel {
     GeminiEmbedding001 = "gemini-embedding-001",
     GeminiEmbedding = "gemini-embedding-exp",
     TextEmbeddingLarge = "text-embedding-large-exp-03-07",
-    TextEmbedding004 = "text-embedding-004",
     TextEmbedding005 = "text-embedding-005"
 }
 declare enum AxAIGoogleGeminiSafetyCategory {
@@ -7123,6 +7139,14 @@ type AxAIGoogleGeminiChatResponse = {
                     title?: string;
                     uri?: string;
                 };
+                retrievedContext?: {
+                    title?: string;
+                    uri?: string;
+                    /** File Search multimodal (May 2026): id of the file/media chunk. */
+                    media_id?: string;
+                    /** File Search multimodal (May 2026): page numbers cited within the source. */
+                    page_numbers?: number[];
+                };
             }[];
             googleMapsWidgetContextToken?: string;
         };
@@ -7527,6 +7551,8 @@ declare enum AxAIOpenAIResponsesModel {
     GPT54 = "gpt-5.4",
     GPT54Mini = "gpt-5.4-mini",
     GPT54Nano = "gpt-5.4-nano",
+    GPT55 = "gpt-5.5",
+    GPT55Pro = "gpt-5.5-pro",
     O1Pro = "o1-pro",
     O1 = "o1",
     O1Mini = "o1-mini",
@@ -7592,14 +7618,14 @@ interface AxAIOpenAIResponsesRequest<TModel = AxAIOpenAIResponsesModel> {
     readonly input: string | ReadonlyArray<AxAIOpenAIResponsesInputItem>;
     readonly model: TModel;
     readonly background?: boolean | null;
-    readonly include?: ReadonlyArray<'file_search_call.results' | 'message.input_image.image_url' | 'computer_call_output.output.image_url' | 'reasoning.encrypted_content' | 'code_interpreter_call.outputs'> | null;
+    readonly include?: ReadonlyArray<'file_search_call.results' | 'message.input_image.image_url' | 'computer_call_output.output.image_url' | 'reasoning.encrypted_content' | 'code_interpreter_call.outputs' | 'web_search_call.action.return_token_budget'> | null;
     readonly instructions?: string | null;
     readonly max_output_tokens?: number | null;
     readonly metadata?: Readonly<Record<string, string>> | null;
     readonly parallel_tool_calls?: boolean | null;
     readonly previous_response_id?: string | null;
     readonly reasoning?: {
-        readonly effort?: 'minimal' | 'low' | 'medium' | 'high' | null;
+        readonly effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh' | null;
         readonly summary?: 'auto' | 'concise' | 'detailed' | null;
     } | null;
     readonly service_tier?: 'auto' | 'default' | 'flex' | null;
@@ -7629,6 +7655,7 @@ interface AxAIOpenAIResponsesOutputMessageItem {
     role: 'assistant';
     content: ReadonlyArray<AxAIOpenAIResponsesOutputTextContentPart | AxAIOpenAIResponsesOutputRefusalContentPart>;
     status: 'in_progress' | 'completed' | 'incomplete';
+    phase?: 'commentary' | 'final_answer';
 }
 interface AxAIOpenAIResponsesFunctionCallItem {
     type: 'function_call';
@@ -7978,7 +8005,7 @@ type AxAIOpenAIResponsesConfig<TModel, TEmbedModel> = Omit<AxModelConfig, 'topK'
     logprobs?: number;
     echo?: boolean;
     dimensions?: number;
-    reasoningEffort?: 'minimal' | 'low' | 'medium' | 'high';
+    reasoningEffort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
     reasoningSummary?: 'auto' | 'concise' | 'detailed';
     store?: boolean;
     systemPrompt?: string;

package/index.d.ts CHANGED Viewed

@@ -2427,6 +2427,7 @@ declare class AxBaseAI<TModel, TEmbedModel, TChatRequest, TEmbedRequest, TChatRe
     private calculatePercentile;
     private updateLatencyMetrics;
     private updateErrorMetrics;
+    private recordEstimatedCost;
     private recordTokenUsage;
     private calculateRequestSize;
     private calculateResponseSize;
@@ -2535,6 +2536,9 @@ type AxModelInfo = {
     maxTokens?: number;
     isExpensive?: boolean;
     contextWindow?: number;
+    isDeprecated?: boolean;
+    /** ISO date (YYYY-MM-DD) the upstream provider will stop serving this model. */
+    deprecatedOn?: string;
 };
 type AxTokenUsage = {
     promptTokens: number;
@@ -2755,6 +2759,10 @@ type AxCitation = {
     license?: string;
     publicationDate?: string;
     snippet?: string;
+    /** File Search multimodal (Gemini, May 2026): media chunk id. */
+    mediaId?: string;
+    /** File Search multimodal (Gemini, May 2026): page numbers cited within the source. */
+    pageNumbers?: number[];
 };
 type AxModelUsage = {
     ai: string;
@@ -4305,9 +4313,9 @@ declare class AxSignature<_TInput extends Record<string, any> = Record<string, a
 declare const promptTemplates: {
     readonly 'dsp/dspy.md': "<identity>\n{{ identityText }}\n</identity>{{ if hasFunctions }}\n\n<available_functions>\n**Available Functions**: You can call the following functions to complete the task:\n\n{{ functionsList }}\n\n## Function Call Instructions\n- Complete the task, using the functions defined earlier in this prompt.\n- Output fields should only be generated after all functions have been called.\n- Use the function results to generate the output fields.\n</available_functions>{{ /if }}\n\n<input_fields>\n{{ inputFieldsSection }}\n</input_fields>{{ if hasOutputFields }}\n\n<output_fields>\n{{ outputFieldsSection }}\n</output_fields>{{ /if }}\n{{ if hasTaskDefinition }}\n\n<task_definition>\n{{ taskDefinitionText }}\n</task_definition>{{ /if }}\n\n<formatting_rules>\n{{ if hasStructuredOutputFunction }}\nReturn the complete output by calling `{{ structuredOutputFunctionName }}`.\n{{ else }}{{ if hasComplexFields }}\nReturn valid JSON matching <output_fields>.\n{{ else }}\nReturn one `field name: value` pair per line for the required output fields only.\n{{ /if }}{{ /if }}Above rules override later instructions.\n\n</formatting_rules>\n{{ if hasExampleDemonstrations }}\n\n## Example Demonstrations\nThe following User/Assistant turns are examples only until --- END OF EXAMPLES ---, not context for the current task.\n{{ /if }}\n";
     readonly 'dsp/example-separator.md': "--- END OF EXAMPLES ---\nThe examples above were for training purposes only. Please ignore any specific entities or facts mentioned in them.\n\nREAL USER QUERY:\n";
-    readonly 'rlm/distiller.md': "## Distiller\n\nYou (`distiller`) read the available context and forward an actionable request to the downstream **executor** stage (which has the tools — shell, file system, agent functions, etc.). You do not execute the task yourself.\n\nCall `final(request, evidence)` to forward. Expand the user's original task with facts from context so the request is clear and complete; put exact inputs (paths, ids, selected records, constraints) in `evidence`, or `{}` if context has nothing to narrow. Resolve follow-ups against prior conversation. Never refuse with \"I have no tools\" — forwarding *is* the response. Use `askClarification` only when genuinely blocked by ambiguity.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Context Fields\n\nContext fields are available as globals (in the REPL) on the `inputs` object:\n{{ contextVarList }}\n\n### Available Functions\n\n{{ primitivesList }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded. Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn (and forwarded to the executor).\n{{ /if }}\n\n### How to Work\n\n- **Skip exploration when context has nothing to narrow** (direct action request, or schema is already known) — forward on turn 1 with `final(request, {})`.\n- **When narrowing**: probe shape, narrow with JS, extract. Don't dump raw data. Don't repeat probes already in the Action Log.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret a narrowed slice — never pass raw `inputs.*` to it.\n- `console.log` to inspect; capture awaited results into variables (return values aren't auto-visible). 
Multiple `console.log`s per turn is fine.\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst interpretation = await llmQuery([{\n  query: 'Classify each as billing_dispute | unauthorized_charge | other. JSON list.',\n  context: { emails: narrowed }\n}]);\nconsole.log(interpretation);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nValid completion turns:\n\n```js\nawait final(\"Use the matched emails to answer the user's question\", { matchedEmails });\n```\n\n```js\n// Passthrough — user asked for an action and there's nothing in context to narrow.\nawait final(\"Run the shell command `ls -la` and return its output verbatim\", {});\n```\n\n```js\nawait askClarification(\"Which context should I inspect?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
-    readonly 'rlm/executor.md': "## Executor\n\nYou (`executor`) are the task-execution stage in a two-stage pipeline. Your ONLY job is to write JavaScript code that runs in the JS runtime (REPL) to complete tasks using the tools available to you. A separate (`responder`) agent downstream synthesizes the final answer.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Executor Request & Distilled Context\n\nThe prior distiller stage produced two extra inputs:\n\n- `inputs.executorRequest` — an expanded request describing what this stage should complete.\n- `inputs.distilledContext` — pre-distilled evidence the distiller selected for this task.\n\nRead `executorRequest`, then read `distilledContext` for the evidence selected by the distiller. Raw context fields are not available in this stage. If the request needs information or effects that your available functions can provide, use those functions. If the distilled evidence is sufficient, finish directly with `final(...)`. Call `askClarification(...)` only when the missing information cannot be obtained programmatically.\n\n### Available Functions\n\n{{ primitivesList }}\n\n{{ functionsList }}\n{{ if discoveryMode }}\n\n{{ if hasModules }}\n### Available Modules\n{{ modulesList }}\n{{ /if }}\n{{ if hasDiscoveredDocs }}\n### Discovered Tool Docs\n\nThese were fetched this run — use them directly. Only re-run discovery for modules/functions not listed here.\n\n{{ discoveredDocsMarkdown }}\n{{ /if }}\n{{ /if }}\n{{ if hasSkills }}\n### Loaded Skills\n\nThese skill guides were loaded via `consult(...)` — apply them directly. 
Call `consult([...])` to load additional skills as needed.\n\n{{ skillsMarkdown }}\n{{ /if }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded (including any the distiller forwarded). Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn.\n{{ /if }}\n\n### How to Work\n\n- Start from `inputs.executorRequest`, `inputs.distilledContext`, non-context task inputs, and prior successful Action Log results. Don't repeat probes already in the Action Log.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret narrowed text — never pass raw `inputs.*` to it.\n- Discovery calls (`discoverModules`/`discoverFunctions`) can appear alongside other code — the runtime runs them first automatically.\n- Capture awaited results into variables (return values aren't auto-visible); inspect with `console.log(result)` or finish with `await final(\"...\", { result })`. Multiple `console.log`s per turn is fine.\n- Before calling `askClarification`, check whether any available function can resolve the need first.\n{{ if hasAgentStatusCallback }}\n- Keep the user updated: call `await reportSuccess(message)` after completing sub-tasks and `await reportFailure(message)` when something goes wrong.\n{{ /if }}\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst plan = await llmQuery([{\n  query: 'Determine which messages require a refund response and draft a compact action plan.',\n  context: { emails: narrowed }\n}]);\nconsole.log(plan);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. 
Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nWhen done, call `await final(task, evidence)`:\n\n- `task` — a one-line instruction the **responder** will follow when writing the user-facing output fields (e.g. \"Answer the user's question using the matched emails\").\n- `evidence` — the curated data the responder will read to follow `task`. Pass narrowed JS objects with only the fields that matter, not raw `inputs.*`. Use plain keys (`{ matchedEmails: [...] }`) — don't wrap under the output field name.\n\nDo not pre-format the answer; the responder writes the output fields.\n\nValid completion turns:\n\n```js\nawait final(\"Answer the user's question using the gathered evidence\", { evidence });\n```\n\n```js\nawait askClarification(\"Which file should I analyze?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
-    readonly 'rlm/responder.md': "## Answer Synthesis Agent\n\nYou synthesize the final answer from the evidence the actor gathered. You do not run code, call tools, or invoke agents — you read input fields and write the output fields.\n\n### Reading the actor's payload\n\n`Context Data` has two keys:\n\n- `task` — a one-line instruction telling you what to write into the output fields.\n- `evidence` — the data the actor curated for you to follow that instruction.\n\n### Rules\n\n1. Follow `Context Data.task` using `Context Data.evidence` and any other input fields provided.\n2. When emitting a JSON output field, write the value flat — do **not** wrap it under a key matching the field's title. The field is already named.\n3. If `evidence` lacks sufficient information, give the best possible answer from what's available across all input fields.\n\n### Context variables that were analyzed (metadata only)\n{{ contextVarSummary }}\n{{ if hasAgentIdentity }}\n\n### Agent Identity\n\nUser-facing identity:\n{{ agentIdentityText }}\n{{ /if }}\n";
+    readonly 'rlm/distiller.md': "## Distiller\n\nYou (`distiller`) read the available context and forward an actionable request to the downstream **executor** stage, which owns any available tools/functions and capability checks. You do not execute the task yourself, choose executor tools, or decide whether the executor can perform the action.\n\nCall `final(request, evidence)` to forward. Expand the user's original task with facts from context so the request is clear and complete; put exact inputs (paths, ids, selected records, constraints) in `evidence`, or `{}` if context has nothing to narrow. Resolve follow-ups against prior conversation. Never refuse, answer, or ask clarification because of your own lack of tools or perceived executor capabilities — forwarding *is* the response. Use `askClarification` only when the requested action or target is genuinely ambiguous.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Context Fields\n\nContext fields are available as globals (in the REPL) on the `inputs` object:\n{{ contextVarList }}\n\n### Available Functions\n\n{{ primitivesList }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded. Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn (and forwarded to the executor).\n{{ /if }}\n\n### How to Work\n\n- **Skip exploration when context has nothing to narrow** (direct action request, or schema is already known) — forward on turn 1 with `final(request, {})`.\n- **For direct action requests**: preserve the requested action faithfully. 
The executor decides which available functions to use, attempts the work when possible, and reports the actual result or failure.\n- **When narrowing**: probe shape, narrow with JS, extract. Don't dump raw data. Don't repeat probes already in the Action Log.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret a narrowed slice — never pass raw `inputs.*` to it.\n- `console.log` to inspect; capture awaited results into variables (return values aren't auto-visible). Multiple `console.log`s per turn is fine.\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst interpretation = await llmQuery([{\n  query: 'Classify each as billing_dispute | unauthorized_charge | other. JSON list.',\n  context: { emails: narrowed }\n}]);\nconsole.log(interpretation);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nValid completion turns:\n\n```js\nawait final(\"Use the matched emails to answer the user's question\", { matchedEmails });\n```\n\n```js\n// Passthrough — user asked for an action and there's nothing in context to narrow.\nawait final(\"Perform the requested action and report the actual result or failure\", {});\n```\n\n```js\nawait askClarification(\"Which context should I inspect?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
+    readonly 'rlm/executor.md': "## Executor\n\nYou (`executor`) are the task-execution stage in a two-stage pipeline. Your ONLY job is to write JavaScript code that runs in the JS runtime (REPL) to complete tasks using the tools available to you. A separate (`responder`) agent downstream synthesizes the final answer.\n\nThe JS runtime is a long-running REPL — state persists across turns unless restarted. Each **turn**: write code → it executes → you see output → write the next block.\n\n### Executor Request & Distilled Context\n\nThe prior distiller stage produced two extra inputs:\n\n- `inputs.executorRequest` — an expanded request describing what this stage should complete.\n- `inputs.distilledContext` — pre-distilled evidence the distiller selected for this task.\n\nRead `executorRequest`, then read `distilledContext` for the evidence selected by the distiller. Raw context fields are not available in this stage. You are the capability and tool-use authority: if the request needs information or effects that your available functions can provide, use those functions before refusing or asking clarification. If the distilled evidence is sufficient, finish directly with `final(...)`. Call `askClarification(...)` only when the missing information cannot be obtained programmatically.\n\n### Available Functions\n\n{{ primitivesList }}\n\n{{ functionsList }}\n{{ if discoveryMode }}\n\n{{ if hasModules }}\n### Available Modules\n{{ modulesList }}\n{{ /if }}\n{{ if hasDiscoveredDocs }}\n### Discovered Tool Docs\n\nThese were fetched this run — use them directly. Only re-run discovery for modules/functions not listed here.\n\n{{ discoveredDocsMarkdown }}\n{{ /if }}\n{{ /if }}\n{{ if hasSkills }}\n### Loaded Skills\n\nThese skill guides were loaded via `consult(...)` — apply them directly. 
Call `consult([...])` to load additional skills as needed.\n\n{{ skillsMarkdown }}\n{{ /if }}\n{{ if memoriesMode }}\n\n### Memories\n\n`inputs.memories` is an array of `{ id, content }` entries — facts, preferences, and prior context already loaded (including any the distiller forwarded). Scan it before deciding what to do. If you need more, call `await recall(['…', '…'])` — matched memories are appended to `inputs.memories` for the next turn.\n{{ /if }}\n\n### How to Work\n\n- Start from `inputs.executorRequest`, `inputs.distilledContext`, non-context task inputs, and prior successful Action Log results. Don't repeat probes already in the Action Log.\n- Treat direct action requests as work to attempt with available functions. If a function fails or the environment denies the action, capture the real error, status, output, or exception in the evidence for the responder.\n- **Use JS** for deterministic work (filter, sort, slice, regex, dedupe). **Use `llmQuery`** only to interpret narrowed text — never pass raw `inputs.*` to it.\n- Discovery calls (`discoverModules`/`discoverFunctions`) can appear alongside other code — the runtime runs them first automatically.\n- Capture awaited results into variables (return values aren't auto-visible); inspect with `console.log(result)` or finish with `await final(\"...\", { result })`. 
Multiple `console.log`s per turn is fine.\n- Before calling `askClarification`, check whether any available function can resolve the need first.\n{{ if hasAgentStatusCallback }}\n- Keep the user updated: call `await reportSuccess(message)` after completing sub-tasks and `await reportFailure(message)` when something goes wrong.\n{{ /if }}\n\n```js\nconst narrowed = inputs.emails\n  .filter(e => e.subject.toLowerCase().includes('refund'))\n  .map(e => ({ from: e.from, subject: e.subject, body: e.body.slice(0, 800) }));\n\nconst plan = await llmQuery([{\n  query: 'Determine which messages require a refund response and draft a compact action plan.',\n  context: { emails: narrowed }\n}]);\nconsole.log(plan);\n```\n\n### Output Contract\n\nThe `Javascript Code` field value must be runnable JavaScript only. Do not put prose or plain labels like `task:` / `evidence:` inside the value. Never combine `console.log` with `final()` or `askClarification()` in the same turn.\n\nWhen done, call `await final(task, evidence)`:\n\n- `task` — a one-line instruction the **responder** will follow when writing the user-facing output fields (e.g. \"Answer the user's question using the matched emails\").\n- `evidence` — the curated data the responder will read to follow `task`. Pass narrowed JS objects with only the fields that matter, not raw `inputs.*`. Use plain keys (`{ matchedEmails: [...] }`) — don't wrap under the output field name.\n\nDo not pre-format the answer; the responder writes the output fields.\n\nValid completion turns:\n\n```js\nawait final(\"Answer the user's question using the gathered evidence\", { evidence });\n```\n\n```js\nawait askClarification(\"Which file should I analyze?\");\n```\n\n## JavaScript Runtime Usage Instructions\n{{ runtimeUsageInstructions }}\n";
+    readonly 'rlm/responder.md': "## Answer Synthesis Agent\n\nYou synthesize the final answer from the evidence the actor gathered. You do not run code, call tools, or invoke agents — you read input fields and write the output fields.\n\n### Reading the actor's payload\n\n`Context Data` has two keys:\n\n- `task` — a one-line instruction telling you what to write into the output fields.\n- `evidence` — the data the actor curated for you to follow that instruction.\n\n### Rules\n\n1. Follow `Context Data.task` using `Context Data.evidence` and any other input fields provided.\n2. When emitting a JSON output field, write the value flat — do **not** wrap it under a key matching the field's title. The field is already named.\n3. If `evidence` lacks sufficient information, give the best possible answer from what's available across all input fields.\n4. Do not contradict actor evidence. If evidence contains a tool result, failure, status, output, or exception, report that result rather than inventing a capability limit.\n\n### Context variables that were analyzed (metadata only)\n{{ contextVarSummary }}\n{{ if hasAgentIdentity }}\n\n### Agent Identity\n\nUser-facing identity:\n{{ agentIdentityText }}\n{{ /if }}\n";
 };
 type TemplateId = keyof typeof promptTemplates;
@@ -5709,6 +5717,10 @@ type AxAIAnthropicThinkingWire = {
 type AxAIAnthropicEffortLevel = 'low' | 'medium' | 'high' | 'max';
 type AxAIAnthropicOutputConfig = {
     effort?: AxAIAnthropicEffortLevel;
+    format?: {
+        type: 'json_schema';
+        schema: object;
+    };
 };
 type AxAIAnthropicEffortLevelMapping = {
     minimal?: AxAIAnthropicEffortLevel;
@@ -5771,7 +5783,7 @@ type AxAIAnthropicChatRequest = {
                 media_type: string;
                 data: string;
             };
-        } & AxAIAnthropicChatRequestCacheParam) | {
+        } & AxAIAnthropicChatRequestCacheParam) | ({
             type: 'tool_result';
             is_error?: boolean;
             tool_use_id: string;
@@ -5786,7 +5798,7 @@ type AxAIAnthropicChatRequest = {
                     data: string;
                 };
             } & AxAIAnthropicChatRequestCacheParam))[];
-        })[];
+        } & AxAIAnthropicChatRequestCacheParam))[];
     } | {
         role: 'assistant';
         content: string | (({
@@ -5826,10 +5838,6 @@ type AxAIAnthropicChatRequest = {
     top_k?: number;
     thinking?: AxAIAnthropicThinkingWire;
     output_config?: AxAIAnthropicOutputConfig;
-    output_format?: {
-        type: 'json_schema';
-        schema: object;
-    };
     metadata?: {
         user_id: string;
     };
@@ -6003,8 +6011,11 @@ declare enum AxAIOpenAIModel {
     GPT4OMini = "gpt-4o-mini",
     GPTAudio = "gpt-audio",
     GPTAudioMini = "gpt-audio-mini",
+    GPTAudio15 = "gpt-audio-1.5",
+    GPTRealtime15 = "gpt-realtime-1.5",
     GPTRealtime2 = "gpt-realtime-2",
     GPTRealtimeWhisper = "gpt-realtime-whisper",
+    GPTRealtimeTranslate = "gpt-realtime-translate",
     GPT4ChatGPT4O = "chatgpt-4o-latest",
     GPT4Turbo = "gpt-4-turbo",
     GPT35Turbo = "gpt-3.5-turbo",
@@ -6031,6 +6042,8 @@ declare enum AxAIOpenAIModel {
     GPT54 = "gpt-5.4",
     GPT54Mini = "gpt-5.4-mini",
     GPT54Nano = "gpt-5.4-nano",
+    GPT55 = "gpt-5.5",
+    GPT55Pro = "gpt-5.5-pro",
     O1 = "o1",
     O1Mini = "o1-mini",
     O3 = "o3",
@@ -6063,7 +6076,7 @@ type AxAIOpenAIConfig<TModel, TEmbedModel> = Omit<AxModelConfig, 'topK'> & {
     logprobs?: number;
     echo?: boolean;
     dimensions?: number;
-    reasoningEffort?: 'minimal' | 'low' | 'medium' | 'high';
+    reasoningEffort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
     store?: boolean;
     serviceTier?: 'auto' | 'default' | 'flex';
     webSearchOptions?: {
@@ -6111,7 +6124,7 @@ interface AxAIOpenAIResponseDelta<T> {
 }
 type AxAIOpenAIChatRequest<TModel> = {
     model: TModel;
-    reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high';
+    reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
     store?: boolean;
     modalities?: readonly ('text' | 'audio')[];
     audio?: {
@@ -6946,6 +6959,10 @@ declare enum AxAIGoogleGeminiModel {
     Gemini3Flash = "gemini-3-flash-preview",
     Gemini3Pro = "gemini-3.1-pro-preview",
     Gemini3ProImage = "gemini-3-pro-image-preview",
+    Gemini31FlashImage = "gemini-3.1-flash-image-preview",
+    Gemini31FlashTTS = "gemini-3.1-flash-tts-preview",
+    NanoBanana2 = "nano-banana-2",
+    GeminiRoboticsER16 = "gemini-robotics-er-1.6-preview",
     Gemini25Pro = "gemini-2.5-pro",
     Gemini25Flash = "gemini-2.5-flash",
     Gemini25FlashNativeAudio = "gemini-2.5-flash-native-audio-preview-12-2025",
@@ -6967,7 +6984,6 @@ declare enum AxAIGoogleGeminiEmbedModel {
     GeminiEmbedding001 = "gemini-embedding-001",
     GeminiEmbedding = "gemini-embedding-exp",
     TextEmbeddingLarge = "text-embedding-large-exp-03-07",
-    TextEmbedding004 = "text-embedding-004",
     TextEmbedding005 = "text-embedding-005"
 }
 declare enum AxAIGoogleGeminiSafetyCategory {
@@ -7123,6 +7139,14 @@ type AxAIGoogleGeminiChatResponse = {
                     title?: string;
                     uri?: string;
                 };
+                retrievedContext?: {
+                    title?: string;
+                    uri?: string;
+                    /** File Search multimodal (May 2026): id of the file/media chunk. */
+                    media_id?: string;
+                    /** File Search multimodal (May 2026): page numbers cited within the source. */
+                    page_numbers?: number[];
+                };
             }[];
             googleMapsWidgetContextToken?: string;
         };
@@ -7527,6 +7551,8 @@ declare enum AxAIOpenAIResponsesModel {
     GPT54 = "gpt-5.4",
     GPT54Mini = "gpt-5.4-mini",
     GPT54Nano = "gpt-5.4-nano",
+    GPT55 = "gpt-5.5",
+    GPT55Pro = "gpt-5.5-pro",
     O1Pro = "o1-pro",
     O1 = "o1",
     O1Mini = "o1-mini",
@@ -7592,14 +7618,14 @@ interface AxAIOpenAIResponsesRequest<TModel = AxAIOpenAIResponsesModel> {
     readonly input: string | ReadonlyArray<AxAIOpenAIResponsesInputItem>;
     readonly model: TModel;
     readonly background?: boolean | null;
-    readonly include?: ReadonlyArray<'file_search_call.results' | 'message.input_image.image_url' | 'computer_call_output.output.image_url' | 'reasoning.encrypted_content' | 'code_interpreter_call.outputs'> | null;
+    readonly include?: ReadonlyArray<'file_search_call.results' | 'message.input_image.image_url' | 'computer_call_output.output.image_url' | 'reasoning.encrypted_content' | 'code_interpreter_call.outputs' | 'web_search_call.action.return_token_budget'> | null;
     readonly instructions?: string | null;
     readonly max_output_tokens?: number | null;
     readonly metadata?: Readonly<Record<string, string>> | null;
     readonly parallel_tool_calls?: boolean | null;
     readonly previous_response_id?: string | null;
     readonly reasoning?: {
-        readonly effort?: 'minimal' | 'low' | 'medium' | 'high' | null;
+        readonly effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh' | null;
         readonly summary?: 'auto' | 'concise' | 'detailed' | null;
     } | null;
     readonly service_tier?: 'auto' | 'default' | 'flex' | null;
@@ -7629,6 +7655,7 @@ interface AxAIOpenAIResponsesOutputMessageItem {
     role: 'assistant';
     content: ReadonlyArray<AxAIOpenAIResponsesOutputTextContentPart | AxAIOpenAIResponsesOutputRefusalContentPart>;
     status: 'in_progress' | 'completed' | 'incomplete';
+    phase?: 'commentary' | 'final_answer';
 }
 interface AxAIOpenAIResponsesFunctionCallItem {
     type: 'function_call';
@@ -7978,7 +8005,7 @@ type AxAIOpenAIResponsesConfig<TModel, TEmbedModel> = Omit<AxModelConfig, 'topK'
     logprobs?: number;
     echo?: boolean;
     dimensions?: number;
-    reasoningEffort?: 'minimal' | 'low' | 'medium' | 'high';
+    reasoningEffort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
     reasoningSummary?: 'auto' | 'concise' | 'detailed';
     store?: boolean;
     systemPrompt?: string;