npm - @ai-sdk/openai - Versions diffs - 4.0.0-beta.7 → 4.0.0-beta.74 - Mend

@ai-sdk/openai 4.0.0-beta.7 → 4.0.0-beta.74

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (73)

package/CHANGELOG.md +636 -24
package/README.md +2 -0
package/dist/index.d.ts +240 -44
package/dist/index.js +3345 -1683
package/dist/index.js.map +1 -1
package/dist/internal/index.d.ts +390 -36
package/dist/internal/index.js +2707 -1706
package/dist/internal/index.js.map +1 -1
package/docs/03-openai.mdx +413 -39
package/package.json +16 -17
package/src/chat/convert-openai-chat-usage.ts +1 -1
package/src/chat/convert-to-openai-chat-messages.ts +96 -68
package/src/chat/map-openai-finish-reason.ts +1 -1
package/src/chat/openai-chat-api.ts +6 -2
package/src/chat/{openai-chat-options.ts → openai-chat-language-model-options.ts} +11 -1
package/src/chat/openai-chat-language-model.ts +82 -148
package/src/chat/openai-chat-prepare-tools.ts +3 -3
package/src/completion/convert-openai-completion-usage.ts +1 -1
package/src/completion/convert-to-openai-completion-prompt.ts +1 -2
package/src/completion/map-openai-finish-reason.ts +1 -1
package/src/completion/openai-completion-api.ts +5 -2
package/src/completion/{openai-completion-options.ts → openai-completion-language-model-options.ts} +5 -1
package/src/completion/openai-completion-language-model.ts +53 -17
package/src/embedding/{openai-embedding-options.ts → openai-embedding-model-options.ts} +5 -1
package/src/embedding/openai-embedding-model.ts +22 -5
package/src/files/openai-files-api.ts +17 -0
package/src/files/openai-files-options.ts +22 -0
package/src/files/openai-files.ts +100 -0
package/src/image/openai-image-model-options.ts +123 -0
package/src/image/openai-image-model.ts +62 -83
package/src/index.ts +15 -6
package/src/internal/index.ts +7 -6
package/src/openai-config.ts +7 -7
package/src/openai-language-model-capabilities.ts +5 -4
package/src/openai-provider.ts +80 -9
package/src/openai-stream-error.ts +181 -0
package/src/openai-tools.ts +12 -1
package/src/realtime/index.ts +2 -0
package/src/realtime/openai-realtime-event-mapper.ts +436 -0
package/src/realtime/openai-realtime-model-options.ts +3 -0
package/src/realtime/openai-realtime-model.ts +111 -0
package/src/responses/convert-openai-responses-usage.ts +1 -1
package/src/responses/convert-to-openai-responses-input.ts +345 -90
package/src/responses/map-openai-responses-finish-reason.ts +1 -1
package/src/responses/openai-responses-api.ts +186 -17
package/src/responses/{openai-responses-options.ts → openai-responses-language-model-options.ts} +55 -1
package/src/responses/openai-responses-language-model.ts +330 -52
package/src/responses/openai-responses-prepare-tools.ts +129 -18
package/src/responses/openai-responses-provider-metadata.ts +12 -2
package/src/skills/openai-skills-api.ts +31 -0
package/src/skills/openai-skills.ts +83 -0
package/src/speech/{openai-speech-options.ts → openai-speech-model-options.ts} +5 -1
package/src/speech/openai-speech-model.ts +23 -7
package/src/tool/apply-patch.ts +33 -32
package/src/tool/code-interpreter.ts +40 -41
package/src/tool/custom.ts +2 -8
package/src/tool/file-search.ts +3 -3
package/src/tool/image-generation.ts +2 -2
package/src/tool/local-shell.ts +2 -2
package/src/tool/mcp.ts +3 -3
package/src/tool/shell.ts +9 -4
package/src/tool/tool-search.ts +98 -0
package/src/tool/web-search-preview.ts +2 -2
package/src/tool/web-search.ts +10 -2
package/src/transcription/{openai-transcription-options.ts → openai-transcription-model-options.ts} +5 -1
package/src/transcription/openai-transcription-model.ts +35 -13
package/dist/index.d.mts +0 -1107
package/dist/index.mjs +0 -6509
package/dist/index.mjs.map +0 -1
package/dist/internal/index.d.mts +0 -1137
package/dist/internal/index.mjs +0 -6322
package/dist/internal/index.mjs.map +0 -1
package/src/image/openai-image-options.ts +0 -31

package/src/tool/local-shell.ts CHANGED

@@ -1,5 +1,5 @@
 import {
-  createProviderToolFactoryWithOutputSchema,
+  createProviderDefinedToolFactoryWithOutputSchema,
   lazySchema,
   zodSchema,
 } from '@ai-sdk/provider-utils';
@@ -24,7 +24,7 @@ export const localShellOutputSchema = lazySchema(() =>
   zodSchema(z.object({ output: z.string() })),
 );
-export const localShell = createProviderToolFactoryWithOutputSchema<
+export const localShell = createProviderDefinedToolFactoryWithOutputSchema<
   {
     /**
      * Execute a shell command on the server.

package/src/tool/mcp.ts CHANGED

@@ -1,9 +1,9 @@
 import {
-  createProviderToolFactoryWithOutputSchema,
+  createProviderExecutedToolFactory,
   lazySchema,
   zodSchema,
 } from '@ai-sdk/provider-utils';
-import { JSONValue } from '@ai-sdk/provider';
+import type { JSONValue } from '@ai-sdk/provider';
 import { z } from 'zod/v4';
 const jsonValueSchema: z.ZodType<JSONValue> = z.lazy(() =>
@@ -105,7 +105,7 @@ type McpArgs = {
   serverUrl?: string;
 };
-export const mcpToolFactory = createProviderToolFactoryWithOutputSchema<
+export const mcpToolFactory = createProviderExecutedToolFactory<
   {},
   {
     type: 'call';

package/src/tool/shell.ts CHANGED

@@ -1,8 +1,9 @@
 import {
-  createProviderToolFactoryWithOutputSchema,
+  createProviderDefinedToolFactoryWithOutputSchema,
   lazySchema,
   zodSchema,
 } from '@ai-sdk/provider-utils';
+import type { SharedV4ProviderReference } from '@ai-sdk/provider';
 import { z } from 'zod/v4';
 export const shellInputSchema = lazySchema(() =>
@@ -39,7 +40,7 @@ const shellSkillsSchema = z
     z.discriminatedUnion('type', [
       z.object({
         type: z.literal('skillReference'),
-        skillId: z.string(),
+        providerReference: z.record(z.string(), z.string()),
         version: z.string().optional(),
       }),
       z.object({
@@ -125,7 +126,11 @@ type ShellArgs = {
               }>;
             };
         skills?: Array<
-          | { type: 'skillReference'; skillId: string; version?: string }
+          | {
+              type: 'skillReference';
+              providerReference: SharedV4ProviderReference;
+              version?: string;
+            }
           | {
               type: 'inline';
               name: string;
@@ -152,7 +157,7 @@ type ShellArgs = {
       };
 };
-export const shell = createProviderToolFactoryWithOutputSchema<
+export const shell = createProviderDefinedToolFactoryWithOutputSchema<
   {
     /**
      * Shell tool action containing commands to execute.

package/src/tool/tool-search.ts ADDED

@@ -0,0 +1,98 @@
+import type { JSONObject } from '@ai-sdk/provider';
+import {
+  createProviderDefinedToolFactoryWithOutputSchema,
+  lazySchema,
+  zodSchema,
+  type FlexibleSchema,
+} from '@ai-sdk/provider-utils';
+import { z } from 'zod/v4';
+export const toolSearchArgsSchema = lazySchema(() =>
+  zodSchema(
+    z.object({
+      execution: z.enum(['server', 'client']).optional(),
+      description: z.string().optional(),
+      parameters: z.record(z.string(), z.unknown()).optional(),
+    }),
+  ),
+);
+export const toolSearchInputSchema = lazySchema(() =>
+  zodSchema(
+    z.object({
+      arguments: z.unknown().optional(),
+      call_id: z.string().nullish(),
+    }),
+  ),
+);
+export const toolSearchOutputSchema: FlexibleSchema<{
+  tools: Array<JSONObject>;
+}> = lazySchema(() =>
+  zodSchema(
+    z.object({
+      tools: z.array(z.record(z.string(), z.unknown())),
+    }),
+  ),
+) as FlexibleSchema<{ tools: Array<JSONObject> }>;
+const toolSearchToolFactory = createProviderDefinedToolFactoryWithOutputSchema<
+  {
+    /**
+     * The arguments from the tool_search_call.
+     * This is preserved for multi-turn conversation reconstruction.
+     */
+    arguments?: unknown;
+    /**
+     * The call ID from the tool_search_call.
+     * Present for client-executed tool search; null for hosted.
+     */
+    call_id?: string | null;
+  },
+  {
+    /**
+     * The tools that were loaded by the tool search.
+     * These are the deferred tools that the model requested to load.
+     * Each tool is represented as a JSON object with properties depending on its type.
+     *
+     * Common properties include:
+     * - `type`: The type of the tool (e.g., 'function', 'web_search', etc.)
+     * - `name`: The name of the tool (for function tools)
+     * - `description`: A description of the tool
+     * - `deferLoading`: Whether this tool was deferred (had defer_loading: true)
+     * - `parameters`: The JSON Schema for the function parameters (for function tools)
+     * - `strict`: Whether to enable strict schema adherence (for function tools)
+     */
+    tools: Array<JSONObject>;
+  },
+  {
+    /**
+     * Whether the tool search is executed by the server (hosted) or client.
+     * - `'server'` (default): OpenAI performs the search across deferred tools.
+     * - `'client'`: The model emits a `tool_search_call` and your `execute`
+     *   function performs the lookup, returning the tools to load.
+     */
+    execution?: 'server' | 'client';
+    /**
+     * A description of the tool search capability.
+     * Only used for client-executed tool search.
+     */
+    description?: string;
+    /**
+     * JSON Schema for the search arguments your application expects.
+     * Only used for client-executed tool search.
+     */
+    parameters?: Record<string, unknown>;
+  }
+>({
+  id: 'openai.tool_search',
+  inputSchema: toolSearchInputSchema,
+  outputSchema: toolSearchOutputSchema,
+});
+export const toolSearch = (
+  args: Parameters<typeof toolSearchToolFactory>[0] = {},
+) => toolSearchToolFactory(args);

package/src/tool/web-search-preview.ts CHANGED

@@ -1,5 +1,5 @@
 import {
-  createProviderToolFactoryWithOutputSchema,
+  createProviderExecutedToolFactory,
   lazySchema,
   zodSchema,
 } from '@ai-sdk/provider-utils';
@@ -50,7 +50,7 @@ const webSearchPreviewOutputSchema = lazySchema(() =>
   ),
 );
-export const webSearchPreview = createProviderToolFactoryWithOutputSchema<
+export const webSearchPreview = createProviderExecutedToolFactory<
   {
     // Web search preview doesn't take input parameters - it's controlled by the prompt
   },

package/src/tool/web-search.ts CHANGED

@@ -1,5 +1,5 @@
 import {
-  createProviderToolFactoryWithOutputSchema,
+  createProviderExecutedToolFactory,
   lazySchema,
   zodSchema,
 } from '@ai-sdk/provider-utils';
@@ -36,6 +36,7 @@ export const webSearchOutputSchema = lazySchema(() =>
           z.object({
             type: z.literal('search'),
             query: z.string().optional(),
+            queries: z.array(z.string()).optional(),
           }),
           z.object({
             type: z.literal('openPage'),
@@ -60,7 +61,7 @@ export const webSearchOutputSchema = lazySchema(() =>
   ),
 );
-export const webSearchToolFactory = createProviderToolFactoryWithOutputSchema<
+export const webSearchToolFactory = createProviderExecutedToolFactory<
   {
     // Web search doesn't take input parameters - it's controlled by the prompt
   },
@@ -78,8 +79,15 @@ export const webSearchToolFactory = createProviderToolFactoryWithOutputSchema<
           /**
            * The search query.
+           *
+           * @deprecated Use `queries` instead.
            */
           query?: string;
+          /**
+           * The search queries the model used.
+           */
+          queries?: string[];
         }
       | {
           /**

package/src/transcription/{openai-transcription-options.ts → openai-transcription-model-options.ts} RENAMED

@@ -1,4 +1,8 @@
-import { InferSchema, lazySchema, zodSchema } from '@ai-sdk/provider-utils';
+import {
+  lazySchema,
+  zodSchema,
+  type InferSchema,
+} from '@ai-sdk/provider-utils';
 import { z } from 'zod/v4';
 export type OpenAITranscriptionModelId =

package/src/transcription/openai-transcription-model.ts CHANGED

@@ -1,4 +1,4 @@
-import {
+import type {
   TranscriptionModelV4,
   TranscriptionModelV4CallOptions,
   SharedV4Warning,
@@ -10,16 +10,18 @@ import {
   mediaTypeToExtension,
   parseProviderOptions,
   postFormDataToApi,
+  serializeModelOptions,
+  WORKFLOW_DESERIALIZE,
+  WORKFLOW_SERIALIZE,
 } from '@ai-sdk/provider-utils';
-import { OpenAIConfig } from '../openai-config';
+import type { OpenAIConfig } from '../openai-config';
 import { openaiFailedResponseHandler } from '../openai-error';
 import { openaiTranscriptionResponseSchema } from './openai-transcription-api';
 import {
-  OpenAITranscriptionModelId,
   openAITranscriptionModelOptions,
-  OpenAITranscriptionModelOptions,
-} from './openai-transcription-options';
+  type OpenAITranscriptionModelId,
+  type OpenAITranscriptionModelOptions,
+} from './openai-transcription-model-options';
 export type OpenAITranscriptionCallOptions = Omit<
   TranscriptionModelV4CallOptions,
   'providerOptions'
@@ -99,6 +101,20 @@ const languageMap = {
 export class OpenAITranscriptionModel implements TranscriptionModelV4 {
   readonly specificationVersion = 'v4';
+  static [WORKFLOW_SERIALIZE](model: OpenAITranscriptionModel) {
+    return serializeModelOptions({
+      modelId: model.modelId,
+      config: model.config,
+    });
+  }
+  static [WORKFLOW_DESERIALIZE](options: {
+    modelId: OpenAITranscriptionModelId;
+    config: OpenAITranscriptionModelConfig;
+  }) {
+    return new OpenAITranscriptionModel(options.modelId, options.config);
+  }
   get provider(): string {
     return this.config.provider;
   }
@@ -137,20 +153,26 @@ export class OpenAITranscriptionModel implements TranscriptionModelV4 {
       `audio.${fileExtension}`,
     );
+    if (this.modelId === 'whisper-1') {
+      formData.append('response_format', 'verbose_json');
+    }
     // Add provider-specific options
     if (openAIOptions) {
+      const isGpt4oTranscribeModel = [
+        'gpt-4o-transcribe',
+        'gpt-4o-mini-transcribe',
+      ].includes(this.modelId);
       const transcriptionModelOptions = {
         include: openAIOptions.include,
         language: openAIOptions.language,
         prompt: openAIOptions.prompt,
         // https://platform.openai.com/docs/api-reference/audio/createTranscription#audio_createtranscription-response_format
         // prefer verbose_json to get segments for models that support it
-        response_format: [
-          'gpt-4o-transcribe',
-          'gpt-4o-mini-transcribe',
-        ].includes(this.modelId)
-          ? 'json'
-          : 'verbose_json',
+        ...(this.modelId !== 'whisper-1' && {
+          response_format: isGpt4oTranscribeModel ? 'json' : 'verbose_json',
+        }),
         temperature: openAIOptions.temperature,
         timestamp_granularities: openAIOptions.timestampGranularities,
       };
@@ -189,7 +211,7 @@ export class OpenAITranscriptionModel implements TranscriptionModelV4 {
         path: '/audio/transcriptions',
         modelId: this.modelId,
       }),
-      headers: combineHeaders(this.config.headers(), options.headers),
+      headers: combineHeaders(this.config.headers?.(), options.headers),
       formData,
       failedResponseHandler: openaiFailedResponseHandler,
       successfulResponseHandler: createJsonResponseHandler(