npm - @ai-sdk/openai - Versions diffs - 3.0.0-beta.102 → 3.0.0-beta.105 - Mend

@ai-sdk/openai 3.0.0-beta.102 → 3.0.0-beta.105

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the respective public registry.

Files changed (14)

package/CHANGELOG.md +21 -0
package/dist/index.d.mts +13 -1
package/dist/index.d.ts +13 -1
package/dist/index.js +146 -26
package/dist/index.js.map +1 -1
package/dist/index.mjs +154 -30
package/dist/index.mjs.map +1 -1
package/dist/internal/index.d.mts +5 -3
package/dist/internal/index.d.ts +5 -3
package/dist/internal/index.js +143 -25
package/dist/internal/index.js.map +1 -1
package/dist/internal/index.mjs +151 -29
package/dist/internal/index.mjs.map +1 -1
package/package.json +3 -3

package/dist/index.mjs CHANGED Viewed

@@ -43,7 +43,7 @@ var openaiFailedResponseHandler = createJsonErrorResponseHandler({
 function getOpenAILanguageModelCapabilities(modelId) {
   const supportsFlexProcessing = modelId.startsWith("o3") || modelId.startsWith("o4-mini") || modelId.startsWith("gpt-5") && !modelId.startsWith("gpt-5-chat");
   const supportsPriorityProcessing = modelId.startsWith("gpt-4") || modelId.startsWith("gpt-5-mini") || modelId.startsWith("gpt-5") && !modelId.startsWith("gpt-5-nano") && !modelId.startsWith("gpt-5-chat") || modelId.startsWith("o3") || modelId.startsWith("o4-mini");
-  const isReasoningModel = !(modelId.startsWith("gpt-3") || modelId.startsWith("gpt-4") || modelId.startsWith("chatgpt-4o") || modelId.startsWith("gpt-5-chat"));
+  const isReasoningModel = modelId.startsWith("o1") || modelId.startsWith("o3") || modelId.startsWith("o4-mini") || modelId.startsWith("codex-mini") || modelId.startsWith("computer-use-preview") || modelId.startsWith("gpt-5") && !modelId.startsWith("gpt-5-chat");
   const supportsNonReasoningParameters = modelId.startsWith("gpt-5.1") || modelId.startsWith("gpt-5.2");
   const systemMessageMode = isReasoningModel ? "developer" : "system";
   return {
@@ -545,7 +545,26 @@ var openaiChatLanguageModelOptions = lazySchema2(
        * username or email address, in order to avoid sending us any identifying
        * information.
        */
-      safetyIdentifier: z3.string().optional()
+      safetyIdentifier: z3.string().optional(),
+      /**
+       * Override the system message mode for this model.
+       * - 'system': Use the 'system' role for system messages (default for most models)
+       * - 'developer': Use the 'developer' role for system messages (used by reasoning models)
+       * - 'remove': Remove system messages entirely
+       *
+       * If not specified, the mode is automatically determined based on the model.
+       */
+      systemMessageMode: z3.enum(["system", "developer", "remove"]).optional(),
+      /**
+       * Force treating this model as a reasoning model.
+       *
+       * This is useful for "stealth" reasoning models (e.g. via a custom baseURL)
+       * where the model ID is not recognized by the SDK's allowlist.
+       *
+       * When enabled, the SDK applies reasoning-model parameter compatibility rules
+       * and defaults `systemMessageMode` to `developer` unless overridden.
+       */
+      forceReasoning: z3.boolean().optional()
     })
   )
 );
@@ -642,7 +661,7 @@ var OpenAIChatLanguageModel = class {
     toolChoice,
     providerOptions
   }) {
-    var _a, _b, _c;
+    var _a, _b, _c, _d, _e;
     const warnings = [];
     const openaiOptions = (_a = await parseProviderOptions({
       provider: "openai",
@@ -650,17 +669,18 @@ var OpenAIChatLanguageModel = class {
       schema: openaiChatLanguageModelOptions
     })) != null ? _a : {};
     const modelCapabilities = getOpenAILanguageModelCapabilities(this.modelId);
+    const isReasoningModel = (_b = openaiOptions.forceReasoning) != null ? _b : modelCapabilities.isReasoningModel;
     if (topK != null) {
       warnings.push({ type: "unsupported", feature: "topK" });
     }
     const { messages, warnings: messageWarnings } = convertToOpenAIChatMessages(
       {
         prompt,
-        systemMessageMode: modelCapabilities.systemMessageMode
+        systemMessageMode: (_c = openaiOptions.systemMessageMode) != null ? _c : isReasoningModel ? "developer" : modelCapabilities.systemMessageMode
       }
     );
     warnings.push(...messageWarnings);
-    const strictJsonSchema = (_b = openaiOptions.strictJsonSchema) != null ? _b : true;
+    const strictJsonSchema = (_d = openaiOptions.strictJsonSchema) != null ? _d : true;
     const baseArgs = {
       // model id:
       model: this.modelId,
@@ -681,7 +701,7 @@ var OpenAIChatLanguageModel = class {
         json_schema: {
           schema: responseFormat.schema,
           strict: strictJsonSchema,
-          name: (_c = responseFormat.name) != null ? _c : "response",
+          name: (_e = responseFormat.name) != null ? _e : "response",
           description: responseFormat.description
         }
       } : { type: "json_object" } : void 0,
@@ -702,7 +722,7 @@ var OpenAIChatLanguageModel = class {
       // messages:
       messages
     };
-    if (modelCapabilities.isReasoningModel) {
+    if (isReasoningModel) {
       if (openaiOptions.reasoningEffort !== "none" || !modelCapabilities.supportsNonReasoningParameters) {
         if (baseArgs.temperature != null) {
           baseArgs.temperature = void 0;
@@ -1678,7 +1698,11 @@ var OpenAIEmbeddingModel = class {
 // src/image/openai-image-model.ts
 import {
   combineHeaders as combineHeaders4,
+  convertBase64ToUint8Array,
+  convertToFormData,
   createJsonResponseHandler as createJsonResponseHandler4,
+  downloadBlob,
+  postFormDataToApi,
   postJsonToApi as postJsonToApi4
 } from "@ai-sdk/provider-utils";
@@ -1717,11 +1741,13 @@ var modelMaxImagesPerCall = {
   "dall-e-3": 1,
   "dall-e-2": 10,
   "gpt-image-1": 10,
-  "gpt-image-1-mini": 10
+  "gpt-image-1-mini": 10,
+  "gpt-image-1.5": 10
 };
 var hasDefaultResponseFormat = /* @__PURE__ */ new Set([
   "gpt-image-1",
-  "gpt-image-1-mini"
+  "gpt-image-1-mini",
+  "gpt-image-1.5"
 ]);
 // src/image/openai-image-model.ts
@@ -1740,6 +1766,8 @@ var OpenAIImageModel = class {
   }
   async doGenerate({
     prompt,
+    files,
+    mask,
     n,
     size,
     aspectRatio,
@@ -1748,7 +1776,7 @@ var OpenAIImageModel = class {
     headers,
     abortSignal
   }) {
-    var _a, _b, _c, _d, _e, _f, _g;
+    var _a, _b, _c, _d, _e, _f, _g, _h, _i, _j, _k;
     const warnings = [];
     if (aspectRatio != null) {
       warnings.push({
@@ -1761,6 +1789,72 @@ var OpenAIImageModel = class {
       warnings.push({ type: "unsupported", feature: "seed" });
     }
     const currentDate = (_c = (_b = (_a = this.config._internal) == null ? void 0 : _a.currentDate) == null ? void 0 : _b.call(_a)) != null ? _c : /* @__PURE__ */ new Date();
+    if (files != null) {
+      const { value: response2, responseHeaders: responseHeaders2 } = await postFormDataToApi({
+        url: this.config.url({
+          path: "/images/edits",
+          modelId: this.modelId
+        }),
+        headers: combineHeaders4(this.config.headers(), headers),
+        formData: convertToFormData({
+          model: this.modelId,
+          prompt,
+          image: await Promise.all(
+            files.map(
+              (file) => file.type === "file" ? new Blob(
+                [
+                  file.data instanceof Uint8Array ? new Blob([file.data], {
+                    type: file.mediaType
+                  }) : new Blob([convertBase64ToUint8Array(file.data)], {
+                    type: file.mediaType
+                  })
+                ],
+                { type: file.mediaType }
+              ) : downloadBlob(file.url)
+            )
+          ),
+          mask: mask != null ? await fileToBlob(mask) : void 0,
+          n,
+          size,
+          ...(_d = providerOptions.openai) != null ? _d : {}
+        }),
+        failedResponseHandler: openaiFailedResponseHandler,
+        successfulResponseHandler: createJsonResponseHandler4(
+          openaiImageResponseSchema
+        ),
+        abortSignal,
+        fetch: this.config.fetch
+      });
+      return {
+        images: response2.data.map((item) => item.b64_json),
+        warnings,
+        usage: response2.usage != null ? {
+          inputTokens: (_e = response2.usage.input_tokens) != null ? _e : void 0,
+          outputTokens: (_f = response2.usage.output_tokens) != null ? _f : void 0,
+          totalTokens: (_g = response2.usage.total_tokens) != null ? _g : void 0
+        } : void 0,
+        response: {
+          timestamp: currentDate,
+          modelId: this.modelId,
+          headers: responseHeaders2
+        },
+        providerMetadata: {
+          openai: {
+            images: response2.data.map((item) => {
+              var _a2, _b2, _c2, _d2, _e2;
+              return {
+                ...item.revised_prompt ? { revisedPrompt: item.revised_prompt } : {},
+                created: (_a2 = response2.created) != null ? _a2 : void 0,
+                size: (_b2 = response2.size) != null ? _b2 : void 0,
+                quality: (_c2 = response2.quality) != null ? _c2 : void 0,
+                background: (_d2 = response2.background) != null ? _d2 : void 0,
+                outputFormat: (_e2 = response2.output_format) != null ? _e2 : void 0
+              };
+            })
+          }
+        }
+      };
+    }
     const { value: response, responseHeaders } = await postJsonToApi4({
       url: this.config.url({
         path: "/images/generations",
@@ -1772,7 +1866,7 @@ var OpenAIImageModel = class {
         prompt,
         n,
         size,
-        ...(_d = providerOptions.openai) != null ? _d : {},
+        ...(_h = providerOptions.openai) != null ? _h : {},
         ...!hasDefaultResponseFormat.has(this.modelId) ? { response_format: "b64_json" } : {}
       },
       failedResponseHandler: openaiFailedResponseHandler,
@@ -1786,9 +1880,9 @@ var OpenAIImageModel = class {
       images: response.data.map((item) => item.b64_json),
       warnings,
       usage: response.usage != null ? {
-        inputTokens: (_e = response.usage.input_tokens) != null ? _e : void 0,
-        outputTokens: (_f = response.usage.output_tokens) != null ? _f : void 0,
-        totalTokens: (_g = response.usage.total_tokens) != null ? _g : void 0
+        inputTokens: (_i = response.usage.input_tokens) != null ? _i : void 0,
+        outputTokens: (_j = response.usage.output_tokens) != null ? _j : void 0,
+        totalTokens: (_k = response.usage.total_tokens) != null ? _k : void 0
       } : void 0,
       response: {
         timestamp: currentDate,
@@ -1813,6 +1907,14 @@ var OpenAIImageModel = class {
     };
   }
 };
+async function fileToBlob(file) {
+  if (!file) return void 0;
+  if (file.type === "url") {
+    return downloadBlob(file.url);
+  }
+  const data = file.data instanceof Uint8Array ? file.data : convertBase64ToUint8Array(file.data);
+  return new Blob([data], { type: file.mediaType });
+}
 // src/tool/apply-patch.ts
 import {
@@ -3675,7 +3777,26 @@ var openaiResponsesProviderOptionsSchema = lazySchema18(
        * Defaults to `undefined`.
        * @see https://platform.openai.com/docs/guides/safety-best-practices/end-user-ids
        */
-      user: z20.string().nullish()
+      user: z20.string().nullish(),
+      /**
+       * Override the system message mode for this model.
+       * - 'system': Use the 'system' role for system messages (default for most models)
+       * - 'developer': Use the 'developer' role for system messages (used by reasoning models)
+       * - 'remove': Remove system messages entirely
+       *
+       * If not specified, the mode is automatically determined based on the model.
+       */
+      systemMessageMode: z20.enum(["system", "developer", "remove"]).optional(),
+      /**
+       * Force treating this model as a reasoning model.
+       *
+       * This is useful for "stealth" reasoning models (e.g. via a custom baseURL)
+       * where the model ID is not recognized by the SDK's allowlist.
+       *
+       * When enabled, the SDK applies reasoning-model parameter compatibility rules
+       * and defaults `systemMessageMode` to `developer` unless overridden.
+       */
+      forceReasoning: z20.boolean().optional()
     })
   )
 );
@@ -3888,7 +4009,7 @@ var OpenAIResponsesLanguageModel = class {
     toolChoice,
     responseFormat
   }) {
-    var _a, _b, _c, _d;
+    var _a, _b, _c, _d, _e, _f;
     const warnings = [];
     const modelCapabilities = getOpenAILanguageModelCapabilities(this.modelId);
     if (topK != null) {
@@ -3911,6 +4032,7 @@ var OpenAIResponsesLanguageModel = class {
       providerOptions,
       schema: openaiResponsesProviderOptionsSchema
     });
+    const isReasoningModel = (_a = openaiOptions == null ? void 0 : openaiOptions.forceReasoning) != null ? _a : modelCapabilities.isReasoningModel;
     if ((openaiOptions == null ? void 0 : openaiOptions.conversation) && (openaiOptions == null ? void 0 : openaiOptions.previousResponseId)) {
       warnings.push({
         type: "unsupported",
@@ -3935,15 +4057,15 @@ var OpenAIResponsesLanguageModel = class {
     const { input, warnings: inputWarnings } = await convertToOpenAIResponsesInput({
       prompt,
       toolNameMapping,
-      systemMessageMode: modelCapabilities.systemMessageMode,
+      systemMessageMode: (_b = openaiOptions == null ? void 0 : openaiOptions.systemMessageMode) != null ? _b : isReasoningModel ? "developer" : modelCapabilities.systemMessageMode,
       fileIdPrefixes: this.config.fileIdPrefixes,
-      store: (_a = openaiOptions == null ? void 0 : openaiOptions.store) != null ? _a : true,
+      store: (_c = openaiOptions == null ? void 0 : openaiOptions.store) != null ? _c : true,
       hasLocalShellTool: hasOpenAITool("openai.local_shell"),
       hasShellTool: hasOpenAITool("openai.shell"),
       hasApplyPatchTool: hasOpenAITool("openai.apply_patch")
     });
     warnings.push(...inputWarnings);
-    const strictJsonSchema = (_b = openaiOptions == null ? void 0 : openaiOptions.strictJsonSchema) != null ? _b : true;
+    const strictJsonSchema = (_d = openaiOptions == null ? void 0 : openaiOptions.strictJsonSchema) != null ? _d : true;
     let include = openaiOptions == null ? void 0 : openaiOptions.include;
     function addInclude(key) {
       if (include == null) {
@@ -3959,9 +4081,9 @@ var OpenAIResponsesLanguageModel = class {
     if (topLogprobs) {
       addInclude("message.output_text.logprobs");
     }
-    const webSearchToolName = (_c = tools == null ? void 0 : tools.find(
+    const webSearchToolName = (_e = tools == null ? void 0 : tools.find(
       (tool) => tool.type === "provider" && (tool.id === "openai.web_search" || tool.id === "openai.web_search_preview")
-    )) == null ? void 0 : _c.name;
+    )) == null ? void 0 : _e.name;
     if (webSearchToolName) {
       addInclude("web_search_call.action.sources");
     }
@@ -3969,7 +4091,7 @@ var OpenAIResponsesLanguageModel = class {
       addInclude("code_interpreter_call.outputs");
     }
     const store = openaiOptions == null ? void 0 : openaiOptions.store;
-    if (store === false && modelCapabilities.isReasoningModel) {
+    if (store === false && isReasoningModel) {
       addInclude("reasoning.encrypted_content");
     }
     const baseArgs = {
@@ -3984,7 +4106,7 @@ var OpenAIResponsesLanguageModel = class {
             format: responseFormat.schema != null ? {
               type: "json_schema",
               strict: strictJsonSchema,
-              name: (_d = responseFormat.name) != null ? _d : "response",
+              name: (_f = responseFormat.name) != null ? _f : "response",
               description: responseFormat.description,
               schema: responseFormat.schema
             } : { type: "json_object" }
@@ -4011,7 +4133,7 @@ var OpenAIResponsesLanguageModel = class {
       top_logprobs: topLogprobs,
       truncation: openaiOptions == null ? void 0 : openaiOptions.truncation,
       // model-specific settings:
-      ...modelCapabilities.isReasoningModel && ((openaiOptions == null ? void 0 : openaiOptions.reasoningEffort) != null || (openaiOptions == null ? void 0 : openaiOptions.reasoningSummary) != null) && {
+      ...isReasoningModel && ((openaiOptions == null ? void 0 : openaiOptions.reasoningEffort) != null || (openaiOptions == null ? void 0 : openaiOptions.reasoningSummary) != null) && {
         reasoning: {
           ...(openaiOptions == null ? void 0 : openaiOptions.reasoningEffort) != null && {
             effort: openaiOptions.reasoningEffort
@@ -4022,7 +4144,7 @@ var OpenAIResponsesLanguageModel = class {
         }
       }
     };
-    if (modelCapabilities.isReasoningModel) {
+    if (isReasoningModel) {
       if (!((openaiOptions == null ? void 0 : openaiOptions.reasoningEffort) === "none" && modelCapabilities.supportsNonReasoningParameters)) {
         if (baseArgs.temperature != null) {
           baseArgs.temperature = void 0;
@@ -5330,11 +5452,11 @@ var OpenAISpeechModel = class {
 // src/transcription/openai-transcription-model.ts
 import {
   combineHeaders as combineHeaders7,
-  convertBase64ToUint8Array,
+  convertBase64ToUint8Array as convertBase64ToUint8Array2,
   createJsonResponseHandler as createJsonResponseHandler6,
   mediaTypeToExtension,
   parseProviderOptions as parseProviderOptions7,
-  postFormDataToApi
+  postFormDataToApi as postFormDataToApi2
 } from "@ai-sdk/provider-utils";
 // src/transcription/openai-transcription-api.ts
@@ -5484,7 +5606,7 @@ var OpenAITranscriptionModel = class {
       schema: openAITranscriptionProviderOptions
     });
     const formData = new FormData();
-    const blob = audio instanceof Uint8Array ? new Blob([audio]) : new Blob([convertBase64ToUint8Array(audio)]);
+    const blob = audio instanceof Uint8Array ? new Blob([audio]) : new Blob([convertBase64ToUint8Array2(audio)]);
     formData.append("model", this.modelId);
     const fileExtension = mediaTypeToExtension(mediaType);
     formData.append(
@@ -5531,7 +5653,7 @@ var OpenAITranscriptionModel = class {
       value: response,
       responseHeaders,
       rawValue: rawResponse
-    } = await postFormDataToApi({
+    } = await postFormDataToApi2({
       url: this.config.url({
         path: "/audio/transcriptions",
         modelId: this.modelId
@@ -5571,7 +5693,7 @@ var OpenAITranscriptionModel = class {
 };
 // src/version.ts
-var VERSION = true ? "3.0.0-beta.102" : "0.0.0-test";
+var VERSION = true ? "3.0.0-beta.105" : "0.0.0-test";
 // src/openai-provider.ts
 function createOpenAI(options = {}) {
@@ -5659,6 +5781,8 @@ function createOpenAI(options = {}) {
   provider.responses = createResponsesModel;
   provider.embedding = createEmbeddingModel;
   provider.embeddingModel = createEmbeddingModel;
+  provider.textEmbedding = createEmbeddingModel;
+  provider.textEmbeddingModel = createEmbeddingModel;
   provider.image = createImageModel;
   provider.imageModel = createImageModel;
   provider.transcription = createTranscriptionModel;