@ai-sdk/openai 2.0.0-canary.7 → 2.0.0-canary.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.mjs CHANGED
@@ -521,13 +521,13 @@ var OpenAIChatLanguageModel = class {
  }
  baseArgs.max_tokens = void 0;
  }
- } else if (this.modelId.startsWith("gpt-4o-search-preview")) {
+ } else if (this.modelId.startsWith("gpt-4o-search-preview") || this.modelId.startsWith("gpt-4o-mini-search-preview")) {
  if (baseArgs.temperature != null) {
  baseArgs.temperature = void 0;
  warnings.push({
  type: "unsupported-setting",
  setting: "temperature",
- details: "temperature is not supported for the gpt-4o-search-preview model and has been removed."
+ details: "temperature is not supported for the search preview models and has been removed."
  });
  }
  }
@@ -550,7 +550,7 @@ var OpenAIChatLanguageModel = class {
  };
  }
  async doGenerate(options) {
- var _a, _b, _c, _d, _e, _f, _g;
+ var _a, _b, _c, _d, _e, _f, _g, _h;
  const { args: body, warnings } = this.getArgs(options);
  const {
  responseHeaders,
@@ -570,10 +570,23 @@ var OpenAIChatLanguageModel = class {
  abortSignal: options.abortSignal,
  fetch: this.config.fetch
  });
- const { messages: rawPrompt, ...rawSettings } = body;
  const choice = response.choices[0];
- const completionTokenDetails = (_a = response.usage) == null ? void 0 : _a.completion_tokens_details;
- const promptTokenDetails = (_b = response.usage) == null ? void 0 : _b.prompt_tokens_details;
+ const content = [];
+ const text = choice.message.content;
+ if (text != null && text.length > 0) {
+ content.push({ type: "text", text });
+ }
+ for (const toolCall of (_a = choice.message.tool_calls) != null ? _a : []) {
+ content.push({
+ type: "tool-call",
+ toolCallType: "function",
+ toolCallId: (_b = toolCall.id) != null ? _b : generateId(),
+ toolName: toolCall.function.name,
+ args: toolCall.function.arguments
+ });
+ }
+ const completionTokenDetails = (_c = response.usage) == null ? void 0 : _c.completion_tokens_details;
+ const promptTokenDetails = (_d = response.usage) == null ? void 0 : _d.prompt_tokens_details;
  const providerMetadata = { openai: {} };
  if ((completionTokenDetails == null ? void 0 : completionTokenDetails.reasoning_tokens) != null) {
  providerMetadata.openai.reasoningTokens = completionTokenDetails == null ? void 0 : completionTokenDetails.reasoning_tokens;
@@ -588,21 +601,11 @@ var OpenAIChatLanguageModel = class {
  providerMetadata.openai.cachedPromptTokens = promptTokenDetails == null ? void 0 : promptTokenDetails.cached_tokens;
  }
  return {
- text: choice.message.content != null ? { type: "text", text: choice.message.content } : void 0,
- toolCalls: (_c = choice.message.tool_calls) == null ? void 0 : _c.map((toolCall) => {
- var _a2;
- return {
- type: "tool-call",
- toolCallType: "function",
- toolCallId: (_a2 = toolCall.id) != null ? _a2 : generateId(),
- toolName: toolCall.function.name,
- args: toolCall.function.arguments
- };
- }),
+ content,
  finishReason: mapOpenAIFinishReason(choice.finish_reason),
  usage: {
- inputTokens: (_e = (_d = response.usage) == null ? void 0 : _d.prompt_tokens) != null ? _e : void 0,
- outputTokens: (_g = (_f = response.usage) == null ? void 0 : _f.completion_tokens) != null ? _g : void 0
+ inputTokens: (_f = (_e = response.usage) == null ? void 0 : _e.prompt_tokens) != null ? _f : void 0,
+ outputTokens: (_h = (_g = response.usage) == null ? void 0 : _g.completion_tokens) != null ? _h : void 0
  },
  request: { body },
  response: {
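
Note: with canary.9, `doGenerate` returns the unified `content` array of the v2 language-model spec instead of separate `text` and `toolCalls` fields. A minimal consumer sketch, assuming `model` is an `OpenAIChatLanguageModel` instance and `options` a valid call-options object:

    // Sketch: reading the new unified `content` array.
    const result = await model.doGenerate(options);

    // Text parts replace the old `result.text` field.
    const text = result.content
      .filter((part) => part.type === "text")
      .map((part) => part.text)
      .join("");

    // Tool-call parts replace the old `result.toolCalls` array.
    const toolCalls = result.content.filter((part) => part.type === "tool-call");
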
@@ -650,6 +653,9 @@ var OpenAIChatLanguageModel = class {
  return {
  stream: response.pipeThrough(
  new TransformStream({
+ start(controller) {
+ controller.enqueue({ type: "stream-start", warnings });
+ },
  transform(chunk, controller) {
  var _a, _b, _c, _d, _e, _f, _g, _h, _i, _j, _k, _l;
  if (!chunk.success) {
@@ -807,8 +813,7 @@ var OpenAIChatLanguageModel = class {
  })
  ),
  request: { body },
- response: { headers: responseHeaders },
- warnings
+ response: { headers: responseHeaders }
  };
  }
  };
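
Note: `warnings` is no longer returned next to `stream` from `doStream`; it now arrives as the first stream chunk, enqueued by the `start` callback added above. A sketch of the corresponding consumer change:

    // Sketch: warnings are now the first chunk of the stream.
    const { stream } = await model.doStream(options);
    for await (const chunk of stream) {
      if (chunk.type === "stream-start") {
        console.log(chunk.warnings); // previously: the doStream result's `warnings`
      }
      // ...handle the remaining chunk types as before...
    }
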
@@ -909,7 +914,7 @@ var openaiChatChunkSchema = z3.union([
  openaiErrorDataSchema
  ]);
  function isReasoningModel(modelId) {
- return modelId === "o1" || modelId.startsWith("o1-") || modelId === "o3" || modelId.startsWith("o3-");
+ return modelId.startsWith("o");
  }
  function isAudioModel(modelId) {
  return modelId.startsWith("gpt-4o-audio-preview");
@@ -1140,7 +1145,7 @@ var OpenAICompletionLanguageModel = class {
  });
  const choice = response.choices[0];
  return {
- text: { type: "text", text: choice.text },
+ content: [{ type: "text", text: choice.text }],
  usage: {
  inputTokens: response.usage.prompt_tokens,
  outputTokens: response.usage.completion_tokens
@@ -1188,6 +1193,9 @@ var OpenAICompletionLanguageModel = class {
  return {
  stream: response.pipeThrough(
  new TransformStream({
+ start(controller) {
+ controller.enqueue({ type: "stream-start", warnings });
+ },
  transform(chunk, controller) {
  if (!chunk.success) {
  finishReason = "error";
@@ -1239,9 +1247,8 @@ var OpenAICompletionLanguageModel = class {
  }
  })
  ),
- response: { headers: responseHeaders },
- warnings,
- request: { body: JSON.stringify(body) }
+ request: { body },
+ response: { headers: responseHeaders }
  };
  }
  };
@@ -1874,6 +1881,7 @@ var OpenAIResponsesLanguageModel = class {
  constructor(modelId, config) {
  this.specificationVersion = "v2";
  this.defaultObjectGenerationMode = "json";
+ this.supportsStructuredOutputs = true;
  this.modelId = modelId;
  this.config = config;
  }
@@ -1999,7 +2007,7 @@ var OpenAIResponsesLanguageModel = class {
  };
  }
  async doGenerate(options) {
- var _a, _b, _c, _d, _e;
+ var _a, _b, _c, _d, _e, _f, _g, _h;
  const { args: body, warnings } = this.getArgs(options);
  const {
  responseHeaders,
@@ -2063,36 +2071,45 @@ var OpenAIResponsesLanguageModel = class {
  abortSignal: options.abortSignal,
  fetch: this.config.fetch
  });
- const outputTextElements = response.output.filter((output) => output.type === "message").flatMap((output) => output.content).filter((content) => content.type === "output_text");
- const toolCalls = response.output.filter((output) => output.type === "function_call").map((output) => ({
- type: "tool-call",
- toolCallType: "function",
- toolCallId: output.call_id,
- toolName: output.name,
- args: output.arguments
- }));
+ const content = [];
+ for (const part of response.output) {
+ switch (part.type) {
+ case "message": {
+ for (const contentPart of part.content) {
+ content.push({
+ type: "text",
+ text: contentPart.text
+ });
+ for (const annotation of contentPart.annotations) {
+ content.push({
+ type: "source",
+ sourceType: "url",
+ id: (_c = (_b = (_a = this.config).generateId) == null ? void 0 : _b.call(_a)) != null ? _c : generateId2(),
+ url: annotation.url,
+ title: annotation.title
+ });
+ }
+ }
+ break;
+ }
+ case "function_call": {
+ content.push({
+ type: "tool-call",
+ toolCallType: "function",
+ toolCallId: part.call_id,
+ toolName: part.name,
+ args: part.arguments
+ });
+ break;
+ }
+ }
+ }
  return {
- text: {
- type: "text",
- text: outputTextElements.map((content) => content.text).join("\n")
- },
- sources: outputTextElements.flatMap(
- (content) => content.annotations.map((annotation) => {
- var _a2, _b2, _c2;
- return {
- type: "source",
- sourceType: "url",
- id: (_c2 = (_b2 = (_a2 = this.config).generateId) == null ? void 0 : _b2.call(_a2)) != null ? _c2 : generateId2(),
- url: annotation.url,
- title: annotation.title
- };
- })
- ),
+ content,
  finishReason: mapOpenAIResponseFinishReason({
- finishReason: (_a = response.incomplete_details) == null ? void 0 : _a.reason,
- hasToolCalls: toolCalls.length > 0
+ finishReason: (_d = response.incomplete_details) == null ? void 0 : _d.reason,
+ hasToolCalls: content.some((part) => part.type === "tool-call")
  }),
- toolCalls: toolCalls.length > 0 ? toolCalls : void 0,
  usage: {
  inputTokens: response.usage.input_tokens,
  outputTokens: response.usage.output_tokens
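
Note: the Responses model likewise returns one ordered `content` array; URL annotations are now emitted as `source` parts directly after the text part they annotate, replacing the old top-level `sources` field. A sketch of extracting citations under the new shape:

    // Sketch: url citations are now `source` parts inside `content`.
    const result = await model.doGenerate(options);
    for (const part of result.content) {
      if (part.type === "source") {
        console.log(part.url, part.title); // previously: result.sources
      }
    }
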
@@ -2108,8 +2125,8 @@ var OpenAIResponsesLanguageModel = class {
  providerMetadata: {
  openai: {
  responseId: response.id,
- cachedPromptTokens: (_c = (_b = response.usage.input_tokens_details) == null ? void 0 : _b.cached_tokens) != null ? _c : null,
- reasoningTokens: (_e = (_d = response.usage.output_tokens_details) == null ? void 0 : _d.reasoning_tokens) != null ? _e : null
+ cachedPromptTokens: (_f = (_e = response.usage.input_tokens_details) == null ? void 0 : _e.cached_tokens) != null ? _f : null,
+ reasoningTokens: (_h = (_g = response.usage.output_tokens_details) == null ? void 0 : _g.reasoning_tokens) != null ? _h : null
  }
  },
  warnings
@@ -2148,6 +2165,9 @@ var OpenAIResponsesLanguageModel = class {
  return {
  stream: response.pipeThrough(
  new TransformStream({
+ start(controller) {
+ controller.enqueue({ type: "stream-start", warnings });
+ },
  transform(chunk, controller) {
  var _a, _b, _c, _d, _e, _f, _g, _h;
  if (!chunk.success) {
@@ -2242,8 +2262,7 @@ var OpenAIResponsesLanguageModel = class {
  })
  ),
  request: { body },
- response: { headers: responseHeaders },
- warnings
+ response: { headers: responseHeaders }
  };
  }
  };
@@ -2383,6 +2402,110 @@ var openaiResponsesProviderOptionsSchema = z9.object({
  instructions: z9.string().nullish()
  });
 
+ // src/openai-speech-model.ts
+ import {
+ combineHeaders as combineHeaders7,
+ createBinaryResponseHandler,
+ parseProviderOptions as parseProviderOptions4,
+ postJsonToApi as postJsonToApi6
+ } from "@ai-sdk/provider-utils";
+ import { z as z10 } from "zod";
+ var OpenAIProviderOptionsSchema = z10.object({
+ instructions: z10.string().nullish(),
+ speed: z10.number().min(0.25).max(4).default(1).nullish()
+ });
+ var OpenAISpeechModel = class {
+ constructor(modelId, config) {
+ this.modelId = modelId;
+ this.config = config;
+ this.specificationVersion = "v1";
+ }
+ get provider() {
+ return this.config.provider;
+ }
+ getArgs({
+ text,
+ voice = "alloy",
+ outputFormat = "mp3",
+ speed,
+ instructions,
+ providerOptions
+ }) {
+ const warnings = [];
+ const openAIOptions = parseProviderOptions4({
+ provider: "openai",
+ providerOptions,
+ schema: OpenAIProviderOptionsSchema
+ });
+ const requestBody = {
+ model: this.modelId,
+ input: text,
+ voice,
+ response_format: "mp3",
+ speed,
+ instructions
+ };
+ if (outputFormat) {
+ if (["mp3", "opus", "aac", "flac", "wav", "pcm"].includes(outputFormat)) {
+ requestBody.response_format = outputFormat;
+ } else {
+ warnings.push({
+ type: "unsupported-setting",
+ setting: "outputFormat",
+ details: `Unsupported output format: ${outputFormat}. Using mp3 instead.`
+ });
+ }
+ }
+ if (openAIOptions) {
+ const speechModelOptions = {};
+ for (const key in speechModelOptions) {
+ const value = speechModelOptions[key];
+ if (value !== void 0) {
+ requestBody[key] = value;
+ }
+ }
+ }
+ return {
+ requestBody,
+ warnings
+ };
+ }
+ async doGenerate(options) {
+ var _a, _b, _c;
+ const currentDate = (_c = (_b = (_a = this.config._internal) == null ? void 0 : _a.currentDate) == null ? void 0 : _b.call(_a)) != null ? _c : /* @__PURE__ */ new Date();
+ const { requestBody, warnings } = this.getArgs(options);
+ const {
+ value: audio,
+ responseHeaders,
+ rawValue: rawResponse
+ } = await postJsonToApi6({
+ url: this.config.url({
+ path: "/audio/speech",
+ modelId: this.modelId
+ }),
+ headers: combineHeaders7(this.config.headers(), options.headers),
+ body: requestBody,
+ failedResponseHandler: openaiFailedResponseHandler,
+ successfulResponseHandler: createBinaryResponseHandler(),
+ abortSignal: options.abortSignal,
+ fetch: this.config.fetch
+ });
+ return {
+ audio,
+ warnings,
+ request: {
+ body: JSON.stringify(requestBody)
+ },
+ response: {
+ timestamp: currentDate,
+ modelId: this.modelId,
+ headers: responseHeaders,
+ body: rawResponse
+ }
+ };
+ }
+ };
+
  // src/openai-provider.ts
  function createOpenAI(options = {}) {
  var _a, _b, _c;
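
Note: the new `OpenAISpeechModel` posts to `/audio/speech` and returns the binary audio plus request/response metadata. A sketch of calling it through the v1 speech-model interface defined above (the model ID is illustrative; `openai.speech` is registered on the provider further down in this diff):

    // Sketch: exercising the speech model's doGenerate directly.
    const speechModel = openai.speech("tts-1");
    const { audio, warnings } = await speechModel.doGenerate({
      text: "Hello, world!",
      voice: "nova",       // defaults to "alloy" when omitted
      outputFormat: "wav", // in the supported list; unknown values fall back to mp3 with a warning
    });
    // `audio` is the binary body returned by /audio/speech.
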
@@ -2431,6 +2554,12 @@ function createOpenAI(options = {}) {
  headers: getHeaders,
  fetch: options.fetch
  });
+ const createSpeechModel = (modelId) => new OpenAISpeechModel(modelId, {
+ provider: `${providerName}.speech`,
+ url: ({ path }) => `${baseURL}${path}`,
+ headers: getHeaders,
+ fetch: options.fetch
+ });
  const createLanguageModel = (modelId, settings) => {
  if (new.target) {
  throw new Error(
@@ -2467,6 +2596,8 @@ function createOpenAI(options = {}) {
  provider.imageModel = createImageModel;
  provider.transcription = createTranscriptionModel;
  provider.transcriptionModel = createTranscriptionModel;
+ provider.speech = createSpeechModel;
+ provider.speechModel = createSpeechModel;
  provider.tools = openaiTools;
  return provider;
 }
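
With `provider.speech` and `provider.speechModel` registered, the new model plugs into the AI SDK helper layer. A sketch, assuming a matching `ai` canary that exports the `experimental_generateSpeech` helper (model ID illustrative):

    import { openai } from "@ai-sdk/openai";
    import { experimental_generateSpeech as generateSpeech } from "ai";

    // Sketch: end-to-end usage of the newly registered speech model.
    const { audio } = await generateSpeech({
      model: openai.speech("tts-1"),
      text: "Hello from 2.0.0-canary.9!",
    });
    // `audio` wraps the returned bytes; mp3 is the default response_format.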