npm - @ai-sdk/openai - Versions diffs - 1.3.8 → 1.3.10 - Mend

@ai-sdk/openai 1.3.8 → 1.3.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14)

package/CHANGELOG.md +17 -0
package/dist/index.d.mts +1 -1
package/dist/index.d.ts +1 -1
package/dist/index.js +37 -38
package/dist/index.js.map +1 -1
package/dist/index.mjs +37 -38
package/dist/index.mjs.map +1 -1
package/internal/dist/index.d.mts +16 -16
package/internal/dist/index.d.ts +16 -16
package/internal/dist/index.js +37 -38
package/internal/dist/index.js.map +1 -1
package/internal/dist/index.mjs +37 -38
package/internal/dist/index.mjs.map +1 -1
package/package.json +3 -3

package/internal/dist/index.mjs CHANGED

@@ -520,6 +520,15 @@ var OpenAIChatLanguageModel = class {
         }
         baseArgs.max_tokens = void 0;
       }
+    } else if (this.modelId.startsWith("gpt-4o-search-preview")) {
+      if (baseArgs.temperature != null) {
+        baseArgs.temperature = void 0;
+        warnings.push({
+          type: "unsupported-setting",
+          setting: "temperature",
+          details: "temperature is not supported for the gpt-4o-search-preview model and has been removed."
+        });
+      }
     }
     switch (type) {
       case "regular": {
@@ -1615,17 +1624,11 @@ import {
 } from "@ai-sdk/provider-utils";
 import { z as z6 } from "zod";
 var OpenAIProviderOptionsSchema = z6.object({
-  include: z6.array(z6.string()).optional().describe(
-    "Additional information to include in the transcription response."
-  ),
-  language: z6.string().optional().describe("The language of the input audio in ISO-639-1 format."),
-  prompt: z6.string().optional().describe(
-    "An optional text to guide the model's style or continue a previous audio segment."
-  ),
-  temperature: z6.number().min(0).max(1).optional().default(0).describe("The sampling temperature, between 0 and 1."),
-  timestampGranularities: z6.array(z6.enum(["word", "segment"])).optional().default(["segment"]).describe(
-    "The timestamp granularities to populate for this transcription."
-  )
+  include: z6.array(z6.string()).nullish(),
+  language: z6.string().nullish(),
+  prompt: z6.string().nullish(),
+  temperature: z6.number().min(0).max(1).nullish().default(0),
+  timestampGranularities: z6.array(z6.enum(["word", "segment"])).nullish().default(["segment"])
 });
 var languageMap = {
   afrikaans: "af",
@@ -1697,9 +1700,10 @@ var OpenAITranscriptionModel = class {
   }
   getArgs({
     audio,
-    mimeType,
+    mediaType,
     providerOptions
   }) {
+    var _a, _b, _c, _d, _e;
     const warnings = [];
     const openAIOptions = parseProviderOptions({
       provider: "openai",
@@ -1709,19 +1713,19 @@ var OpenAITranscriptionModel = class {
     const formData = new FormData();
     const blob = audio instanceof Uint8Array ? new Blob([audio]) : new Blob([convertBase64ToUint8Array(audio)]);
     formData.append("model", this.modelId);
-    formData.append("file", new File([blob], "audio", { type: mimeType }));
+    formData.append("file", new File([blob], "audio", { type: mediaType }));
     if (openAIOptions) {
       const transcriptionModelOptions = {
-        include: openAIOptions.include,
-        language: openAIOptions.language,
-        prompt: openAIOptions.prompt,
-        temperature: openAIOptions.temperature,
-        timestamp_granularities: openAIOptions.timestampGranularities
+        include: (_a = openAIOptions.include) != null ? _a : void 0,
+        language: (_b = openAIOptions.language) != null ? _b : void 0,
+        prompt: (_c = openAIOptions.prompt) != null ? _c : void 0,
+        temperature: (_d = openAIOptions.temperature) != null ? _d : void 0,
+        timestamp_granularities: (_e = openAIOptions.timestampGranularities) != null ? _e : void 0
       };
       for (const key in transcriptionModelOptions) {
         const value = transcriptionModelOptions[key];
         if (value !== void 0) {
-          formData.append(key, value);
+          formData.append(key, String(value));
         }
       }
     }
@@ -1731,10 +1735,14 @@ var OpenAITranscriptionModel = class {
     };
   }
   async doGenerate(options) {
-    var _a, _b, _c;
+    var _a, _b, _c, _d, _e, _f;
     const currentDate = (_c = (_b = (_a = this.config._internal) == null ? void 0 : _a.currentDate) == null ? void 0 : _b.call(_a)) != null ? _c : /* @__PURE__ */ new Date();
     const { formData, warnings } = this.getArgs(options);
-    const { value: response, responseHeaders } = await postFormDataToApi({
+    const {
+      value: response,
+      responseHeaders,
+      rawValue: rawResponse
+    } = await postFormDataToApi({
       url: this.config.url({
         path: "/audio/transcriptions",
         modelId: this.modelId
@@ -1748,46 +1756,37 @@ var OpenAITranscriptionModel = class {
       abortSignal: options.abortSignal,
       fetch: this.config.fetch
     });
-    let language;
-    if (response.language && response.language in languageMap) {
-      language = languageMap[response.language];
-    }
+    const language = response.language != null && response.language in languageMap ? languageMap[response.language] : void 0;
     return {
       text: response.text,
-      segments: response.words.map((word) => ({
+      segments: (_e = (_d = response.words) == null ? void 0 : _d.map((word) => ({
         text: word.word,
         startSecond: word.start,
         endSecond: word.end
-      })),
+      }))) != null ? _e : [],
       language,
-      durationInSeconds: response.duration,
+      durationInSeconds: (_f = response.duration) != null ? _f : void 0,
       warnings,
       response: {
         timestamp: currentDate,
         modelId: this.modelId,
         headers: responseHeaders,
-        body: response
-      },
-      // When using format `verbose_json` on `whisper-1`, OpenAI includes the things like `task` and enhanced `segments` information.
-      providerMetadata: {
-        openai: {
-          transcript: response
-        }
+        body: rawResponse
       }
     };
   }
 };
 var openaiTranscriptionResponseSchema = z6.object({
   text: z6.string(),
-  language: z6.string().optional(),
-  duration: z6.number().optional(),
+  language: z6.string().nullish(),
+  duration: z6.number().nullish(),
   words: z6.array(
     z6.object({
       word: z6.string(),
       start: z6.number(),
       end: z6.number()
     })
-  )
+  ).nullish()
 });
 // src/responses/openai-responses-language-model.ts