npm - @aigne/openai - Versions diffs - 0.16.4-beta.4 → 0.16.4-beta.6 - Mend

@aigne/openai 0.16.4-beta.4 → 0.16.4-beta.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/CHANGELOG.md +32 -0
package/lib/cjs/openai-chat-model.d.ts +3 -2
package/lib/cjs/openai-chat-model.js +42 -19
package/lib/cjs/openai-video-model.d.ts +24 -4
package/lib/cjs/openai-video-model.js +8 -5
package/lib/dts/openai-chat-model.d.ts +3 -2
package/lib/dts/openai-video-model.d.ts +24 -4
package/lib/esm/openai-chat-model.d.ts +3 -2
package/lib/esm/openai-chat-model.js +42 -19
package/lib/esm/openai-video-model.d.ts +24 -4
package/lib/esm/openai-video-model.js +8 -5
package/package.json +4 -4

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,37 @@
 # Changelog
+## [0.16.4-beta.6](https://github.com/AIGNE-io/aigne-framework/compare/openai-v0.16.4-beta.5...openai-v0.16.4-beta.6) (2025-10-31)
+### Bug Fixes
+* **models:** add image parameters support for video generation ([#684](https://github.com/AIGNE-io/aigne-framework/issues/684)) ([b048b7f](https://github.com/AIGNE-io/aigne-framework/commit/b048b7f92bd7a532dbdbeb6fb5fa5499bae6b953))
+### Dependencies
+* The following workspace dependencies were updated
+  * dependencies
+    * @aigne/core bumped to 1.65.0-beta.5
+  * devDependencies
+    * @aigne/test-utils bumped to 0.5.57-beta.6
+## [0.16.4-beta.5](https://github.com/AIGNE-io/aigne-framework/compare/openai-v0.16.4-beta.4...openai-v0.16.4-beta.5) (2025-10-29)
+### Features
+* add reasoningEffort option for chat model ([#680](https://github.com/AIGNE-io/aigne-framework/issues/680)) ([f69d232](https://github.com/AIGNE-io/aigne-framework/commit/f69d232d714d4a3e4946bdc8c6598747c9bcbd57))
+### Dependencies
+* The following workspace dependencies were updated
+  * dependencies
+    * @aigne/core bumped to 1.65.0-beta.4
+  * devDependencies
+    * @aigne/test-utils bumped to 0.5.57-beta.5
 ## [0.16.4-beta.4](https://github.com/AIGNE-io/aigne-framework/compare/openai-v0.16.4-beta.3...openai-v0.16.4-beta.4) (2025-10-28)

package/lib/cjs/openai-chat-model.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { type AgentInvokeOptions, type AgentProcessResult, ChatModel, type ChatModelInput, type ChatModelInputMessage, type ChatModelInputTool, type ChatModelOptions, type ChatModelOutput } from "@aigne/core";
+import { type AgentInvokeOptions, type AgentProcessResult, ChatModel, type ChatModelInput, type ChatModelInputMessage, type ChatModelInputOptions, type ChatModelInputTool, type ChatModelOptions, type ChatModelOutput } from "@aigne/core";
 import { type PromiseOrValue } from "@aigne/core/utils/type-utils.js";
 import type { ClientOptions, OpenAI } from "openai";
 import type { ChatCompletionMessageParam, ChatCompletionTool } from "openai/resources";
@@ -127,13 +127,14 @@ export declare class OpenAIChatModel extends ChatModel {
         apiKey: string | undefined;
         model: string;
     };
-    get modelOptions(): Omit<import("@aigne/core").ChatModelInputOptions, "model"> | undefined;
+    get modelOptions(): Omit<ChatModelInputOptions, "model"> | undefined;
     /**
      * Process the input and generate a response
      * @param input The input to process
      * @returns The generated response
      */
     process(input: ChatModelInput, _options: AgentInvokeOptions): PromiseOrValue<AgentProcessResult<ChatModelOutput>>;
+    private getReasoningEffort;
     private _process;
     private getParallelToolCalls;
     protected getRunMessages(input: ChatModelInput): Promise<ChatCompletionMessageParam[]>;

package/lib/cjs/openai-chat-model.js CHANGED Viewed

@@ -105,6 +105,20 @@ class OpenAIChatModel extends core_1.ChatModel {
     process(input, _options) {
         return this._process(input);
     }
+    getReasoningEffort(effort) {
+        if (typeof effort === "number") {
+            if (effort > 5000)
+                return "high";
+            if (effort > 1000)
+                return "medium";
+            if (effort > 500)
+                return "low";
+            if (effort > 0)
+                return "minimal";
+            return undefined;
+        }
+        return effort;
+    }
     async _process(input) {
         const messages = await this.getRunMessages(input);
         const model = input.modelOptions?.model || this.credential.model;
@@ -121,6 +135,7 @@ class OpenAIChatModel extends core_1.ChatModel {
                 include_usage: true,
             },
             stream: true,
+            reasoning_effort: this.getReasoningEffort(input.modelOptions?.reasoningEffort ?? this.modelOptions?.reasoningEffort),
         };
         // For models that do not support tools use with JSON schema in same request,
         // so we need to handle the case where tools are not used and responseFormat is json
@@ -138,9 +153,9 @@ class OpenAIChatModel extends core_1.ChatModel {
             response_format: responseFormat,
         }));
         if (input.responseFormat?.type !== "json_schema") {
-            return await this.extractResultFromStream(stream, false, true);
+            return await this.extractResultFromStream(body, stream, false, true);
         }
-        const result = await this.extractResultFromStream(stream, jsonMode);
+        const result = await this.extractResultFromStream(body, stream, jsonMode);
         // Just return the result if it has tool calls
         if (result.toolCalls?.length || result.json)
             return result;
@@ -214,18 +229,28 @@ class OpenAIChatModel extends core_1.ChatModel {
             ...body,
             response_format: resolvedResponseFormat,
         }));
-        return this.extractResultFromStream(res, jsonMode);
+        return this.extractResultFromStream(body, res, jsonMode);
     }
-    async extractResultFromStream(stream, jsonMode, streaming) {
+    async extractResultFromStream(body, stream, jsonMode, streaming) {
         const result = new ReadableStream({
             start: async (controller) => {
                 try {
+                    controller.enqueue({
+                        delta: {
+                            json: {
+                                modelOptions: {
+                                    reasoningEffort: body.reasoning_effort,
+                                },
+                            },
+                        },
+                    });
                     let text = "";
                     let refusal = "";
                     const toolCalls = [];
                     let model;
                     for await (const chunk of stream) {
                         const choice = chunk.choices?.[0];
+                        const delta = choice?.delta;
                         if (!model) {
                             model = chunk.model;
                             controller.enqueue({
@@ -236,8 +261,8 @@ class OpenAIChatModel extends core_1.ChatModel {
                                 },
                             });
                         }
-                        if (choice?.delta.tool_calls?.length) {
-                            for (const call of choice.delta.tool_calls) {
+                        if (delta?.tool_calls?.length) {
+                            for (const call of delta.tool_calls) {
                                 if (this.supportsToolStreaming && call.index !== undefined) {
                                     handleToolCallDelta(toolCalls, call);
                                 }
@@ -246,27 +271,23 @@ class OpenAIChatModel extends core_1.ChatModel {
                                 }
                             }
                         }
-                        if (choice?.delta.content) {
-                            text += choice.delta.content;
+                        if (delta && "reasoning" in delta && typeof delta.reasoning === "string") {
+                            controller.enqueue({ delta: { text: { thoughts: delta.reasoning } } });
+                        }
+                        if (delta?.content) {
+                            text += delta.content;
                             if (!jsonMode) {
                                 controller.enqueue({
                                     delta: {
                                         text: {
-                                            text: choice.delta.content,
+                                            text: delta.content,
                                         },
                                     },
                                 });
                             }
                         }
-                        if (choice?.delta.refusal) {
-                            refusal += choice.delta.refusal;
-                            if (!jsonMode) {
-                                controller.enqueue({
-                                    delta: {
-                                        text: { text: choice.delta.refusal },
-                                    },
-                                });
-                            }
+                        if (delta?.refusal) {
+                            refusal += delta.refusal;
                         }
                         if (chunk.usage) {
                             controller.enqueue({
@@ -281,7 +302,6 @@ class OpenAIChatModel extends core_1.ChatModel {
                             });
                         }
                     }
-                    text = text || refusal;
                     if (jsonMode && text) {
                         controller.enqueue({
                             delta: {
@@ -303,6 +323,9 @@ class OpenAIChatModel extends core_1.ChatModel {
                             },
                         });
                     }
+                    if (refusal) {
+                        controller.error(new Error(`Got refusal from LLM: ${refusal}`));
+                    }
                     controller.close();
                 }
                 catch (error) {

package/lib/cjs/openai-video-model.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { VideoModel, type VideoModelInput, type VideoModelOptions, type VideoModelOutput } from "@aigne/core";
+import { type AgentInvokeOptions, VideoModel, type VideoModelInput, type VideoModelOptions, type VideoModelOutput } from "@aigne/core";
 import type OpenAI from "openai";
 import type { ClientOptions } from "openai";
 /**
@@ -6,9 +6,29 @@ import type { ClientOptions } from "openai";
  */
 export interface OpenAIVideoModelInput extends VideoModelInput {
     /**
-     * Optional image reference that guides generation (file path or URL)
+     * Sora model to use for video generation
+     *
+     * - `sora-2`: Standard version, lower cost
+     * - `sora-2-pro`: Pro version, higher quality
+     *
+     * @default "sora-2"
+     */
+    model?: "sora-2" | "sora-2-pro";
+    /**
+     * Video resolution (width x height)
+     *
+     * - `720x1280`: Vertical video (9:16)
+     * - `1280x720`: Horizontal video (16:9)
+     * - `1024x1792`: Vertical video (9:16, higher resolution)
+     * - `1792x1024`: Horizontal video (16:9, higher resolution)
+     */
+    size?: "720x1280" | "1280x720" | "1024x1792" | "1792x1024";
+    /**
+     * Video duration in seconds
+     *
+     * @default "4"
      */
-    inputReference?: string;
+    seconds?: "4" | "8" | "12";
 }
 /**
  * Output from OpenAI Video Model
@@ -68,5 +88,5 @@ export declare class OpenAIVideoModel extends VideoModel<OpenAIVideoModelInput,
     };
     get modelOptions(): Omit<Partial<OpenAIVideoModelInput>, "model"> | undefined;
     downloadToFile(videoId: string): Promise<string>;
-    process(input: OpenAIVideoModelInput): Promise<OpenAIVideoModelOutput>;
+    process(input: OpenAIVideoModelInput, options: AgentInvokeOptions): Promise<OpenAIVideoModelOutput>;
 }

package/lib/cjs/openai-video-model.js CHANGED Viewed

@@ -9,7 +9,9 @@ const openai_js_1 = require("./openai.js");
 const DEFAULT_MODEL = "sora-2";
 const DEFAULT_SECONDS = 4;
 const openAIVideoModelInputSchema = core_1.videoModelInputSchema.extend({
-    inputReference: zod_1.z.string().optional(),
+    model: zod_1.z.enum(["sora-2", "sora-2-pro"]).optional(),
+    seconds: zod_1.z.enum(["4", "8", "12"]).optional(),
+    size: zod_1.z.enum(["720x1280", "1280x720", "1024x1792", "1792x1024"]).optional(),
 });
 const openAIVideoModelOptionsSchema = zod_1.z.object({
     apiKey: zod_1.z.string().optional(),
@@ -64,7 +66,7 @@ class OpenAIVideoModel extends core_1.VideoModel {
         const buffer = Buffer.from(arrayBuffer);
         return buffer.toString("base64");
     }
-    async process(input) {
+    async process(input, options) {
         const model = input.model ?? input.modelOptions?.model ?? this.credential.model;
         const createParams = {
             model: model,
@@ -74,9 +76,10 @@ class OpenAIVideoModel extends core_1.VideoModel {
             createParams.seconds = input.seconds;
         if (input.size)
             createParams.size = input.size;
-        if (input.inputReference) {
-            createParams.input_reference =
-                input.inputReference;
+        if (input.image) {
+            createParams.input_reference = await this.transformFileType("file", input.image, options).then((file) => new File([Buffer.from(file.data, "base64")], file.filename || "image.png", {
+                type: file.mimeType,
+            }));
         }
         let video = await this.client.videos.create(createParams);
         logger_js_1.logger.debug(`Video generation started: ${video.id}`);

package/lib/dts/openai-chat-model.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { type AgentInvokeOptions, type AgentProcessResult, ChatModel, type ChatModelInput, type ChatModelInputMessage, type ChatModelInputTool, type ChatModelOptions, type ChatModelOutput } from "@aigne/core";
+import { type AgentInvokeOptions, type AgentProcessResult, ChatModel, type ChatModelInput, type ChatModelInputMessage, type ChatModelInputOptions, type ChatModelInputTool, type ChatModelOptions, type ChatModelOutput } from "@aigne/core";
 import { type PromiseOrValue } from "@aigne/core/utils/type-utils.js";
 import type { ClientOptions, OpenAI } from "openai";
 import type { ChatCompletionMessageParam, ChatCompletionTool } from "openai/resources";
@@ -127,13 +127,14 @@ export declare class OpenAIChatModel extends ChatModel {
         apiKey: string | undefined;
         model: string;
     };
-    get modelOptions(): Omit<import("@aigne/core").ChatModelInputOptions, "model"> | undefined;
+    get modelOptions(): Omit<ChatModelInputOptions, "model"> | undefined;
     /**
      * Process the input and generate a response
      * @param input The input to process
      * @returns The generated response
      */
     process(input: ChatModelInput, _options: AgentInvokeOptions): PromiseOrValue<AgentProcessResult<ChatModelOutput>>;
+    private getReasoningEffort;
     private _process;
     private getParallelToolCalls;
     protected getRunMessages(input: ChatModelInput): Promise<ChatCompletionMessageParam[]>;

package/lib/dts/openai-video-model.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { VideoModel, type VideoModelInput, type VideoModelOptions, type VideoModelOutput } from "@aigne/core";
+import { type AgentInvokeOptions, VideoModel, type VideoModelInput, type VideoModelOptions, type VideoModelOutput } from "@aigne/core";
 import type OpenAI from "openai";
 import type { ClientOptions } from "openai";
 /**
@@ -6,9 +6,29 @@ import type { ClientOptions } from "openai";
  */
 export interface OpenAIVideoModelInput extends VideoModelInput {
     /**
-     * Optional image reference that guides generation (file path or URL)
+     * Sora model to use for video generation
+     *
+     * - `sora-2`: Standard version, lower cost
+     * - `sora-2-pro`: Pro version, higher quality
+     *
+     * @default "sora-2"
+     */
+    model?: "sora-2" | "sora-2-pro";
+    /**
+     * Video resolution (width x height)
+     *
+     * - `720x1280`: Vertical video (9:16)
+     * - `1280x720`: Horizontal video (16:9)
+     * - `1024x1792`: Vertical video (9:16, higher resolution)
+     * - `1792x1024`: Horizontal video (16:9, higher resolution)
+     */
+    size?: "720x1280" | "1280x720" | "1024x1792" | "1792x1024";
+    /**
+     * Video duration in seconds
+     *
+     * @default "4"
      */
-    inputReference?: string;
+    seconds?: "4" | "8" | "12";
 }
 /**
  * Output from OpenAI Video Model
@@ -68,5 +88,5 @@ export declare class OpenAIVideoModel extends VideoModel<OpenAIVideoModelInput,
     };
     get modelOptions(): Omit<Partial<OpenAIVideoModelInput>, "model"> | undefined;
     downloadToFile(videoId: string): Promise<string>;
-    process(input: OpenAIVideoModelInput): Promise<OpenAIVideoModelOutput>;
+    process(input: OpenAIVideoModelInput, options: AgentInvokeOptions): Promise<OpenAIVideoModelOutput>;
 }

package/lib/esm/openai-chat-model.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { type AgentInvokeOptions, type AgentProcessResult, ChatModel, type ChatModelInput, type ChatModelInputMessage, type ChatModelInputTool, type ChatModelOptions, type ChatModelOutput } from "@aigne/core";
+import { type AgentInvokeOptions, type AgentProcessResult, ChatModel, type ChatModelInput, type ChatModelInputMessage, type ChatModelInputOptions, type ChatModelInputTool, type ChatModelOptions, type ChatModelOutput } from "@aigne/core";
 import { type PromiseOrValue } from "@aigne/core/utils/type-utils.js";
 import type { ClientOptions, OpenAI } from "openai";
 import type { ChatCompletionMessageParam, ChatCompletionTool } from "openai/resources";
@@ -127,13 +127,14 @@ export declare class OpenAIChatModel extends ChatModel {
         apiKey: string | undefined;
         model: string;
     };
-    get modelOptions(): Omit<import("@aigne/core").ChatModelInputOptions, "model"> | undefined;
+    get modelOptions(): Omit<ChatModelInputOptions, "model"> | undefined;
     /**
      * Process the input and generate a response
      * @param input The input to process
      * @returns The generated response
      */
     process(input: ChatModelInput, _options: AgentInvokeOptions): PromiseOrValue<AgentProcessResult<ChatModelOutput>>;
+    private getReasoningEffort;
     private _process;
     private getParallelToolCalls;
     protected getRunMessages(input: ChatModelInput): Promise<ChatCompletionMessageParam[]>;

package/lib/esm/openai-chat-model.js CHANGED Viewed

@@ -100,6 +100,20 @@ export class OpenAIChatModel extends ChatModel {
     process(input, _options) {
         return this._process(input);
     }
+    getReasoningEffort(effort) {
+        if (typeof effort === "number") {
+            if (effort > 5000)
+                return "high";
+            if (effort > 1000)
+                return "medium";
+            if (effort > 500)
+                return "low";
+            if (effort > 0)
+                return "minimal";
+            return undefined;
+        }
+        return effort;
+    }
     async _process(input) {
         const messages = await this.getRunMessages(input);
         const model = input.modelOptions?.model || this.credential.model;
@@ -116,6 +130,7 @@ export class OpenAIChatModel extends ChatModel {
                 include_usage: true,
             },
             stream: true,
+            reasoning_effort: this.getReasoningEffort(input.modelOptions?.reasoningEffort ?? this.modelOptions?.reasoningEffort),
         };
         // For models that do not support tools use with JSON schema in same request,
         // so we need to handle the case where tools are not used and responseFormat is json
@@ -133,9 +148,9 @@ export class OpenAIChatModel extends ChatModel {
             response_format: responseFormat,
         }));
         if (input.responseFormat?.type !== "json_schema") {
-            return await this.extractResultFromStream(stream, false, true);
+            return await this.extractResultFromStream(body, stream, false, true);
         }
-        const result = await this.extractResultFromStream(stream, jsonMode);
+        const result = await this.extractResultFromStream(body, stream, jsonMode);
         // Just return the result if it has tool calls
         if (result.toolCalls?.length || result.json)
             return result;
@@ -209,18 +224,28 @@ export class OpenAIChatModel extends ChatModel {
             ...body,
             response_format: resolvedResponseFormat,
         }));
-        return this.extractResultFromStream(res, jsonMode);
+        return this.extractResultFromStream(body, res, jsonMode);
     }
-    async extractResultFromStream(stream, jsonMode, streaming) {
+    async extractResultFromStream(body, stream, jsonMode, streaming) {
         const result = new ReadableStream({
             start: async (controller) => {
                 try {
+                    controller.enqueue({
+                        delta: {
+                            json: {
+                                modelOptions: {
+                                    reasoningEffort: body.reasoning_effort,
+                                },
+                            },
+                        },
+                    });
                     let text = "";
                     let refusal = "";
                     const toolCalls = [];
                     let model;
                     for await (const chunk of stream) {
                         const choice = chunk.choices?.[0];
+                        const delta = choice?.delta;
                         if (!model) {
                             model = chunk.model;
                             controller.enqueue({
@@ -231,8 +256,8 @@ export class OpenAIChatModel extends ChatModel {
                                 },
                             });
                         }
-                        if (choice?.delta.tool_calls?.length) {
-                            for (const call of choice.delta.tool_calls) {
+                        if (delta?.tool_calls?.length) {
+                            for (const call of delta.tool_calls) {
                                 if (this.supportsToolStreaming && call.index !== undefined) {
                                     handleToolCallDelta(toolCalls, call);
                                 }
@@ -241,27 +266,23 @@ export class OpenAIChatModel extends ChatModel {
                                 }
                             }
                         }
-                        if (choice?.delta.content) {
-                            text += choice.delta.content;
+                        if (delta && "reasoning" in delta && typeof delta.reasoning === "string") {
+                            controller.enqueue({ delta: { text: { thoughts: delta.reasoning } } });
+                        }
+                        if (delta?.content) {
+                            text += delta.content;
                             if (!jsonMode) {
                                 controller.enqueue({
                                     delta: {
                                         text: {
-                                            text: choice.delta.content,
+                                            text: delta.content,
                                         },
                                     },
                                 });
                             }
                         }
-                        if (choice?.delta.refusal) {
-                            refusal += choice.delta.refusal;
-                            if (!jsonMode) {
-                                controller.enqueue({
-                                    delta: {
-                                        text: { text: choice.delta.refusal },
-                                    },
-                                });
-                            }
+                        if (delta?.refusal) {
+                            refusal += delta.refusal;
                         }
                         if (chunk.usage) {
                             controller.enqueue({
@@ -276,7 +297,6 @@ export class OpenAIChatModel extends ChatModel {
                             });
                         }
                     }
-                    text = text || refusal;
                     if (jsonMode && text) {
                         controller.enqueue({
                             delta: {
@@ -298,6 +318,9 @@ export class OpenAIChatModel extends ChatModel {
                             },
                         });
                     }
+                    if (refusal) {
+                        controller.error(new Error(`Got refusal from LLM: ${refusal}`));
+                    }
                     controller.close();
                 }
                 catch (error) {

package/lib/esm/openai-video-model.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { VideoModel, type VideoModelInput, type VideoModelOptions, type VideoModelOutput } from "@aigne/core";
+import { type AgentInvokeOptions, VideoModel, type VideoModelInput, type VideoModelOptions, type VideoModelOutput } from "@aigne/core";
 import type OpenAI from "openai";
 import type { ClientOptions } from "openai";
 /**
@@ -6,9 +6,29 @@ import type { ClientOptions } from "openai";
  */
 export interface OpenAIVideoModelInput extends VideoModelInput {
     /**
-     * Optional image reference that guides generation (file path or URL)
+     * Sora model to use for video generation
+     *
+     * - `sora-2`: Standard version, lower cost
+     * - `sora-2-pro`: Pro version, higher quality
+     *
+     * @default "sora-2"
+     */
+    model?: "sora-2" | "sora-2-pro";
+    /**
+     * Video resolution (width x height)
+     *
+     * - `720x1280`: Vertical video (9:16)
+     * - `1280x720`: Horizontal video (16:9)
+     * - `1024x1792`: Vertical video (9:16, higher resolution)
+     * - `1792x1024`: Horizontal video (16:9, higher resolution)
+     */
+    size?: "720x1280" | "1280x720" | "1024x1792" | "1792x1024";
+    /**
+     * Video duration in seconds
+     *
+     * @default "4"
      */
-    inputReference?: string;
+    seconds?: "4" | "8" | "12";
 }
 /**
  * Output from OpenAI Video Model
@@ -68,5 +88,5 @@ export declare class OpenAIVideoModel extends VideoModel<OpenAIVideoModelInput,
     };
     get modelOptions(): Omit<Partial<OpenAIVideoModelInput>, "model"> | undefined;
     downloadToFile(videoId: string): Promise<string>;
-    process(input: OpenAIVideoModelInput): Promise<OpenAIVideoModelOutput>;
+    process(input: OpenAIVideoModelInput, options: AgentInvokeOptions): Promise<OpenAIVideoModelOutput>;
 }

package/lib/esm/openai-video-model.js CHANGED Viewed

@@ -6,7 +6,9 @@ import { CustomOpenAI } from "./openai.js";
 const DEFAULT_MODEL = "sora-2";
 const DEFAULT_SECONDS = 4;
 const openAIVideoModelInputSchema = videoModelInputSchema.extend({
-    inputReference: z.string().optional(),
+    model: z.enum(["sora-2", "sora-2-pro"]).optional(),
+    seconds: z.enum(["4", "8", "12"]).optional(),
+    size: z.enum(["720x1280", "1280x720", "1024x1792", "1792x1024"]).optional(),
 });
 const openAIVideoModelOptionsSchema = z.object({
     apiKey: z.string().optional(),
@@ -61,7 +63,7 @@ export class OpenAIVideoModel extends VideoModel {
         const buffer = Buffer.from(arrayBuffer);
         return buffer.toString("base64");
     }
-    async process(input) {
+    async process(input, options) {
         const model = input.model ?? input.modelOptions?.model ?? this.credential.model;
         const createParams = {
             model: model,
@@ -71,9 +73,10 @@ export class OpenAIVideoModel extends VideoModel {
             createParams.seconds = input.seconds;
         if (input.size)
             createParams.size = input.size;
-        if (input.inputReference) {
-            createParams.input_reference =
-                input.inputReference;
+        if (input.image) {
+            createParams.input_reference = await this.transformFileType("file", input.image, options).then((file) => new File([Buffer.from(file.data, "base64")], file.filename || "image.png", {
+                type: file.mimeType,
+            }));
         }
         let video = await this.client.videos.create(createParams);
         logger.debug(`Video generation started: ${video.id}`);

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@aigne/openai",
-  "version": "0.16.4-beta.4",
+  "version": "0.16.4-beta.6",
   "description": "AIGNE OpenAI SDK for integrating with OpenAI's GPT models and API services",
   "publishConfig": {
     "access": "public"
@@ -38,8 +38,8 @@
     "@aigne/uuid": "^13.0.1",
     "openai": "^6.5.0",
     "zod": "^3.25.67",
-    "@aigne/core": "^1.65.0-beta.3",
-    "@aigne/platform-helpers": "^0.6.3"
+    "@aigne/platform-helpers": "^0.6.3",
+    "@aigne/core": "^1.65.0-beta.5"
   },
   "devDependencies": {
     "@types/bun": "^1.2.22",
@@ -47,7 +47,7 @@
     "npm-run-all": "^4.1.5",
     "rimraf": "^6.0.1",
     "typescript": "^5.9.2",
-    "@aigne/test-utils": "^0.5.57-beta.4"
+    "@aigne/test-utils": "^0.5.57-beta.6"
   },
   "scripts": {
     "lint": "tsc --noEmit",