npm - ai-world-sdk - Versions diffs - 1.5.5 → 1.5.6 - Mend

ai-world-sdk 1.5.5 → 1.5.6

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (8)

package/dist/cli/commands/image.js +0 -1
package/dist/config.d.ts +3 -3
package/dist/config.js +2 -2
package/dist/video_generation.d.ts +38 -3
package/package.json +1 -1
package/skills/ai-world-sdk/docs/image-generation.md +25 -2
package/skills/ai-world-sdk/docs/provider-and-models.md +3 -3
package/skills/ai-world-sdk/docs/video-generation.md +131 -9

package/dist/cli/commands/image.js CHANGED Viewed

@@ -180,7 +180,6 @@ function registerImageCommands(program) {
             });
         }
         catch (err) {
-            console.log('----image generate error', err, new Error().stack);
             (0, utils_1.handleError)(err, commandName);
         }
     });

package/dist/config.d.ts CHANGED Viewed

@@ -9,7 +9,7 @@
  *
  * 注意: {VERSION} 占位符会在构建时被替换为实际版本号
  */
-export declare const SDK_SIGNATURE = "AI_WORLD_SDK_V:1.5.5";
+export declare const SDK_SIGNATURE = "AI_WORLD_SDK_V:1.5.6";
 /**
  * 版本兼容性错误
  */
@@ -35,8 +35,8 @@ declare class SDKConfig {
     private _authCheckPromise;
     private _currentUser;
     private _cliMode;
-    readonly sdkSignature = "AI_WORLD_SDK_V:1.5.5";
-    readonly sdkVersion = "1.5.5";
+    readonly sdkSignature = "AI_WORLD_SDK_V:1.5.6";
+    readonly sdkVersion = "1.5.6";
     constructor();
     /**
      * Set global base URL

package/dist/config.js CHANGED Viewed

@@ -7,7 +7,7 @@ Object.defineProperty(exports, "__esModule", { value: true });
 exports.sdkConfig = exports.VersionCompatibilityError = exports.SDK_SIGNATURE = void 0;
 // SDK 版本号（构建时自动从 package.json 更新）
 // 此版本号会在运行 npm run build 时自动从 package.json 读取并更新
-const SDK_VERSION = "1.5.5";
+const SDK_VERSION = "1.5.6";
 /**
  * SDK 特征码 - 用于在构建后的 JS 文件中识别 SDK 版本
  * 格式: AI_WORLD_SDK_V:版本号
@@ -15,7 +15,7 @@ const SDK_VERSION = "1.5.5";
  *
  * 注意: {VERSION} 占位符会在构建时被替换为实际版本号
  */
-exports.SDK_SIGNATURE = "AI_WORLD_SDK_V:1.5.5";
+exports.SDK_SIGNATURE = "AI_WORLD_SDK_V:1.5.6";
 /**
  * 版本兼容性错误
  */

package/dist/video_generation.d.ts CHANGED Viewed

@@ -16,20 +16,55 @@ export interface VideoGenerationContentImage {
     image_url: {
         url: string;
     };
-    role: string;
+    role?: string;
+}
+export interface VideoGenerationContentVideo {
+    type: "video_url";
+    video_url: {
+        url: string;
+    };
+}
+export interface VideoGenerationContentAudio {
+    type: "audio_url";
+    audio_url: {
+        url: string;
+    };
 }
-export type VideoGenerationContent = VideoGenerationContentText | VideoGenerationContentImage;
+export type VideoGenerationContent = VideoGenerationContentText | VideoGenerationContentImage | VideoGenerationContentVideo | VideoGenerationContentAudio;
 export interface VideoGenerationRequest {
+    /** 文本提示词（文本生成视频，与 content 二选一） */
     prompt?: string;
+    /** 图像 URL（图像生成视频，与 content 二选一） */
     image_url?: string;
+    /** 模型名称。Seedance 1.x: doubao-seedance-1-0-pro-fast-251015; Seedance 2.0: doubao-seedance-2-0-260128, doubao-seedance-2-0-fast-260128 */
     model?: string;
+    /**
+     * 内容列表（高级用法，直接传递给 SDK）。
+     * 支持的类型: text, image_url, video_url, audio_url。
+     * 提供时忽略 prompt 和 image_url 字段。
+     *
+     * 示例 — 文本生成视频:
+     *   [{ type: "text", text: "A sunset over the ocean" }]
+     *
+     * 示例 — 图像生成视频（I2V）:
+     *   [{ type: "text", text: "The woman smiles" }, { type: "image_url", image_url: { url: "https://..." } }]
+     *
+     * 示例 — 首尾帧控制:
+     *   [{ type: "text", text: "flower blooms" }, { type: "image_url", image_url: { url: "first.jpg" } }, { type: "image_url", image_url: { url: "last.jpg" } }]
+     *
+     * 示例 — 多模态参考（Seedance 2.0）:
+     *   [{ type: "text", text: "..." }, { type: "image_url", image_url: { url: "..." } }, { type: "video_url", video_url: { url: "..." } }, { type: "audio_url", audio_url: { url: "..." } }]
+     */
     content?: VideoGenerationContent[];
     callback_url?: string;
     return_last_frame?: boolean;
     service_tier?: string;
     execution_expires_after?: number;
+    /** 视频时长（秒），Seedance 1.x: 1-10，Seedance 2.0: 5-15 */
     duration?: number;
-    aspect_ratio?: "16:9" | "9:16" | "1:1";
+    /** 宽高比: "16:9" | "9:16" | "1:1" | "adaptive"（I2V 时自适应原图比例） */
+    aspect_ratio?: string;
+    /** 分辨率: "720p" | "1080p" | "2k" */
     resolution?: string;
     user?: string;
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "ai-world-sdk",
-  "version": "1.5.5",
+  "version": "1.5.6",
   "description": "TypeScript SDK for AI World Platform - Chat Models, Image Generation, and Video Generation",
   "main": "dist/index.js",
   "types": "dist/index.d.ts",

package/skills/ai-world-sdk/docs/image-generation.md CHANGED Viewed

@@ -58,12 +58,35 @@ await client.generate({
 ## Gemini 图像生成
+`provider` 在构造函数中传入，而非 `generate()` 方法。
 ```typescript
 import { GeminiImageGenerationClient } from 'ai-world-sdk';
-const client = new GeminiImageGenerationClient({});
+// provider 在构造函数中指定
+const client = new GeminiImageGenerationClient({ provider: 'gemini' });
 const result = await client.generate({
   prompt: '一只可爱的小猫',
-  provider: 'gemini',
 });
+// result.images — 生成的图像列表
 ```
+### Gemini 图像对话（chat）
+```typescript
+const chatResult = await client.chat({
+  prompt: '把这只猫变成卡通风格',
+  image: 'data:image/png;base64,...',
+  model: 'gemini-3-pro-image-preview',
+});
+```
+### 参数说明
+| 参数 | 位置 | 说明 |
+|------|------|------|
+| `provider` | 构造函数 | 图像生成 Provider（如 `'gemini'`） |
+| `prompt` | `generate()` | 文本提示词 |
+| `model` | `generate()` | 模型名称（默认: `gemini-2.0-flash-exp-image-generation`，chat 默认: `gemini-3-pro-image-preview`） |
+| `image` | `generate()` / `chat()` | 输入图像（base64 或 URL） |
+| `aspect_ratio` | `generate()` | 宽高比 |

package/skills/ai-world-sdk/docs/provider-and-models.md CHANGED Viewed

@@ -15,7 +15,7 @@
 | `aiping` | `anthropic` | 平音 Claude |
 | `gemini` | `gemini` | Google 原生，仅限 Gemini 系列模型 |
 | `openrouter` | `openai` | OpenRouter 聚合服务，SDK 内部自动使用 `createOpenRouter` 和专用代理端点 `/api/llm/openrouter`。模型 ID 格式为 `provider/model`（如 `openai/gpt-4o-mini`、`anthropic/claude-sonnet-4-20250514`） |
-| `kunpo` | `openai` | KUNPO API 统一 LLM 网关（https://llm.ziy.cc），兼容 OpenAI 接口，一个 Key 访问 150+ 模型。SDK 内部使用 `createOpenAI` 并路由到专用代理 `/api/llm/kunpo` |
+| `kunpo` | `openai` | KUNPO API 统一 LLM 网关（https://llm.ziy.cc），兼容 OpenAI 接口，一个 Key 访问 150+ 模型。SDK 内部使用 `createOpenRouter` 并路由到专用代理 `/api/llm/kunpo` |
 ## EndpointType 与模型对应关系
@@ -26,7 +26,7 @@
 | `openai` | OpenAI 兼容 | 模型兼容 OpenAI 格式，可包括 GPT、以及经聚合的 Gemini/Claude 等（视 provider 能力） |
 | `openai` | OpenRouter 兼容 | 当 provider 为 `openrouter` 时，`endpointType` 传 `openai`，SDK 内部自动切换到 `createOpenRouter` 和专用代理端点 |
-规则：**anthropic 不是 provider**，仅 **api2img**、**shubiaobiao**、**aiping** 支持 EndpointType 为 `anthropic`（调用 Claude）；`gemini` provider 用 `gemini` endpoint；`openrouter` provider 的 `endpointType` 传 `openai`，SDK 内部会自动使用 `@openrouter/ai-sdk-provider` 的 `createOpenRouter` 并路由到专用代理 `/api/llm/openrouter`；`kunpo` provider 的 `endpointType` 传 `openai`，SDK 内部使用 `createOpenAI` 并路由到专用代理 `/api/llm/kunpo`；其余按上表组合。
+规则：**anthropic 不是 provider**，仅 **api2img**、**shubiaobiao**、**aiping** 支持 EndpointType 为 `anthropic`（调用 Claude）；`gemini` provider 用 `gemini` endpoint；`openrouter` provider 的 `endpointType` 传 `openai`，SDK 内部会自动使用 `@openrouter/ai-sdk-provider` 的 `createOpenRouter` 并路由到专用代理 `/api/llm/openrouter`；`kunpo` provider 的 `endpointType` 传 `openai`，SDK 内部使用 `createOpenRouter` 并路由到专用代理 `/api/llm/kunpo`；其余按上表组合。
 > `doubao` 不通过 `createProvider` 使用，豆包有专用客户端（见 image-generation.md / video-generation.md）。
@@ -62,7 +62,7 @@ or.languageModel('openai/gpt-4o-mini');
 or.languageModel('anthropic/claude-sonnet-4-20250514');
 or.languageModel('google/gemini-2.5-flash-preview');
-// KUNPO API（endpointType 传 'openai'，SDK 内部使用 createOpenAI + 专用代理 /api/llm/kunpo）
+// KUNPO API（endpointType 传 'openai'，SDK 内部使用 createOpenRouter + 专用代理 /api/llm/kunpo）
 // 兼容 OpenAI Chat Completions 格式，支持 150+ 模型
 const kp = createProvider('kunpo', 'openai', 'my-plugin');
 kp.languageModel('google/gemini-3.1-pro-preview');

package/skills/ai-world-sdk/docs/video-generation.md CHANGED Viewed

@@ -2,22 +2,32 @@
 ## 豆包视频生成（Seedance）
+参考文档: https://www.volcengine.com/docs/82379/1366799 (1.x) / https://www.volcengine.com/docs/82379/2291680 (2.0)
+具体模型列表: https://www.volcengine.com/docs/82379/1330310
+### 支持的模型
+| 模型 | 说明 |
+|------|------|
+| `doubao-seedance-2-0-260128` | Seedance 2.0 标准版 |
+| `doubao-seedance-2-0-fast-260128` | Seedance 2.0 快速版 |
+### 基本用法 — 文本生成视频
 ```typescript
 import { VideoGenerationClient } from 'ai-world-sdk';
 const client = new VideoGenerationClient({});
-// 创建任务
 const task = await client.create({
   prompt: '日落时分的海滩',
-  duration: 5,           // 1-10 秒
-  aspect_ratio: '16:9',  // '16:9' | '9:16' | '1:1'
+  duration: 5,
+  aspect_ratio: '16:9',
   resolution: '720p',
 });
-// 轮询直到完成
 const result = await client.poll(task.id, {
-  interval: 3000,
+  interval: 5000,
   timeout: 300000,
 });
@@ -26,6 +36,119 @@ if (result.status === 'succeeded') {
 }
 ```
+### 使用 content 参数（高级用法）
+`content` 参数是一个数组，支持以下类型：
+| type | 说明 | 限制 |
+|------|------|------|
+| `text` | 文本提示词 | 必须包含至少一个 |
+| `image_url` | 图像参考/首帧/尾帧 | 最多 9 张，每张 < 30MB |
+| `video_url` | 视频参考（Seedance 2.0） | 最多 3 个，2-15秒，< 50MB |
+| `audio_url` | 音频参考（Seedance 2.0） | 最多 3 个，MP3，< 15MB |
+当提供 `content` 时，`prompt` 和 `image_url` 字段将被忽略。
+#### 文本生成视频（T2V）
+```typescript
+const task = await client.create({
+  model: 'doubao-seedance-2-0-260128',
+  content: [
+    { type: 'text', text: 'A golden retriever running through a sunlit wheat field, cinematic' }
+  ],
+  resolution: '1080p',
+  aspect_ratio: '16:9',
+  duration: 5,
+});
+```
+#### 图像生成视频（I2V）
+```typescript
+const task = await client.create({
+  model: 'doubao-seedance-2-0-260128',
+  content: [
+    { type: 'text', text: 'The woman slowly turns her head and smiles' },
+    { type: 'image_url', image_url: { url: 'https://example.com/portrait.jpg' } }
+  ],
+  aspect_ratio: 'adaptive',
+  duration: 5,
+});
+```
+#### 首尾帧控制
+提供两张图片，模型自动识别为首尾帧模式，生成中间过渡动画：
+```typescript
+const task = await client.create({
+  model: 'doubao-seedance-2-0-260128',
+  content: [
+    { type: 'text', text: 'The flower blooms from bud to full open, macro lens' },
+    { type: 'image_url', image_url: { url: 'https://example.com/flower-bud.jpg' } },
+    { type: 'image_url', image_url: { url: 'https://example.com/flower-open.jpg' } }
+  ],
+  aspect_ratio: 'adaptive',
+  duration: 8,
+});
+```
+#### 多模态参考（Seedance 2.0）
+Seedance 2.0 支持同时传入图像、视频、音频参考：
+```typescript
+const task = await client.create({
+  model: 'doubao-seedance-2-0-260128',
+  content: [
+    { type: 'text', text: 'Match the visual style and add background audio' },
+    { type: 'image_url', image_url: { url: 'https://example.com/style-ref.jpg' } },
+    { type: 'video_url', video_url: { url: 'https://example.com/motion-ref.mp4' } },
+    { type: 'audio_url', audio_url: { url: 'https://example.com/bgm.mp3' } }
+  ],
+  duration: 10,
+  aspect_ratio: '16:9',
+});
+```
+### 参数说明
+| 参数 | 类型 | 说明 |
+|------|------|------|
+| `prompt` | `string` | 文本提示词（简化用法，与 content 二选一） |
+| `image_url` | `string` | 图像 URL（简化用法，与 content 二选一） |
+| `model` | `string` | 模型名称（默认: doubao-seedance-1-0-pro-fast-251015） |
+| `content` | `VideoGenerationContent[]` | 内容列表（高级用法，支持 text/image_url/video_url/audio_url） |
+| `duration` | `number` | 视频时长（秒），1.x: 1-10，2.0: 5-15 |
+| `aspect_ratio` | `string` | 宽高比: "16:9" / "9:16" / "1:1" / "adaptive" |
+| `resolution` | `string` | 分辨率: "720p" / "1080p" / "2k" |
+| `callback_url` | `string` | 回调 URL（任务完成时通知） |
+| `return_last_frame` | `boolean` | 是否返回最后一帧图像（用于链式生成） |
+### 轮询与链式生成
+使用 `return_last_frame: true` 获取最后一帧，将其作为下一段视频的首帧，实现长视频链式生成：
+```typescript
+const task1 = await client.create({
+  prompt: 'Scene 1: sunrise over mountains',
+  return_last_frame: true,
+  duration: 5,
+});
+const result1 = await client.poll(task1.id);
+if (result1.status === 'succeeded' && result1.content?.last_frame_url) {
+  const task2 = await client.create({
+    content: [
+      { type: 'text', text: 'Scene 2: camera zooms into the valley' },
+      { type: 'image_url', image_url: { url: result1.content.last_frame_url } }
+    ],
+    duration: 5,
+  });
+}
+```
 ## 豆包视频理解
 使用 `VideoUnderstandingClient` 分析视频内容。基于 Chat Completions API，支持传入视频 URL 进行理解分析。
@@ -48,7 +171,6 @@ import { VideoUnderstandingClient } from 'ai-world-sdk';
 const client = new VideoUnderstandingClient({});
-// 一行代码分析视频
 const description = await client.analyzeVideo(
   'https://example.com/video.mp4',
   { prompt: '请详细描述这个视频的内容' }
@@ -63,11 +185,11 @@ const response = await client.understand({
   video_url: 'https://example.com/video.mp4',
   prompt: '这个视频讲了什么？',
   model: 'doubao-seed-2-0-pro-260215',
-  fps: 1,         // 可选，视频采样帧率，默认为1秒，即每秒从视频中抽取一帧图像
+  fps: 1,
 });
 console.log(response.choices[0].message.content);
-console.log(response.usage); // { prompt_tokens, completion_tokens, total_tokens }
+console.log(response.usage);
 ```
 ### 流式请求
@@ -115,7 +237,7 @@ const response = await client.understand({
 });
 ```
-### 参数说明
+### 视频理解参数说明
 | 参数 | 类型 | 必填 | 说明 |
 |------|------|------|------|