@optima-chat/optima-agent 0.9.6 → 0.9.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (91)
  1. package/.claude/skills/.kb-skills-managed.json +9 -9
  2. package/.claude/skills/ads/SKILL.md +244 -244
  3. package/.claude/skills/ads/template/campaign/CREATIVES.md +18 -18
  4. package/.claude/skills/ads/template/campaign/NOTES.md +10 -10
  5. package/.claude/skills/ads/template/campaign/STRATEGY.md +29 -29
  6. package/.claude/skills/ads/template/user/ADS.md +29 -29
  7. package/.claude/skills/ads/template/user/LEARNINGS.md +15 -15
  8. package/.claude/skills/ads/template/user/PROGRESS.md +20 -20
  9. package/.claude/skills/ads/template/user/README.md +25 -25
  10. package/.claude/skills/ads/template/user/assets/.gitignore +2 -2
  11. package/.claude/skills/bi/SKILL.md +131 -131
  12. package/.claude/skills/browser/SKILL.md +201 -201
  13. package/.claude/skills/channels/SKILL.md +188 -188
  14. package/.claude/skills/collection/SKILL.md +88 -88
  15. package/.claude/skills/douyin/SKILL.md +408 -408
  16. package/.claude/skills/ffmpeg/SKILL.md +164 -164
  17. package/.claude/skills/gen/SKILL.md +279 -275
  18. package/.claude/skills/growth/SKILL.md +90 -90
  19. package/.claude/skills/growth/template/ACCOUNTS.md +14 -14
  20. package/.claude/skills/growth/template/CALENDAR.md +7 -7
  21. package/.claude/skills/growth/template/COMMENTS.md +7 -7
  22. package/.claude/skills/growth/template/GROWTH.md +37 -37
  23. package/.claude/skills/growth/template/PROGRESS.md +4 -4
  24. package/.claude/skills/growth/template/README.md +20 -20
  25. package/.claude/skills/growth/template/TOPICS.md +7 -7
  26. package/.claude/skills/homepage/SKILL.md +177 -177
  27. package/.claude/skills/i18n/SKILL.md +517 -517
  28. package/.claude/skills/ingesting-sources/SKILL.md +94 -94
  29. package/.claude/skills/initializing-kb/SKILL.md +117 -117
  30. package/.claude/skills/instagram/SKILL.md +321 -321
  31. package/.claude/skills/inventory/SKILL.md +328 -328
  32. package/.claude/skills/kol-outreach/SKILL.md +232 -232
  33. package/.claude/skills/kol-outreach/template/campaign/CONFIG.md +60 -60
  34. package/.claude/skills/kol-outreach/template/campaign/KOLS.md +6 -6
  35. package/.claude/skills/kol-outreach/template/campaign/PROGRESS.md +3 -3
  36. package/.claude/skills/kol-outreach/template/campaign/TEMPLATES.md +88 -88
  37. package/.claude/skills/kol-outreach/template/merchant/BRAND.md +36 -36
  38. package/.claude/skills/kol-outreach/template/merchant/CAMPAIGNS.md +6 -6
  39. package/.claude/skills/kol-outreach/template/merchant/MERCHANT_LIMITS.md +16 -16
  40. package/.claude/skills/kol-outreach/template/merchant/PROGRESS.md +4 -4
  41. package/.claude/skills/kol-outreach/template/merchant/README.md +20 -20
  42. package/.claude/skills/linting-the-wiki/SKILL.md +68 -68
  43. package/.claude/skills/logistics/SKILL.md +180 -180
  44. package/.claude/skills/markdown-pdf/SKILL.md +72 -72
  45. package/.claude/skills/merchant/SKILL.md +110 -110
  46. package/.claude/skills/multigrid-poster/SKILL.md +192 -0
  47. package/.claude/skills/multigrid-poster/layouts/2x2.json +34 -0
  48. package/.claude/skills/multigrid-poster/layouts/3x3.json +43 -0
  49. package/.claude/skills/multigrid-poster/scripts/compose.py +116 -0
  50. package/.claude/skills/multigrid-poster/scripts/placeholder.png +0 -0
  51. package/.claude/skills/multigrid-poster/shared/fonts/MaShanZheng-Regular.ttf +0 -0
  52. package/.claude/skills/order/SKILL.md +452 -452
  53. package/.claude/skills/product/SKILL.md +379 -379
  54. package/.claude/skills/product-page/SKILL.md +106 -106
  55. package/.claude/skills/querying-the-wiki/SKILL.md +59 -59
  56. package/.claude/skills/reddit/SKILL.md +277 -277
  57. package/.claude/skills/review/SKILL.md +321 -321
  58. package/.claude/skills/scout/SKILL.md +462 -462
  59. package/.claude/skills/sentinel/SKILL.md +281 -281
  60. package/.claude/skills/shein/SKILL.md +246 -246
  61. package/.claude/skills/shipping/SKILL.md +200 -200
  62. package/.claude/skills/shop-content/SKILL.md +101 -101
  63. package/.claude/skills/shopify/SKILL.md +282 -282
  64. package/.claude/skills/skillify/SKILL.md +114 -114
  65. package/.claude/skills/taobao/SKILL.md +238 -238
  66. package/.claude/skills/tiktok/SKILL.md +381 -381
  67. package/.claude/skills/twitter/SKILL.md +302 -302
  68. package/.claude/skills/updating-related-pages/SKILL.md +65 -65
  69. package/.claude/skills/video-edit/SKILL.md +143 -143
  70. package/.claude/skills/video-gen/SKILL.md +548 -571
  71. package/.claude/skills/video-gen/templates/INDEX.md +78 -78
  72. package/.claude/skills/video-gen/templates/before-after-beauty.md +183 -183
  73. package/.claude/skills/video-gen/templates/drama-fmcg.md +183 -183
  74. package/.claude/skills/video-gen/templates/kol-reaction-food.md +193 -193
  75. package/.claude/skills/video-gen/templates/multi-point-apparel.md +185 -185
  76. package/.claude/skills/video-gen/templates/pain-solution-home.md +184 -184
  77. package/.claude/skills/video-gen/templates/pdp-360-showcase.md +189 -189
  78. package/.claude/skills/video-gen/templates/pdp-feature-highlight.md +182 -182
  79. package/.claude/skills/video-gen/templates/scene-digital.md +183 -183
  80. package/.claude/skills/wechat/SKILL.md +174 -161
  81. package/.claude/skills/xhs/SKILL.md +170 -170
  82. package/README.md +276 -276
  83. package/dist/bin/optima.js +26 -26
  84. package/dist/bin/serve.js +23 -23
  85. package/dist/src/agent.js +4 -4
  86. package/dist/src/system-prompt.d.ts.map +1 -1
  87. package/dist/src/system-prompt.js +169 -168
  88. package/dist/src/system-prompt.js.map +1 -1
  89. package/dist/src/tools/memory.js +10 -10
  90. package/dist/src/ui/headless.js +7 -7
  91. package/package.json +79 -79
@@ -1,275 +1,279 @@
1
- ---
2
- name: gen
3
- description: "生成和编辑图片/语音/虚拟试穿。使用场景:生成图片(generate images/生成图片/画图)、编辑图片(edit images/编辑图片/图生图/风格转换)、文本转语音(TTS/语音合成/朗读)、语音识别(ASR/语音转文字/转录)、虚拟试穿(virtual try-on/试穿/换装/试衣)。视频生成请使用 video-gen skill。"
4
- ---
5
-
6
- # AI 内容生成工具
7
-
8
- ## 图片生成
9
-
10
- ### 标准工作流程
11
-
12
- ```bash
13
- # 文生图
14
- gen image "提示词" -o /home/aiuser/project/result.png
15
-
16
- # 图片编辑/风格转换
17
- gen image "转成水彩风格" -i photo.png -o /home/aiuser/project/result.png
18
-
19
- # 读取并描述结果
20
- Read /home/aiuser/project/result.png
21
- ```
22
-
23
- ### gen image 命令
24
-
25
- 统一的图像生成/编辑命令。
26
-
27
- ```bash
28
- gen image <prompt> [options]
29
- ```
30
-
31
- #### 参数
32
-
33
- | 参数 | 说明 |
34
- |------|------|
35
- | `-i, --input <path>` | 输入图像(可多次使用,最多 8 张) |
36
- | `-W, --width <px>` | 输出宽度(默认 1024,最大 2048) |
37
- | `-H, --height <px>` | 输出高度(默认 1024,最大 2048) |
38
- | `-o, --output <path>` | 输出目录或完整路径 |
39
- | `-s, --seed <number>` | 随机种子(可复现结果) |
40
- | `-f, --format <fmt>` | 输出格式:jpeg \| png |
41
-
42
- ### 工作流示例
43
-
44
- #### 文生图
45
-
46
- ```bash
47
- gen image "a cute fluffy cat sitting on a windowsill, natural lighting" -o /home/aiuser/project/cat.png
48
- Read /home/aiuser/project/cat.png
49
- ```
50
-
51
- #### 图片风格转换
52
-
53
- ```bash
54
- gen image "watercolor painting style, artistic brushstrokes" -i photo.jpg -o /home/aiuser/project/watercolor.png
55
- Read /home/aiuser/project/watercolor.png
56
- ```
57
-
58
- #### 多图风格融合
59
-
60
- 将第一张图的风格应用到第二张图的内容上:
61
-
62
- ```bash
63
- gen image "apply the artistic style from image 1 to the content of image 2" -i style.png -i content.png -o /home/aiuser/project/fusion.png
64
- Read /home/aiuser/project/fusion.png
65
- ```
66
-
67
- #### 多图元素组合
68
-
69
- 从多张图中提取元素组合成新图:
70
-
71
- ```bash
72
- gen image "The person from image 1 is petting the cat from image 2, in a cozy living room" -i person.jpg -i cat.jpg -o /home/aiuser/project/combined.png
73
- ```
74
-
75
- #### 精确颜色控制
76
-
77
- 使用 hex code 指定精确颜色:
78
-
79
- ```bash
80
- gen image "a modern logo with brand color #02eb3c as the primary accent" -o /home/aiuser/project/logo.png
81
- ```
82
-
83
- #### 产品海报
84
-
85
- ```bash
86
- gen image "Disney Pixar style 3D poster, [产品描述], cute character, vibrant gradient background, professional studio lighting" -W 1024 -H 1024 -o /home/aiuser/project/poster.png
87
- ```
88
-
89
- ### 提示词指南(FLUX.2)
90
-
91
- #### 结构
92
-
93
- **Subject + Action + Style + Context**
94
-
95
- 词序很重要,靠前的元素优先级更高。
96
-
97
- #### 长度建议
98
-
99
- | 长度 | 词数 | 适用场景 |
100
- |------|------|----------|
101
- | 短 | 10-30 | 快速概念探索 |
102
- | 中 | 30-80 | 大多数项目(推荐) |
103
- | 长 | 80+ | 复杂场景 |
104
-
105
- #### 最佳实践
106
-
107
- | 技巧 | 说明 | 示例 |
108
- |------|------|------|
109
- | 描述想要的 | 不支持负向提示词 | "sharp focus" 而非 "no blur" |
110
- | 精确颜色 | 使用 hex code | `"brand color #1a1a2e"` |
111
- | 文字渲染 | 用引号包裹文字 | `"The text 'OPEN' in red neon"` |
112
- | 摄影风格 | 指定相机/镜头 | `"shot on Fujifilm X-T5, 35mm f/1.4"` |
113
- | 多语言 | 用原生语言更地道 | 法语描述巴黎场景 |
114
-
115
- #### 示例对比
116
-
117
- ```bash
118
- # 简单
119
- gen image "a robot"
120
-
121
- # 添加风格
122
- gen image "a friendly AI robot, cute cartoon style, bright colors, 3D render"
123
-
124
- # 完整描述
125
- gen image "Disney Pixar style 3D animated robot character, friendly cheerful expression, wearing headset, surrounded by floating icons, gradient purple-blue background, professional studio lighting, vibrant colors"
126
- ```
127
-
128
- ### 分辨率选择
129
-
130
- 最大 2048x2048。
131
-
132
- | 用途 | 分辨率 |
133
- |------|--------|
134
- | 社交媒体 | 1024x1024 |
135
- | 宽屏壁纸 | 1920x1088 |
136
- | 竖屏海报 | 768x1280 |
137
-
138
- ### 生成规则
139
-
140
- #### 生成后
141
- - 使用 Read 工具查看生成的图片
142
- - 向用户描述图片内容(颜色、风格、构图、元素)
143
- - 验证是否符合用户要求
144
-
145
- #### 多图参考
146
- - 最多 8 张输入图
147
-
148
- ## 虚拟试穿 (Virtual Try-On)
149
-
150
- 使用 FASHN AI tryon-v1.6 将服装穿到人物照片上。
151
-
152
- ```bash
153
- gen tryon <人物照片> <服装照片> [options]
154
- ```
155
-
156
- ### 参数
157
-
158
- | 参数 | 说明 | 默认值 |
159
- |------|------|--------|
160
- | `-o, --output <path>` | 输出文件路径 | `./gen-output/tryon_{timestamp}.png` |
161
- | `-c, --category <type>` | 服装类别:auto \| tops \| bottoms \| one-pieces | auto |
162
- | `-m, --mode <mode>` | 生成模式:performance \| balanced \| quality | quality |
163
- | `--garment-type <type>` | 服装照片类型:auto \| flat-lay \| model | auto |
164
- | `-n, --num-samples <n>` | 生成数量 (1-4) | 1 |
165
- | `--format <fmt>` | 输出格式:png \| jpeg | png |
166
- | `--seed <n>` | 随机种子(可复现) | - |
167
-
168
- ### 示例
169
-
170
- ```bash
171
- # 基本用法
172
- gen tryon person.jpg garment.jpg -o /home/aiuser/project/result.png
173
- Read /home/aiuser/project/result.png
174
-
175
- # 使用 URL 图片
176
- gen tryon https://example.com/model.jpg https://example.com/dress.jpg -o /home/aiuser/project/result.png
177
-
178
- # 指定服装类别和快速模式
179
- gen tryon person.jpg top.jpg -c tops -m performance -o /home/aiuser/project/result.png
180
-
181
- # 生成多张结果
182
- gen tryon person.jpg dress.jpg -n 4 -c one-pieces -o /home/aiuser/project/result.png
183
- ```
184
-
185
- ### 注意事项
186
-
187
- - 支持本地图片路径和 URL
188
- - 服装类别:auto (自动检测), tops (上装), bottoms (下装), one-pieces (连体)
189
- - 三种模式:performance (~7s), balanced (~9s), quality (~13s)
190
- - 默认保存到 `./gen-output/`
191
-
192
- ## 语音合成 (TTS)
193
-
194
- 使用 DashScope qwen3-tts-flash 将文本转为语音。
195
-
196
- ```bash
197
- gen tts <文本> [options]
198
- ```
199
-
200
- ### 参数
201
-
202
- | 参数 | 说明 | 默认值 |
203
- |------|------|--------|
204
- | `-o, --output <path>` | 输出文件路径 | `./gen-output/tts_{timestamp}.wav` |
205
- | `--voice <name>` | 声音名称 | Cherry |
206
- | `--voices` | 列出可用声音 | - |
207
- | `--play` | 生成后自动播放 | - |
208
-
209
- ### 可用声音
210
-
211
- - 女声:Cherry, Serena, Chelsie, Aria, Bella, Vivian, Jennifer, Katerina, Breeze, Maple, Sakura
212
- - 男声:Ethan, Aiden, Brandon, Ryan, Luke, Leo
213
-
214
- ### 示例
215
-
216
- ```bash
217
- # 中文语音合成
218
- gen tts "你好,欢迎使用语音合成功能" -o /home/aiuser/project/hello.wav
219
-
220
- # 指定男声
221
- gen tts "Hello, welcome!" --voice Ethan -o /home/aiuser/project/greeting.wav
222
-
223
- # 生成后播放
224
- gen tts "测试语音" --play -o /home/aiuser/project/test.wav
225
- ```
226
-
227
- ### 注意事项
228
-
229
- - 输出格式为 WAV
230
- - 最大 5000 字符
231
- - 支持中、英、日、韩、法、德等 10 种语言(自动检测)
232
- - 默认保存到 `./gen-output/`
233
-
234
- ## 语音识别 (ASR)
235
-
236
- 使用 Groq Whisper 将语音转为文字。
237
-
238
- ```bash
239
- gen asr <音频文件> [options]
240
- ```
241
-
242
- ### 参数
243
-
244
- | 参数 | 说明 | 默认值 |
245
- |------|------|--------|
246
- | `--language <lang>` | 语言提示:zh \| en \| ja \| ko 等 | 自动检测 |
247
- | `--model <name>` | Whisper 模型 | whisper-large-v3-turbo |
248
-
249
- ### 示例
250
-
251
- ```bash
252
- # 自动检测语言
253
- gen asr /home/aiuser/project/recording.mp3
254
-
255
- # 指定语言提示(提高准确率)
256
- gen asr /home/aiuser/project/recording.wav --language zh
257
- ```
258
-
259
- ### 注意事项
260
-
261
- - 支持 mp3, wav, m4a, ogg, webm 格式
262
- - 文件大小限制 25MB
263
-
264
- ## 任务管理
265
-
266
- 所有生成命令会自动等待完成。如需查看历史或管理任务:
267
-
268
- ```bash
269
- gen task list # 查看所有任务
270
- gen task list --type image # 按类型过滤
271
- gen task list --status failed # 按状态过滤
272
- gen task get <task_id> # 查看任务详情
273
- gen task cancel <task_id> # 取消任务
274
- gen task retry <task_id> # 重试失败的任务
275
- ```
1
+ ---
2
+ name: gen
3
+ description: "生成和编辑图片/语音/虚拟试穿。使用场景:生成图片(generate images/生成图片/画图)、编辑图片(edit images/编辑图片/图生图/风格转换)、文本转语音(TTS/语音合成/朗读)、语音识别(ASR/语音转文字/转录)、虚拟试穿(virtual try-on/试穿/换装/试衣)。视频生成请使用 video-gen skill。"
4
+ ---
5
+
6
+ # AI 内容生成工具
7
+
8
+ ## 图片生成
9
+
10
+ ### 标准工作流程
11
+
12
+ ```bash
13
+ # 文生图
14
+ gen image "提示词" -o /home/aiuser/project/result.png
15
+
16
+ # 图片编辑/风格转换
17
+ gen image "转成水彩风格" -i photo.png -o /home/aiuser/project/result.png
18
+
19
+ # 读取并描述结果
20
+ Read /home/aiuser/project/result.png
21
+ ```
22
+
23
+ ### gen image 命令
24
+
25
+ 统一的图像生成/编辑命令。
26
+
27
+ ```bash
28
+ gen image <prompt> [options]
29
+ ```
30
+
31
+ #### 参数
32
+
33
+ | 参数 | 说明 |
34
+ |------|------|
35
+ | `-i, --input <path>` | 输入图像(可多次使用,最多 8 张) |
36
+ | `-W, --width <px>` | 输出宽度(默认 1024,最大 2048) |
37
+ | `-H, --height <px>` | 输出高度(默认 1024,最大 2048) |
38
+ | `-o, --output <path>` | 输出目录或完整路径 |
39
+ | `-s, --seed <number>` | 随机种子(可复现结果) |
40
+ | `-f, --format <fmt>` | 输出格式:jpeg \| png |
41
+ | `--provider <name>` | 供应商:grsai(默认) \| bfl |
42
+ | `-m, --model <model>` | 模型:gpt-image-2(默认) \| nano-banana-fast \| nano-banana-pro \| flux-kontext-pro \| flux-kontext-max 等 |
43
+ | `--aspect-ratio <ratio>` | 宽高比:1:1 \| 16:9 \| 9:16 \| 4:3 等 |
44
+ | `--image-size <size>` | nano-banana-pro 输出尺寸:1K \| 2K \| 4K |
45
+
46
+ ### 工作流示例
47
+
48
+ #### 文生图
49
+
50
+ ```bash
51
+ gen image "a cute fluffy cat sitting on a windowsill, natural lighting" -o /home/aiuser/project/cat.png
52
+ Read /home/aiuser/project/cat.png
53
+ ```
54
+
55
+ #### 图片风格转换
56
+
57
+ ```bash
58
+ gen image "watercolor painting style, artistic brushstrokes" -i photo.jpg -o /home/aiuser/project/watercolor.png
59
+ Read /home/aiuser/project/watercolor.png
60
+ ```
61
+
62
+ #### 多图风格融合
63
+
64
+ 将第一张图的风格应用到第二张图的内容上:
65
+
66
+ ```bash
67
+ gen image "apply the artistic style from image 1 to the content of image 2" -i style.png -i content.png -o /home/aiuser/project/fusion.png
68
+ Read /home/aiuser/project/fusion.png
69
+ ```
70
+
71
+ #### 多图元素组合
72
+
73
+ 从多张图中提取元素组合成新图:
74
+
75
+ ```bash
76
+ gen image "The person from image 1 is petting the cat from image 2, in a cozy living room" -i person.jpg -i cat.jpg -o /home/aiuser/project/combined.png
77
+ ```
78
+
79
+ #### 精确颜色控制
80
+
81
+ 使用 hex code 指定精确颜色:
82
+
83
+ ```bash
84
+ gen image "a modern logo with brand color #02eb3c as the primary accent" -o /home/aiuser/project/logo.png
85
+ ```
86
+
87
+ #### 产品海报
88
+
89
+ ```bash
90
+ gen image "Disney Pixar style 3D poster, [产品描述], cute character, vibrant gradient background, professional studio lighting" -W 1024 -H 1024 -o /home/aiuser/project/poster.png
91
+ ```
92
+
93
+ ### 提示词指南
94
+
95
+ #### 结构
96
+
97
+ **Subject + Action + Style + Context**
98
+
99
+ 词序很重要,靠前的元素优先级更高。
100
+
101
+ #### 长度建议
102
+
103
+ | 长度 | 词数 | 适用场景 |
104
+ |------|------|----------|
105
+ | 短 | 10-30 | 快速概念探索 |
106
+ | 中 | 30-80 | 大多数项目(推荐) |
107
+ | 长 | 80+ | 复杂场景 |
108
+
109
+ #### 最佳实践
110
+
111
+ | 技巧 | 说明 | 示例 |
112
+ |------|------|------|
113
+ | 描述想要的 | 不支持负向提示词 | "sharp focus" 而非 "no blur" |
114
+ | 精确颜色 | 使用 hex code | `"brand color #1a1a2e"` |
115
+ | 文字渲染 | 用引号包裹文字 | `"The text 'OPEN' in red neon"` |
116
+ | 摄影风格 | 指定相机/镜头 | `"shot on Fujifilm X-T5, 35mm f/1.4"` |
117
+ | 多语言 | 用原生语言更地道 | 法语描述巴黎场景 |
118
+
119
+ #### 示例对比
120
+
121
+ ```bash
122
+ # 简单
123
+ gen image "a robot"
124
+
125
+ # 添加风格
126
+ gen image "a friendly AI robot, cute cartoon style, bright colors, 3D render"
127
+
128
+ # 完整描述
129
+ gen image "Disney Pixar style 3D animated robot character, friendly cheerful expression, wearing headset, surrounded by floating icons, gradient purple-blue background, professional studio lighting, vibrant colors"
130
+ ```
131
+
132
+ ### 分辨率选择
133
+
134
+ 最大 2048x2048。
135
+
136
+ | 用途 | 分辨率 |
137
+ |------|--------|
138
+ | 社交媒体 | 1024x1024 |
139
+ | 宽屏壁纸 | 1920x1088 |
140
+ | 竖屏海报 | 768x1280 |
141
+
142
+ ### 生成规则
143
+
144
+ #### 生成后
145
+ - 使用 Read 工具查看生成的图片
146
+ - 向用户描述图片内容(颜色、风格、构图、元素)
147
+ - 验证是否符合用户要求
148
+
149
+ #### 多图参考
150
+ - 最多 8 张输入图
151
+
152
+ ## 虚拟试穿 (Virtual Try-On)
153
+
154
+ 使用 FASHN AI tryon-v1.6 将服装穿到人物照片上。
155
+
156
+ ```bash
157
+ gen tryon <人物照片> <服装照片> [options]
158
+ ```
159
+
160
+ ### 参数
161
+
162
+ | 参数 | 说明 | 默认值 |
163
+ |------|------|--------|
164
+ | `-o, --output <path>` | 输出文件路径 | `./gen-output/tryon_{timestamp}.png` |
165
+ | `-c, --category <type>` | 服装类别:auto \| tops \| bottoms \| one-pieces | auto |
166
+ | `-m, --mode <mode>` | 生成模式:performance \| balanced \| quality | quality |
167
+ | `--garment-type <type>` | 服装照片类型:auto \| flat-lay \| model | auto |
168
+ | `-n, --num-samples <n>` | 生成数量 (1-4) | 1 |
169
+ | `--format <fmt>` | 输出格式:png \| jpeg | png |
170
+ | `--seed <n>` | 随机种子(可复现) | - |
171
+
172
+ ### 示例
173
+
174
+ ```bash
175
+ # 基本用法
176
+ gen tryon person.jpg garment.jpg -o /home/aiuser/project/result.png
177
+ Read /home/aiuser/project/result.png
178
+
179
+ # 使用 URL 图片
180
+ gen tryon https://example.com/model.jpg https://example.com/dress.jpg -o /home/aiuser/project/result.png
181
+
182
+ # 指定服装类别和快速模式
183
+ gen tryon person.jpg top.jpg -c tops -m performance -o /home/aiuser/project/result.png
184
+
185
+ # 生成多张结果
186
+ gen tryon person.jpg dress.jpg -n 4 -c one-pieces -o /home/aiuser/project/result.png
187
+ ```
188
+
189
+ ### 注意事项
190
+
191
+ - 支持本地图片路径和 URL
192
+ - 服装类别:auto (自动检测), tops (上装), bottoms (下装), one-pieces (连体)
193
+ - 三种模式:performance (~7s), balanced (~9s), quality (~13s)
194
+ - 默认保存到 `./gen-output/`
195
+
196
+ ## 语音合成 (TTS)
197
+
198
+ 使用 DashScope qwen3-tts-flash 将文本转为语音。
199
+
200
+ ```bash
201
+ gen tts <文本> [options]
202
+ ```
203
+
204
+ ### 参数
205
+
206
+ | 参数 | 说明 | 默认值 |
207
+ |------|------|--------|
208
+ | `-o, --output <path>` | 输出文件路径 | `./gen-output/tts_{timestamp}.wav` |
209
+ | `--voice <name>` | 声音名称 | Cherry |
210
+ | `--voices` | 列出可用声音 | - |
211
+ | `--play` | 生成后自动播放 | - |
212
+
213
+ ### 可用声音
214
+
215
+ - 女声:Cherry, Serena, Chelsie, Aria, Bella, Vivian, Jennifer, Katerina, Breeze, Maple, Sakura
216
+ - 男声:Ethan, Aiden, Brandon, Ryan, Luke, Leo
217
+
218
+ ### 示例
219
+
220
+ ```bash
221
+ # 中文语音合成
222
+ gen tts "你好,欢迎使用语音合成功能" -o /home/aiuser/project/hello.wav
223
+
224
+ # 指定男声
225
+ gen tts "Hello, welcome!" --voice Ethan -o /home/aiuser/project/greeting.wav
226
+
227
+ # 生成后播放
228
+ gen tts "测试语音" --play -o /home/aiuser/project/test.wav
229
+ ```
230
+
231
+ ### 注意事项
232
+
233
+ - 输出格式为 WAV
234
+ - 最大 5000 字符
235
+ - 支持中、英、日、韩、法、德等 10 种语言(自动检测)
236
+ - 默认保存到 `./gen-output/`
237
+
238
+ ## 语音识别 (ASR)
239
+
240
+ 使用 Groq Whisper 将语音转为文字。
241
+
242
+ ```bash
243
+ gen asr <音频文件> [options]
244
+ ```
245
+
246
+ ### 参数
247
+
248
+ | 参数 | 说明 | 默认值 |
249
+ |------|------|--------|
250
+ | `--language <lang>` | 语言提示:zh \| en \| ja \| ko 等 | 自动检测 |
251
+ | `--model <name>` | Whisper 模型 | whisper-large-v3-turbo |
252
+
253
+ ### 示例
254
+
255
+ ```bash
256
+ # 自动检测语言
257
+ gen asr /home/aiuser/project/recording.mp3
258
+
259
+ # 指定语言提示(提高准确率)
260
+ gen asr /home/aiuser/project/recording.wav --language zh
261
+ ```
262
+
263
+ ### 注意事项
264
+
265
+ - 支持 mp3, wav, m4a, ogg, webm 格式
266
+ - 文件大小限制 25MB
267
+
268
+ ## 任务管理
269
+
270
+ 所有生成命令会自动等待完成。如需查看历史或管理任务:
271
+
272
+ ```bash
273
+ gen task list # 查看所有任务
274
+ gen task list --type image # 按类型过滤
275
+ gen task list --status failed # 按状态过滤
276
+ gen task get <task_id> # 查看任务详情
277
+ gen task cancel <task_id> # 取消任务
278
+ gen task retry <task_id> # 重试失败的任务
279
+ ```