@optima-chat/optima-agent 0.9.8 → 0.9.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (171)
  1. package/.claude/settings.local.json +166 -0
  2. package/.claude/skills/.kb-skills-managed.json +9 -9
  3. package/.claude/skills/ads/SKILL.md +244 -244
  4. package/.claude/skills/ads/template/campaign/CREATIVES.md +18 -18
  5. package/.claude/skills/ads/template/campaign/NOTES.md +10 -10
  6. package/.claude/skills/ads/template/campaign/STRATEGY.md +29 -29
  7. package/.claude/skills/ads/template/user/ADS.md +29 -29
  8. package/.claude/skills/ads/template/user/LEARNINGS.md +15 -15
  9. package/.claude/skills/ads/template/user/PROGRESS.md +20 -20
  10. package/.claude/skills/ads/template/user/README.md +25 -25
  11. package/.claude/skills/ads/template/user/assets/.gitignore +2 -2
  12. package/.claude/skills/bi/SKILL.md +131 -131
  13. package/.claude/skills/browser/SKILL.md +201 -201
  14. package/.claude/skills/channels/SKILL.md +188 -188
  15. package/.claude/skills/collection/SKILL.md +88 -88
  16. package/.claude/skills/douyin/SKILL.md +408 -408
  17. package/.claude/skills/ffmpeg/SKILL.md +164 -164
  18. package/.claude/skills/gen/SKILL.md +279 -279
  19. package/.claude/skills/growth/SKILL.md +90 -90
  20. package/.claude/skills/growth/template/ACCOUNTS.md +14 -14
  21. package/.claude/skills/growth/template/CALENDAR.md +7 -7
  22. package/.claude/skills/growth/template/COMMENTS.md +7 -7
  23. package/.claude/skills/growth/template/GROWTH.md +37 -37
  24. package/.claude/skills/growth/template/PROGRESS.md +4 -4
  25. package/.claude/skills/growth/template/README.md +20 -20
  26. package/.claude/skills/growth/template/TOPICS.md +7 -7
  27. package/.claude/skills/homepage/SKILL.md +177 -177
  28. package/.claude/skills/i18n/SKILL.md +517 -517
  29. package/.claude/skills/ingesting-sources/SKILL.md +94 -94
  30. package/.claude/skills/initializing-kb/SKILL.md +117 -117
  31. package/.claude/skills/instagram/SKILL.md +321 -321
  32. package/.claude/skills/inventory/SKILL.md +328 -328
  33. package/.claude/skills/kol-outreach/SKILL.md +232 -232
  34. package/.claude/skills/kol-outreach/template/campaign/CONFIG.md +60 -60
  35. package/.claude/skills/kol-outreach/template/campaign/KOLS.md +6 -6
  36. package/.claude/skills/kol-outreach/template/campaign/PROGRESS.md +3 -3
  37. package/.claude/skills/kol-outreach/template/campaign/TEMPLATES.md +88 -88
  38. package/.claude/skills/kol-outreach/template/merchant/BRAND.md +36 -36
  39. package/.claude/skills/kol-outreach/template/merchant/CAMPAIGNS.md +6 -6
  40. package/.claude/skills/kol-outreach/template/merchant/MERCHANT_LIMITS.md +16 -16
  41. package/.claude/skills/kol-outreach/template/merchant/PROGRESS.md +4 -4
  42. package/.claude/skills/kol-outreach/template/merchant/README.md +20 -20
  43. package/.claude/skills/linting-the-wiki/SKILL.md +68 -68
  44. package/.claude/skills/logistics/SKILL.md +180 -180
  45. package/.claude/skills/markdown-pdf/SKILL.md +72 -72
  46. package/.claude/skills/merchant/SKILL.md +110 -110
  47. package/.claude/skills/multigrid-poster/SKILL.md +192 -192
  48. package/.claude/skills/multigrid-poster/layouts/2x2.json +34 -34
  49. package/.claude/skills/multigrid-poster/layouts/3x3.json +43 -43
  50. package/.claude/skills/multigrid-poster/scripts/compose.py +116 -116
  51. package/.claude/skills/order/SKILL.md +452 -452
  52. package/.claude/skills/product/SKILL.md +379 -379
  53. package/.claude/skills/product-page/SKILL.md +106 -106
  54. package/.claude/skills/querying-the-wiki/SKILL.md +59 -59
  55. package/.claude/skills/reddit/SKILL.md +277 -277
  56. package/.claude/skills/review/SKILL.md +321 -321
  57. package/.claude/skills/scout/SKILL.md +575 -462
  58. package/.claude/skills/sentinel/SKILL.md +281 -281
  59. package/.claude/skills/shein/SKILL.md +246 -246
  60. package/.claude/skills/shipping/SKILL.md +200 -200
  61. package/.claude/skills/shop-content/SKILL.md +101 -101
  62. package/.claude/skills/shopify/SKILL.md +282 -282
  63. package/.claude/skills/skillify/SKILL.md +114 -114
  64. package/.claude/skills/taobao/SKILL.md +238 -238
  65. package/.claude/skills/tiktok/SKILL.md +381 -381
  66. package/.claude/skills/twitter/SKILL.md +302 -302
  67. package/.claude/skills/updating-related-pages/SKILL.md +65 -65
  68. package/.claude/skills/video-edit/SKILL.md +143 -143
  69. package/.claude/skills/video-gen/SKILL.md +548 -548
  70. package/.claude/skills/video-gen/templates/INDEX.md +78 -78
  71. package/.claude/skills/video-gen/templates/before-after-beauty.md +183 -183
  72. package/.claude/skills/video-gen/templates/drama-fmcg.md +183 -183
  73. package/.claude/skills/video-gen/templates/kol-reaction-food.md +193 -193
  74. package/.claude/skills/video-gen/templates/multi-point-apparel.md +185 -185
  75. package/.claude/skills/video-gen/templates/pain-solution-home.md +184 -184
  76. package/.claude/skills/video-gen/templates/pdp-360-showcase.md +189 -189
  77. package/.claude/skills/video-gen/templates/pdp-feature-highlight.md +182 -182
  78. package/.claude/skills/video-gen/templates/scene-digital.md +183 -183
  79. package/.claude/skills/wechat/SKILL.md +174 -174
  80. package/.claude/skills/xhs/SKILL.md +170 -170
  81. package/README.md +276 -276
  82. package/dist/bin/bi-cli.js +0 -0
  83. package/dist/bin/browser-cli.js +0 -0
  84. package/dist/bin/comfy.d.ts +3 -0
  85. package/dist/bin/comfy.d.ts.map +1 -0
  86. package/dist/bin/comfy.js +3 -0
  87. package/dist/bin/comfy.js.map +1 -0
  88. package/dist/bin/commerce.js +0 -0
  89. package/dist/bin/gen.js +0 -0
  90. package/dist/bin/google-ads.js +0 -0
  91. package/dist/bin/growth.d.ts +3 -0
  92. package/dist/bin/growth.d.ts.map +1 -0
  93. package/dist/bin/growth.js +3 -0
  94. package/dist/bin/growth.js.map +1 -0
  95. package/dist/bin/logistics.js +0 -0
  96. package/dist/bin/optima.js +26 -26
  97. package/dist/bin/scout.js +0 -0
  98. package/dist/bin/sentinel.js +0 -0
  99. package/dist/bin/serve.js +23 -23
  100. package/dist/bin/shopify.js +0 -0
  101. package/dist/src/agent.js +4 -4
  102. package/dist/src/hooks-loader.d.ts +6 -0
  103. package/dist/src/hooks-loader.d.ts.map +1 -0
  104. package/dist/src/hooks-loader.js +215 -0
  105. package/dist/src/hooks-loader.js.map +1 -0
  106. package/dist/src/system-prompt.d.ts.map +1 -1
  107. package/dist/src/system-prompt.js +173 -169
  108. package/dist/src/system-prompt.js.map +1 -1
  109. package/dist/src/tools/memory.js +10 -10
  110. package/dist/src/ui/App.d.ts +6 -0
  111. package/dist/src/ui/App.d.ts.map +1 -0
  112. package/dist/src/ui/App.js +164 -0
  113. package/dist/src/ui/App.js.map +1 -0
  114. package/dist/src/ui/components/Composer.d.ts +10 -0
  115. package/dist/src/ui/components/Composer.d.ts.map +1 -0
  116. package/dist/src/ui/components/Composer.js +13 -0
  117. package/dist/src/ui/components/Composer.js.map +1 -0
  118. package/dist/src/ui/components/Header.d.ts +7 -0
  119. package/dist/src/ui/components/Header.d.ts.map +1 -0
  120. package/dist/src/ui/components/Header.js +7 -0
  121. package/dist/src/ui/components/Header.js.map +1 -0
  122. package/dist/src/ui/components/Message.d.ts +12 -0
  123. package/dist/src/ui/components/Message.d.ts.map +1 -0
  124. package/dist/src/ui/components/Message.js +21 -0
  125. package/dist/src/ui/components/Message.js.map +1 -0
  126. package/dist/src/ui/components/MessageList.d.ts +9 -0
  127. package/dist/src/ui/components/MessageList.d.ts.map +1 -0
  128. package/dist/src/ui/components/MessageList.js +18 -0
  129. package/dist/src/ui/components/MessageList.js.map +1 -0
  130. package/dist/src/ui/components/Spinner.d.ts +6 -0
  131. package/dist/src/ui/components/Spinner.d.ts.map +1 -0
  132. package/dist/src/ui/components/Spinner.js +7 -0
  133. package/dist/src/ui/components/Spinner.js.map +1 -0
  134. package/dist/src/ui/components/StatusBar.d.ts +11 -0
  135. package/dist/src/ui/components/StatusBar.d.ts.map +1 -0
  136. package/dist/src/ui/components/StatusBar.js +7 -0
  137. package/dist/src/ui/components/StatusBar.js.map +1 -0
  138. package/dist/src/ui/components/index.d.ts +7 -0
  139. package/dist/src/ui/components/index.d.ts.map +1 -0
  140. package/dist/src/ui/components/index.js +7 -0
  141. package/dist/src/ui/components/index.js.map +1 -0
  142. package/dist/src/ui/headless.js +7 -7
  143. package/dist/src/validation/error-formatter.d.ts +21 -0
  144. package/dist/src/validation/error-formatter.d.ts.map +1 -0
  145. package/dist/src/validation/error-formatter.js +98 -0
  146. package/dist/src/validation/error-formatter.js.map +1 -0
  147. package/dist/src/validation/index.d.ts +10 -0
  148. package/dist/src/validation/index.d.ts.map +1 -0
  149. package/dist/src/validation/index.js +10 -0
  150. package/dist/src/validation/index.js.map +1 -0
  151. package/dist/src/validation/json-validator.d.ts +25 -0
  152. package/dist/src/validation/json-validator.d.ts.map +1 -0
  153. package/dist/src/validation/json-validator.js +173 -0
  154. package/dist/src/validation/json-validator.js.map +1 -0
  155. package/dist/src/validation/schema.d.ts +353 -0
  156. package/dist/src/validation/schema.d.ts.map +1 -0
  157. package/dist/src/validation/schema.js +57 -0
  158. package/dist/src/validation/schema.js.map +1 -0
  159. package/dist/src/validation/suggestions.d.ts +25 -0
  160. package/dist/src/validation/suggestions.d.ts.map +1 -0
  161. package/dist/src/validation/suggestions.js +144 -0
  162. package/dist/src/validation/suggestions.js.map +1 -0
  163. package/dist/src/validation/types.d.ts +40 -0
  164. package/dist/src/validation/types.d.ts.map +1 -0
  165. package/dist/src/validation/types.js +5 -0
  166. package/dist/src/validation/types.js.map +1 -0
  167. package/dist/src/validation/yaml-validator.d.ts +25 -0
  168. package/dist/src/validation/yaml-validator.d.ts.map +1 -0
  169. package/dist/src/validation/yaml-validator.js +177 -0
  170. package/dist/src/validation/yaml-validator.js.map +1 -0
  171. package/package.json +79 -79
@@ -1,279 +1,279 @@
1
- ---
2
- name: gen
3
- description: "生成和编辑图片/语音/虚拟试穿。使用场景:生成图片(generate images/生成图片/画图)、编辑图片(edit images/编辑图片/图生图/风格转换)、文本转语音(TTS/语音合成/朗读)、语音识别(ASR/语音转文字/转录)、虚拟试穿(virtual try-on/试穿/换装/试衣)。视频生成请使用 video-gen skill。"
4
- ---
5
-
6
- # AI 内容生成工具
7
-
8
- ## 图片生成
9
-
10
- ### 标准工作流程
11
-
12
- ```bash
13
- # 文生图
14
- gen image "提示词" -o /home/aiuser/project/result.png
15
-
16
- # 图片编辑/风格转换
17
- gen image "转成水彩风格" -i photo.png -o /home/aiuser/project/result.png
18
-
19
- # 读取并描述结果
20
- Read /home/aiuser/project/result.png
21
- ```
22
-
23
- ### gen image 命令
24
-
25
- 统一的图像生成/编辑命令。
26
-
27
- ```bash
28
- gen image <prompt> [options]
29
- ```
30
-
31
- #### 参数
32
-
33
- | 参数 | 说明 |
34
- |------|------|
35
- | `-i, --input <path>` | 输入图像(可多次使用,最多 8 张) |
36
- | `-W, --width <px>` | 输出宽度(默认 1024,最大 2048) |
37
- | `-H, --height <px>` | 输出高度(默认 1024,最大 2048) |
38
- | `-o, --output <path>` | 输出目录或完整路径 |
39
- | `-s, --seed <number>` | 随机种子(可复现结果) |
40
- | `-f, --format <fmt>` | 输出格式:jpeg \| png |
41
- | `--provider <name>` | 供应商:grsai(默认) \| bfl |
42
- | `-m, --model <model>` | 模型:gpt-image-2(默认) \| nano-banana-fast \| nano-banana-pro \| flux-kontext-pro \| flux-kontext-max 等 |
43
- | `--aspect-ratio <ratio>` | 宽高比:1:1 \| 16:9 \| 9:16 \| 4:3 等 |
44
- | `--image-size <size>` | nano-banana-pro 输出尺寸:1K \| 2K \| 4K |
45
-
46
- ### 工作流示例
47
-
48
- #### 文生图
49
-
50
- ```bash
51
- gen image "a cute fluffy cat sitting on a windowsill, natural lighting" -o /home/aiuser/project/cat.png
52
- Read /home/aiuser/project/cat.png
53
- ```
54
-
55
- #### 图片风格转换
56
-
57
- ```bash
58
- gen image "watercolor painting style, artistic brushstrokes" -i photo.jpg -o /home/aiuser/project/watercolor.png
59
- Read /home/aiuser/project/watercolor.png
60
- ```
61
-
62
- #### 多图风格融合
63
-
64
- 将第一张图的风格应用到第二张图的内容上:
65
-
66
- ```bash
67
- gen image "apply the artistic style from image 1 to the content of image 2" -i style.png -i content.png -o /home/aiuser/project/fusion.png
68
- Read /home/aiuser/project/fusion.png
69
- ```
70
-
71
- #### 多图元素组合
72
-
73
- 从多张图中提取元素组合成新图:
74
-
75
- ```bash
76
- gen image "The person from image 1 is petting the cat from image 2, in a cozy living room" -i person.jpg -i cat.jpg -o /home/aiuser/project/combined.png
77
- ```
78
-
79
- #### 精确颜色控制
80
-
81
- 使用 hex code 指定精确颜色:
82
-
83
- ```bash
84
- gen image "a modern logo with brand color #02eb3c as the primary accent" -o /home/aiuser/project/logo.png
85
- ```
86
-
87
- #### 产品海报
88
-
89
- ```bash
90
- gen image "Disney Pixar style 3D poster, [产品描述], cute character, vibrant gradient background, professional studio lighting" -W 1024 -H 1024 -o /home/aiuser/project/poster.png
91
- ```
92
-
93
- ### 提示词指南
94
-
95
- #### 结构
96
-
97
- **Subject + Action + Style + Context**
98
-
99
- 词序很重要,靠前的元素优先级更高。
100
-
101
- #### 长度建议
102
-
103
- | 长度 | 词数 | 适用场景 |
104
- |------|------|----------|
105
- | 短 | 10-30 | 快速概念探索 |
106
- | 中 | 30-80 | 大多数项目(推荐) |
107
- | 长 | 80+ | 复杂场景 |
108
-
109
- #### 最佳实践
110
-
111
- | 技巧 | 说明 | 示例 |
112
- |------|------|------|
113
- | 描述想要的 | 不支持负向提示词 | "sharp focus" 而非 "no blur" |
114
- | 精确颜色 | 使用 hex code | `"brand color #1a1a2e"` |
115
- | 文字渲染 | 用引号包裹文字 | `"The text 'OPEN' in red neon"` |
116
- | 摄影风格 | 指定相机/镜头 | `"shot on Fujifilm X-T5, 35mm f/1.4"` |
117
- | 多语言 | 用原生语言更地道 | 法语描述巴黎场景 |
118
-
119
- #### 示例对比
120
-
121
- ```bash
122
- # 简单
123
- gen image "a robot"
124
-
125
- # 添加风格
126
- gen image "a friendly AI robot, cute cartoon style, bright colors, 3D render"
127
-
128
- # 完整描述
129
- gen image "Disney Pixar style 3D animated robot character, friendly cheerful expression, wearing headset, surrounded by floating icons, gradient purple-blue background, professional studio lighting, vibrant colors"
130
- ```
131
-
132
- ### 分辨率选择
133
-
134
- 最大 2048x2048。
135
-
136
- | 用途 | 分辨率 |
137
- |------|--------|
138
- | 社交媒体 | 1024x1024 |
139
- | 宽屏壁纸 | 1920x1088 |
140
- | 竖屏海报 | 768x1280 |
141
-
142
- ### 生成规则
143
-
144
- #### 生成后
145
- - 使用 Read 工具查看生成的图片
146
- - 向用户描述图片内容(颜色、风格、构图、元素)
147
- - 验证是否符合用户要求
148
-
149
- #### 多图参考
150
- - 最多 8 张输入图
151
-
152
- ## 虚拟试穿 (Virtual Try-On)
153
-
154
- 使用 FASHN AI tryon-v1.6 将服装穿到人物照片上。
155
-
156
- ```bash
157
- gen tryon <人物照片> <服装照片> [options]
158
- ```
159
-
160
- ### 参数
161
-
162
- | 参数 | 说明 | 默认值 |
163
- |------|------|--------|
164
- | `-o, --output <path>` | 输出文件路径 | `./gen-output/tryon_{timestamp}.png` |
165
- | `-c, --category <type>` | 服装类别:auto \| tops \| bottoms \| one-pieces | auto |
166
- | `-m, --mode <mode>` | 生成模式:performance \| balanced \| quality | quality |
167
- | `--garment-type <type>` | 服装照片类型:auto \| flat-lay \| model | auto |
168
- | `-n, --num-samples <n>` | 生成数量 (1-4) | 1 |
169
- | `--format <fmt>` | 输出格式:png \| jpeg | png |
170
- | `--seed <n>` | 随机种子(可复现) | - |
171
-
172
- ### 示例
173
-
174
- ```bash
175
- # 基本用法
176
- gen tryon person.jpg garment.jpg -o /home/aiuser/project/result.png
177
- Read /home/aiuser/project/result.png
178
-
179
- # 使用 URL 图片
180
- gen tryon https://example.com/model.jpg https://example.com/dress.jpg -o /home/aiuser/project/result.png
181
-
182
- # 指定服装类别和快速模式
183
- gen tryon person.jpg top.jpg -c tops -m performance -o /home/aiuser/project/result.png
184
-
185
- # 生成多张结果
186
- gen tryon person.jpg dress.jpg -n 4 -c one-pieces -o /home/aiuser/project/result.png
187
- ```
188
-
189
- ### 注意事项
190
-
191
- - 支持本地图片路径和 URL
192
- - 服装类别:auto (自动检测), tops (上装), bottoms (下装), one-pieces (连体)
193
- - 三种模式:performance (~7s), balanced (~9s), quality (~13s)
194
- - 默认保存到 `./gen-output/`
195
-
196
- ## 语音合成 (TTS)
197
-
198
- 使用 DashScope qwen3-tts-flash 将文本转为语音。
199
-
200
- ```bash
201
- gen tts <文本> [options]
202
- ```
203
-
204
- ### 参数
205
-
206
- | 参数 | 说明 | 默认值 |
207
- |------|------|--------|
208
- | `-o, --output <path>` | 输出文件路径 | `./gen-output/tts_{timestamp}.wav` |
209
- | `--voice <name>` | 声音名称 | Cherry |
210
- | `--voices` | 列出可用声音 | - |
211
- | `--play` | 生成后自动播放 | - |
212
-
213
- ### 可用声音
214
-
215
- - 女声:Cherry, Serena, Chelsie, Aria, Bella, Vivian, Jennifer, Katerina, Breeze, Maple, Sakura
216
- - 男声:Ethan, Aiden, Brandon, Ryan, Luke, Leo
217
-
218
- ### 示例
219
-
220
- ```bash
221
- # 中文语音合成
222
- gen tts "你好,欢迎使用语音合成功能" -o /home/aiuser/project/hello.wav
223
-
224
- # 指定男声
225
- gen tts "Hello, welcome!" --voice Ethan -o /home/aiuser/project/greeting.wav
226
-
227
- # 生成后播放
228
- gen tts "测试语音" --play -o /home/aiuser/project/test.wav
229
- ```
230
-
231
- ### 注意事项
232
-
233
- - 输出格式为 WAV
234
- - 最大 5000 字符
235
- - 支持中、英、日、韩、法、德等 10 种语言(自动检测)
236
- - 默认保存到 `./gen-output/`
237
-
238
- ## 语音识别 (ASR)
239
-
240
- 使用 Groq Whisper 将语音转为文字。
241
-
242
- ```bash
243
- gen asr <音频文件> [options]
244
- ```
245
-
246
- ### 参数
247
-
248
- | 参数 | 说明 | 默认值 |
249
- |------|------|--------|
250
- | `--language <lang>` | 语言提示:zh \| en \| ja \| ko 等 | 自动检测 |
251
- | `--model <name>` | Whisper 模型 | whisper-large-v3-turbo |
252
-
253
- ### 示例
254
-
255
- ```bash
256
- # 自动检测语言
257
- gen asr /home/aiuser/project/recording.mp3
258
-
259
- # 指定语言提示(提高准确率)
260
- gen asr /home/aiuser/project/recording.wav --language zh
261
- ```
262
-
263
- ### 注意事项
264
-
265
- - 支持 mp3, wav, m4a, ogg, webm 格式
266
- - 文件大小限制 25MB
267
-
268
- ## 任务管理
269
-
270
- 所有生成命令会自动等待完成。如需查看历史或管理任务:
271
-
272
- ```bash
273
- gen task list # 查看所有任务
274
- gen task list --type image # 按类型过滤
275
- gen task list --status failed # 按状态过滤
276
- gen task get <task_id> # 查看任务详情
277
- gen task cancel <task_id> # 取消任务
278
- gen task retry <task_id> # 重试失败的任务
279
- ```
1
+ ---
2
+ name: gen
3
+ description: "生成和编辑图片/语音/虚拟试穿。使用场景:生成图片(generate images/生成图片/画图)、编辑图片(edit images/编辑图片/图生图/风格转换)、文本转语音(TTS/语音合成/朗读)、语音识别(ASR/语音转文字/转录)、虚拟试穿(virtual try-on/试穿/换装/试衣)。视频生成请使用 video-gen skill。"
4
+ ---
5
+
6
+ # AI 内容生成工具
7
+
8
+ ## 图片生成
9
+
10
+ ### 标准工作流程
11
+
12
+ ```bash
13
+ # 文生图
14
+ gen image "提示词" -o /home/aiuser/project/result.png
15
+
16
+ # 图片编辑/风格转换
17
+ gen image "转成水彩风格" -i photo.png -o /home/aiuser/project/result.png
18
+
19
+ # 读取并描述结果
20
+ Read /home/aiuser/project/result.png
21
+ ```
22
+
23
+ ### gen image 命令
24
+
25
+ 统一的图像生成/编辑命令。
26
+
27
+ ```bash
28
+ gen image <prompt> [options]
29
+ ```
30
+
31
+ #### 参数
32
+
33
+ | 参数 | 说明 |
34
+ |------|------|
35
+ | `-i, --input <path>` | 输入图像(可多次使用,最多 8 张) |
36
+ | `-W, --width <px>` | 输出宽度(默认 1024,最大 2048) |
37
+ | `-H, --height <px>` | 输出高度(默认 1024,最大 2048) |
38
+ | `-o, --output <path>` | 输出目录或完整路径 |
39
+ | `-s, --seed <number>` | 随机种子(可复现结果) |
40
+ | `-f, --format <fmt>` | 输出格式:jpeg \| png |
41
+ | `--provider <name>` | 供应商:grsai(默认) \| bfl |
42
+ | `-m, --model <model>` | 模型:gpt-image-2(默认) \| nano-banana-fast \| nano-banana-pro \| flux-kontext-pro \| flux-kontext-max 等 |
43
+ | `--aspect-ratio <ratio>` | 宽高比:1:1 \| 16:9 \| 9:16 \| 4:3 等 |
44
+ | `--image-size <size>` | nano-banana-pro 输出尺寸:1K \| 2K \| 4K |
45
+
46
+ ### 工作流示例
47
+
48
+ #### 文生图
49
+
50
+ ```bash
51
+ gen image "a cute fluffy cat sitting on a windowsill, natural lighting" -o /home/aiuser/project/cat.png
52
+ Read /home/aiuser/project/cat.png
53
+ ```
54
+
55
+ #### 图片风格转换
56
+
57
+ ```bash
58
+ gen image "watercolor painting style, artistic brushstrokes" -i photo.jpg -o /home/aiuser/project/watercolor.png
59
+ Read /home/aiuser/project/watercolor.png
60
+ ```
61
+
62
+ #### 多图风格融合
63
+
64
+ 将第一张图的风格应用到第二张图的内容上:
65
+
66
+ ```bash
67
+ gen image "apply the artistic style from image 1 to the content of image 2" -i style.png -i content.png -o /home/aiuser/project/fusion.png
68
+ Read /home/aiuser/project/fusion.png
69
+ ```
70
+
71
+ #### 多图元素组合
72
+
73
+ 从多张图中提取元素组合成新图:
74
+
75
+ ```bash
76
+ gen image "The person from image 1 is petting the cat from image 2, in a cozy living room" -i person.jpg -i cat.jpg -o /home/aiuser/project/combined.png
77
+ ```
78
+
79
+ #### 精确颜色控制
80
+
81
+ 使用 hex code 指定精确颜色:
82
+
83
+ ```bash
84
+ gen image "a modern logo with brand color #02eb3c as the primary accent" -o /home/aiuser/project/logo.png
85
+ ```
86
+
87
+ #### 产品海报
88
+
89
+ ```bash
90
+ gen image "Disney Pixar style 3D poster, [产品描述], cute character, vibrant gradient background, professional studio lighting" -W 1024 -H 1024 -o /home/aiuser/project/poster.png
91
+ ```
92
+
93
+ ### 提示词指南
94
+
95
+ #### 结构
96
+
97
+ **Subject + Action + Style + Context**
98
+
99
+ 词序很重要,靠前的元素优先级更高。
100
+
101
+ #### 长度建议
102
+
103
+ | 长度 | 词数 | 适用场景 |
104
+ |------|------|----------|
105
+ | 短 | 10-30 | 快速概念探索 |
106
+ | 中 | 30-80 | 大多数项目(推荐) |
107
+ | 长 | 80+ | 复杂场景 |
108
+
109
+ #### 最佳实践
110
+
111
+ | 技巧 | 说明 | 示例 |
112
+ |------|------|------|
113
+ | 描述想要的 | 不支持负向提示词 | "sharp focus" 而非 "no blur" |
114
+ | 精确颜色 | 使用 hex code | `"brand color #1a1a2e"` |
115
+ | 文字渲染 | 用引号包裹文字 | `"The text 'OPEN' in red neon"` |
116
+ | 摄影风格 | 指定相机/镜头 | `"shot on Fujifilm X-T5, 35mm f/1.4"` |
117
+ | 多语言 | 用原生语言更地道 | 法语描述巴黎场景 |
118
+
119
+ #### 示例对比
120
+
121
+ ```bash
122
+ # 简单
123
+ gen image "a robot"
124
+
125
+ # 添加风格
126
+ gen image "a friendly AI robot, cute cartoon style, bright colors, 3D render"
127
+
128
+ # 完整描述
129
+ gen image "Disney Pixar style 3D animated robot character, friendly cheerful expression, wearing headset, surrounded by floating icons, gradient purple-blue background, professional studio lighting, vibrant colors"
130
+ ```
131
+
132
+ ### 分辨率选择
133
+
134
+ 最大 2048x2048。
135
+
136
+ | 用途 | 分辨率 |
137
+ |------|--------|
138
+ | 社交媒体 | 1024x1024 |
139
+ | 宽屏壁纸 | 1920x1088 |
140
+ | 竖屏海报 | 768x1280 |
141
+
142
+ ### 生成规则
143
+
144
+ #### 生成后
145
+ - 使用 Read 工具查看生成的图片
146
+ - 向用户描述图片内容(颜色、风格、构图、元素)
147
+ - 验证是否符合用户要求
148
+
149
+ #### 多图参考
150
+ - 最多 8 张输入图
151
+
152
+ ## 虚拟试穿 (Virtual Try-On)
153
+
154
+ 使用 FASHN AI tryon-v1.6 将服装穿到人物照片上。
155
+
156
+ ```bash
157
+ gen tryon <人物照片> <服装照片> [options]
158
+ ```
159
+
160
+ ### 参数
161
+
162
+ | 参数 | 说明 | 默认值 |
163
+ |------|------|--------|
164
+ | `-o, --output <path>` | 输出文件路径 | `./gen-output/tryon_{timestamp}.png` |
165
+ | `-c, --category <type>` | 服装类别:auto \| tops \| bottoms \| one-pieces | auto |
166
+ | `-m, --mode <mode>` | 生成模式:performance \| balanced \| quality | quality |
167
+ | `--garment-type <type>` | 服装照片类型:auto \| flat-lay \| model | auto |
168
+ | `-n, --num-samples <n>` | 生成数量 (1-4) | 1 |
169
+ | `--format <fmt>` | 输出格式:png \| jpeg | png |
170
+ | `--seed <n>` | 随机种子(可复现) | - |
171
+
172
+ ### 示例
173
+
174
+ ```bash
175
+ # 基本用法
176
+ gen tryon person.jpg garment.jpg -o /home/aiuser/project/result.png
177
+ Read /home/aiuser/project/result.png
178
+
179
+ # 使用 URL 图片
180
+ gen tryon https://example.com/model.jpg https://example.com/dress.jpg -o /home/aiuser/project/result.png
181
+
182
+ # 指定服装类别和快速模式
183
+ gen tryon person.jpg top.jpg -c tops -m performance -o /home/aiuser/project/result.png
184
+
185
+ # 生成多张结果
186
+ gen tryon person.jpg dress.jpg -n 4 -c one-pieces -o /home/aiuser/project/result.png
187
+ ```
188
+
189
+ ### 注意事项
190
+
191
+ - 支持本地图片路径和 URL
192
+ - 服装类别:auto (自动检测), tops (上装), bottoms (下装), one-pieces (连体)
193
+ - 三种模式:performance (~7s), balanced (~9s), quality (~13s)
194
+ - 默认保存到 `./gen-output/`
195
+
196
+ ## 语音合成 (TTS)
197
+
198
+ 使用 DashScope qwen3-tts-flash 将文本转为语音。
199
+
200
+ ```bash
201
+ gen tts <文本> [options]
202
+ ```
203
+
204
+ ### 参数
205
+
206
+ | 参数 | 说明 | 默认值 |
207
+ |------|------|--------|
208
+ | `-o, --output <path>` | 输出文件路径 | `./gen-output/tts_{timestamp}.wav` |
209
+ | `--voice <name>` | 声音名称 | Cherry |
210
+ | `--voices` | 列出可用声音 | - |
211
+ | `--play` | 生成后自动播放 | - |
212
+
213
+ ### 可用声音
214
+
215
+ - 女声:Cherry, Serena, Chelsie, Aria, Bella, Vivian, Jennifer, Katerina, Breeze, Maple, Sakura
216
+ - 男声:Ethan, Aiden, Brandon, Ryan, Luke, Leo
217
+
218
+ ### 示例
219
+
220
+ ```bash
221
+ # 中文语音合成
222
+ gen tts "你好,欢迎使用语音合成功能" -o /home/aiuser/project/hello.wav
223
+
224
+ # 指定男声
225
+ gen tts "Hello, welcome!" --voice Ethan -o /home/aiuser/project/greeting.wav
226
+
227
+ # 生成后播放
228
+ gen tts "测试语音" --play -o /home/aiuser/project/test.wav
229
+ ```
230
+
231
+ ### 注意事项
232
+
233
+ - 输出格式为 WAV
234
+ - 最大 5000 字符
235
+ - 支持中、英、日、韩、法、德等 10 种语言(自动检测)
236
+ - 默认保存到 `./gen-output/`
237
+
238
+ ## 语音识别 (ASR)
239
+
240
+ 使用 Groq Whisper 将语音转为文字。
241
+
242
+ ```bash
243
+ gen asr <音频文件> [options]
244
+ ```
245
+
246
+ ### 参数
247
+
248
+ | 参数 | 说明 | 默认值 |
249
+ |------|------|--------|
250
+ | `--language <lang>` | 语言提示:zh \| en \| ja \| ko 等 | 自动检测 |
251
+ | `--model <name>` | Whisper 模型 | whisper-large-v3-turbo |
252
+
253
+ ### 示例
254
+
255
+ ```bash
256
+ # 自动检测语言
257
+ gen asr /home/aiuser/project/recording.mp3
258
+
259
+ # 指定语言提示(提高准确率)
260
+ gen asr /home/aiuser/project/recording.wav --language zh
261
+ ```
262
+
263
+ ### 注意事项
264
+
265
+ - 支持 mp3, wav, m4a, ogg, webm 格式
266
+ - 文件大小限制 25MB
267
+
268
+ ## 任务管理
269
+
270
+ 所有生成命令会自动等待完成。如需查看历史或管理任务:
271
+
272
+ ```bash
273
+ gen task list # 查看所有任务
274
+ gen task list --type image # 按类型过滤
275
+ gen task list --status failed # 按状态过滤
276
+ gen task get <task_id> # 查看任务详情
277
+ gen task cancel <task_id> # 取消任务
278
+ gen task retry <task_id> # 重试失败的任务
279
+ ```