@sogni-ai/sogni-creative-agent-skill 3.3.4 → 3.3.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +2 -2
- package/SKILL.md +40 -28
- package/openclaw.plugin.json +1 -1
- package/package.json +2 -2
- package/skill-package.json +1 -1
- package/version.mjs +1 -1
package/README.md
CHANGED
|
@@ -322,9 +322,9 @@ sogni-agent --api-workflow storyboard-video "10s neon city flyover"
|
|
|
322
322
|
|
|
323
323
|
# Local segment + concat with external soundtrack
|
|
324
324
|
sogni-agent --video --workflow v2v --ref-video dance.mp4 \
|
|
325
|
-
--video-start 10 --duration 8 --controlnet-name pose -o
|
|
325
|
+
--video-start 10 --duration 8 --controlnet-name pose -o ./clip-2.mp4 \
|
|
326
326
|
"robot dancing"
|
|
327
|
-
sogni-agent --concat-videos
|
|
327
|
+
sogni-agent --concat-videos ./final.mp4 ./clip-1.mp4 ./clip-2.mp4 \
|
|
328
328
|
--concat-audio song.mp3 --concat-audio-start 0
|
|
329
329
|
|
|
330
330
|
# Balances and help
|
package/SKILL.md
CHANGED
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
name: sogni-creative-agent-skill
|
|
3
3
|
description: "Sogni Creative Agent Skill: agent skill and CLI for image, video, and music generation using Sogni AI's decentralized GPU network. Supports personas (named people with saved reference photos and voice clips), persistent memories, custom personality, style transfer, angle synthesis, Seedance/LTX/WAN video, music/lyrics, hosted chat, durable workflows, replay records, and multi-step creative workflows. Ask the agent to \"draw\", \"generate\", \"create an image\", \"make a video/animate\", \"make music\", \"apply a style\", or \"generate me as a superhero\"."
|
|
4
4
|
metadata:
|
|
5
|
-
version: "3.3.4"
|
|
5
|
+
version: "3.3.5"
|
|
6
6
|
homepage: https://sogni.ai
|
|
7
7
|
clawdbot:
|
|
8
8
|
emoji: "🎨"
|
|
@@ -110,6 +110,18 @@ ln -sfn node_modules/@sogni-ai/sogni-creative-agent-skill sogni-creative-agent-s
|
|
|
110
110
|
|
|
111
111
|
When this skill is distributed via ClawHub, it bootstraps its local runtime dependencies from `skill-package.json` during install. That avoids relying on a root `package.json` being present in the published skill artifact.
|
|
112
112
|
|
|
113
|
+
## Output Path Convention
|
|
114
|
+
|
|
115
|
+
**Always save generated images, videos, and music to the user's current working directory (PWD), not `/tmp`.** Pass a relative path or bare filename to `-o`/`--output`:
|
|
116
|
+
|
|
117
|
+
```bash
|
|
118
|
+
sogni-agent -o ./cat.png "a cat wearing a hat" # ✓ lands in PWD
|
|
119
|
+
sogni-agent -o cat.png "a cat wearing a hat" # ✓ lands in PWD
|
|
120
|
+
sogni-agent -o /tmp/cat.png "a cat wearing a hat" # ✗ avoid — user can't easily find it
|
|
121
|
+
```
|
|
122
|
+
|
|
123
|
+
`/tmp` (and `mkdtempSync(...)`) is reserved internally for transient intermediate files the CLI cleans up itself (audio re-encodes, intermediate clips during stitching). Final renders the user is asking for must remain inside their working directory unless they explicitly request a different location.
|
|
124
|
+
|
|
113
125
|
## Filesystem Paths and Overrides
|
|
114
126
|
|
|
115
127
|
Default file paths used by this skill:
|
|
@@ -172,8 +184,8 @@ sogni-agent --video --ref hero.png -n 3 --duration 5 \
|
|
|
172
184
|
# Token auto-fallback for native Sogni models (tries SPARK, falls back to SOGNI)
|
|
173
185
|
sogni-agent --token-type auto "a cat wearing a hat"
|
|
174
186
|
|
|
175
|
-
# Save to file
|
|
176
|
-
sogni-agent -o
|
|
187
|
+
# Save to file (relative paths land in the current working directory)
|
|
188
|
+
sogni-agent -o ./cat.png "a cat wearing a hat"
|
|
177
189
|
|
|
178
190
|
# JSON output (for scripting)
|
|
179
191
|
sogni-agent --json "a cat wearing a hat"
|
|
@@ -185,7 +197,7 @@ sogni-agent --balance
|
|
|
185
197
|
sogni-agent --json --balance
|
|
186
198
|
|
|
187
199
|
# Quiet mode (suppress progress)
|
|
188
|
-
sogni-agent -q -o
|
|
200
|
+
sogni-agent -q -o ./cat.png "a cat wearing a hat"
|
|
189
201
|
|
|
190
202
|
# Direct music/audio generation
|
|
191
203
|
sogni-agent --music --duration 30 \
|
|
@@ -673,10 +685,10 @@ Uses SDXL Turbo (`coreml-sogniXLturbo_alpha1_ad`) at 1024x1024 by default. The f
|
|
|
673
685
|
**Agent usage:**
|
|
674
686
|
```bash
|
|
675
687
|
# Photobooth: stylize a face photo
|
|
676
|
-
sogni-agent -q --photobooth --ref /path/to/face.jpg -o
|
|
688
|
+
sogni-agent -q --photobooth --ref /path/to/face.jpg -o ./stylized.png "80s fashion portrait"
|
|
677
689
|
|
|
678
690
|
# Multiple photobooth outputs
|
|
679
|
-
sogni-agent -q --photobooth --ref /path/to/face.jpg -n 4 -o
|
|
691
|
+
sogni-agent -q --photobooth --ref /path/to/face.jpg -n 4 -o ./stylized.png "LinkedIn professional headshot"
|
|
680
692
|
```
|
|
681
693
|
|
|
682
694
|
## Multiple Angles (Turnaround)
|
|
@@ -695,7 +707,7 @@ sogni-agent --angles-360 -c subject.jpg --distance medium --elevation eye-level
|
|
|
695
707
|
"studio portrait, same person"
|
|
696
708
|
|
|
697
709
|
# 360 sweep video (looping mp4, uses i2v between angles; requires ffmpeg)
|
|
698
|
-
sogni-agent --angles-360 --angles-360-video
|
|
710
|
+
sogni-agent --angles-360 --angles-360-video ./turntable.mp4 \
|
|
699
711
|
-c subject.jpg --distance medium --elevation eye-level \
|
|
700
712
|
"studio portrait, same person"
|
|
701
713
|
```
|
|
@@ -725,7 +737,7 @@ When a user requests a "360 video", follow this workflow:
|
|
|
725
737
|
|
|
726
738
|
4. **Example command**:
|
|
727
739
|
```bash
|
|
728
|
-
sogni-agent --angles-360 --angles-360-video
|
|
740
|
+
sogni-agent --angles-360 --angles-360-video ./output.mp4 \
|
|
729
741
|
-c /path/to/image.png --elevation eye-level --distance medium \
|
|
730
742
|
"description of subject"
|
|
731
743
|
```
|
|
@@ -929,35 +941,35 @@ When user asks to generate/draw/create an image:
|
|
|
929
941
|
|
|
930
942
|
```bash
|
|
931
943
|
# Generate and save locally (use -Q for quality presets instead of memorizing model IDs)
|
|
932
|
-
sogni-agent -q -Q fast -o
|
|
933
|
-
sogni-agent -q -Q pro -o
|
|
944
|
+
sogni-agent -q -Q fast -o ./generated.png "user's prompt"
|
|
945
|
+
sogni-agent -q -Q pro -o ./generated.png "user's prompt"
|
|
934
946
|
|
|
935
947
|
# Generate with prompt variations (diverse images in one call)
|
|
936
|
-
sogni-agent -q -n 3 -o
|
|
948
|
+
sogni-agent -q -n 3 -o ./cars.png "a {red|blue|green} sports car"
|
|
937
949
|
|
|
938
950
|
# Edit an existing image
|
|
939
|
-
sogni-agent -q -c /path/to/input.jpg -o
|
|
951
|
+
sogni-agent -q -c /path/to/input.jpg -o ./edited.png "make it pop art style"
|
|
940
952
|
|
|
941
953
|
# Generate video from image
|
|
942
|
-
sogni-agent -q --video --ref /path/to/image.png -o
|
|
954
|
+
sogni-agent -q --video --ref /path/to/image.png -o ./video.mp4 "A medium shot holds on the subject in soft late-afternoon light as fabric edges and background details remain clear and stable. The camera performs a slow push-in while the subject shifts weight subtly and turns slightly toward the lens, keeping the motion gentle and continuous. Leaves rustle softly in the background and the scene maintains smooth cinematic movement with no abrupt action changes."
|
|
943
955
|
|
|
944
956
|
# Generate text-to-video
|
|
945
|
-
sogni-agent -q --video -o
|
|
957
|
+
sogni-agent -q --video -o ./video.mp4 "A wide cinematic shot opens on ocean waves rolling toward a rocky shoreline at sunset, golden light spreading across the water while sea mist drifts through the air. Foam patterns form and recede over the dark sand as the horizon glows orange and pink in the distance. The camera glides forward in one continuous movement, holding smooth stabilized motion and calm environmental detail throughout the scene."
|
|
946
958
|
|
|
947
959
|
# Generate direct music/audio
|
|
948
|
-
sogni-agent -q --music --duration 30 -o
|
|
960
|
+
sogni-agent -q --music --duration 30 -o ./music.mp3 "uplifting cinematic synthwave theme for a product launch"
|
|
949
961
|
|
|
950
962
|
# HD / "4K" text-to-video: prefer LTX-2.3
|
|
951
|
-
sogni-agent -q --video -m ltx23-22b-fp8_t2v_distilled -w 1920 -h 1088 -o
|
|
963
|
+
sogni-agent -q --video -m ltx23-22b-fp8_t2v_distilled -w 1920 -h 1088 -o ./video.mp4 "A wide cinematic aerial shot opens over a rugged ocean coastline at golden hour, warm sunlight catching the cliff faces while white surf breaks against dark rock below. Low sea mist hangs over the water and bands of foam trace the shoreline as gulls wheel through the distance. The camera glides forward in one continuous pass, revealing the curve of the coast while wet stone flashes with reflected light and the scene keeps smooth stabilized motion from start to finish. The overall mood feels expansive and polished, with crisp environmental detail and steady travel-film energy."
|
|
952
964
|
|
|
953
965
|
# HD / "4K" image-to-video: prefer LTX i2v
|
|
954
|
-
sogni-agent -q --video --ref /path/to/image.png -m ltx23-22b-fp8_i2v_distilled -w 1920 -h 1088 -o
|
|
966
|
+
sogni-agent -q --video --ref /path/to/image.png -m ltx23-22b-fp8_i2v_distilled -w 1920 -h 1088 -o ./video.mp4 "A medium cinematic shot holds on the scene with clean subject separation and stable environmental detail as directional light shapes the surfaces and background depth. The camera performs a slow push-in while the main subject makes one subtle continuous movement, keeping posture and identity consistent from start to finish. Ambient motion in the background stays gentle and the overall clip remains smooth, stabilized, and visually coherent."
|
|
955
967
|
|
|
956
968
|
# Photobooth: stylize a face photo
|
|
957
|
-
sogni-agent -q --photobooth --ref /path/to/face.jpg -o
|
|
969
|
+
sogni-agent -q --photobooth --ref /path/to/face.jpg -o ./stylized.png "80s fashion portrait"
|
|
958
970
|
|
|
959
971
|
# Token auto-fallback for native Sogni models (tries SPARK first, retries with SOGNI on insufficient balance)
|
|
960
|
-
sogni-agent -q --token-type auto -o
|
|
972
|
+
sogni-agent -q --token-type auto -o ./generated.png "user's prompt"
|
|
961
973
|
|
|
962
974
|
# Check current SPARK/SOGNI balances (no prompt required)
|
|
963
975
|
sogni-agent --json --balance
|
|
@@ -1028,7 +1040,7 @@ When a user asks to **animate between two images**, use `--ref` (first frame) an
|
|
|
1028
1040
|
|
|
1029
1041
|
```bash
|
|
1030
1042
|
# Animate from image A to image B
|
|
1031
|
-
sogni-agent -q --video --ref
|
|
1043
|
+
sogni-agent -q --video --ref ./imageA.png --ref-end ./imageB.png -o ./transition.mp4 "descriptive prompt of the transition"
|
|
1032
1044
|
```
|
|
1033
1045
|
|
|
1034
1046
|
### Animate a Video to an Image (Scene Continuation)
|
|
@@ -1037,15 +1049,15 @@ When a user asks to **animate from a video to an image** (or "continue" a video
|
|
|
1037
1049
|
|
|
1038
1050
|
1. **Extract the last frame** of the existing video using the built-in safe wrapper:
|
|
1039
1051
|
```bash
|
|
1040
|
-
sogni-agent --extract-last-frame
|
|
1052
|
+
sogni-agent --extract-last-frame ./existing.mp4 ./lastframe.png
|
|
1041
1053
|
```
|
|
1042
1054
|
2. **Generate a new video** using the last frame as `--ref` and the target image as `--ref-end`:
|
|
1043
1055
|
```bash
|
|
1044
|
-
sogni-agent -q --video --ref
|
|
1056
|
+
sogni-agent -q --video --ref ./lastframe.png --ref-end ./target.png -o ./continuation.mp4 "scene transition prompt"
|
|
1045
1057
|
```
|
|
1046
1058
|
3. **Concatenate the videos** using the built-in safe wrapper:
|
|
1047
1059
|
```bash
|
|
1048
|
-
sogni-agent --concat-videos
|
|
1060
|
+
sogni-agent --concat-videos ./full_sequence.mp4 ./existing.mp4 ./continuation.mp4
|
|
1049
1061
|
```
|
|
1050
1062
|
|
|
1051
1063
|
This ensures visual continuity — the new clip picks up exactly where the previous one ended.
|
|
@@ -1069,7 +1081,7 @@ When the final stitched output needs a single external soundtrack, add `--concat
|
|
|
1069
1081
|
"width": 512,
|
|
1070
1082
|
"height": 512,
|
|
1071
1083
|
"urls": ["https://..."],
|
|
1072
|
-
"localPath": "
|
|
1084
|
+
"localPath": "./cat.png"
|
|
1073
1085
|
}
|
|
1074
1086
|
```
|
|
1075
1087
|
|
|
@@ -1122,7 +1134,7 @@ sogni-agent --persona-list --json
|
|
|
1122
1134
|
sogni-agent --persona-resolve "me" --json
|
|
1123
1135
|
|
|
1124
1136
|
# Generate using a persona (auto-injects photo as context)
|
|
1125
|
-
sogni-agent --persona "Mark" -o
|
|
1137
|
+
sogni-agent --persona "Mark" -o ./hero.png "superhero in dramatic lighting"
|
|
1126
1138
|
|
|
1127
1139
|
# Remove a persona
|
|
1128
1140
|
sogni-agent --persona-remove "Mark"
|
|
@@ -1183,13 +1195,13 @@ Apply artistic styles to existing images:
|
|
|
1183
1195
|
|
|
1184
1196
|
```bash
|
|
1185
1197
|
# Apply a named artist style
|
|
1186
|
-
sogni-agent -c photo.jpg -o
|
|
1198
|
+
sogni-agent -c photo.jpg -o ./styled.png "Apply style: Andy Warhol pop art with bold primary colors"
|
|
1187
1199
|
|
|
1188
1200
|
# Studio Ghibli transformation
|
|
1189
|
-
sogni-agent -c photo.jpg -o
|
|
1201
|
+
sogni-agent -c photo.jpg -o ./ghibli.png "Apply style: Studio Ghibli watercolor with soft pastel sky and lush greenery"
|
|
1190
1202
|
|
|
1191
1203
|
# For photos with people, always preserve identity
|
|
1192
|
-
sogni-agent -c portrait.jpg -o
|
|
1204
|
+
sogni-agent -c portrait.jpg -o ./styled.png "Apply style: oil painting in the style of Vermeer. Preserve all facial features, expressions, and identity."
|
|
1193
1205
|
```
|
|
1194
1206
|
|
|
1195
1207
|
**Tips:** Reference artists and styles BY NAME for best results. Use positive phrasing. For photos with people, always append identity preservation instructions.
|
package/openclaw.plugin.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
"id": "sogni-creative-agent-skill",
|
|
3
3
|
"name": "Sogni Creative Agent Skill — Image, Video & Music Generation",
|
|
4
4
|
"description": "Agent skill and CLI for Sogni AI image, video, and music generation.",
|
|
5
|
-
"version": "3.3.4",
|
|
5
|
+
"version": "3.3.5",
|
|
6
6
|
"skills": [
|
|
7
7
|
"."
|
|
8
8
|
],
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@sogni-ai/sogni-creative-agent-skill",
|
|
3
|
-
"version": "3.3.4",
|
|
3
|
+
"version": "3.3.5",
|
|
4
4
|
"description": "Sogni Creative Agent Skill: agent skill and CLI for Sogni AI image, video, and music generation.",
|
|
5
5
|
"type": "module",
|
|
6
6
|
"main": "sogni-agent.mjs",
|
|
@@ -67,7 +67,7 @@
|
|
|
67
67
|
"sogni-agent.mjs"
|
|
68
68
|
],
|
|
69
69
|
"dependencies": {
|
|
70
|
-
"@sogni-ai/sogni-intelligence-client": "^3.0.
|
|
70
|
+
"@sogni-ai/sogni-intelligence-client": "^3.0.11",
|
|
71
71
|
"execa": "^9.6.1",
|
|
72
72
|
"json5": "^2.2.3",
|
|
73
73
|
"sharp": "^0.34.5"
|
package/skill-package.json
CHANGED
package/version.mjs
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
export const PACKAGE_VERSION = '3.3.4';
|
|
1
|
+
export const PACKAGE_VERSION = '3.3.5';
|