npm - @agentmedia/schema - Versions diffs - 0.5.0 → 0.5.2 - Mend

@agentmedia/schema 0.5.0 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12) hide show

package/dist/v2/generators.d.ts.map +1 -1
package/dist/v2/generators.js +14 -6
package/dist/v2/generators.js.map +1 -1
package/dist/v2/selfie.d.ts +53 -30
package/dist/v2/selfie.d.ts.map +1 -1
package/dist/v2/selfie.js +69 -29
package/dist/v2/selfie.js.map +1 -1
package/package.json +13 -13
package/scripts/generate-v2-docs.ts +384 -290
package/src/v2/generators.ts +14 -6
package/src/v2/selfie.ts +86 -30
package/LICENSE +0 -199

package/scripts/generate-v2-docs.ts CHANGED Viewed

@@ -18,9 +18,6 @@ import { fileURLToPath } from 'node:url';
 import { zodToJsonSchema } from 'zod-to-json-schema';
 import {
   V2_GENERATORS,
-  V2_SHOT_PRESETS,
-  V2_VIBES,
-  quoteV2Credits,
   type V2GeneratorRecord,
 } from '../src/v2/index.js';
@@ -49,19 +46,11 @@ function fmtInputSchema(def: V2GeneratorRecord): string {
   return '```json\n' + JSON.stringify(body, null, 2) + '\n```';
 }
-function fmtPricing(def: V2GeneratorRecord): string {
-  if (!def.pricing) return '_Pricing not declared on this generator._';
-  if (def.pricing.basis === 'one_shot') {
-    const c = def.pricing.baseCredits;
-    return `One-shot: **${c} credits** ($${(c / 100).toFixed(2)})`;
-  }
-  // per_clip — show 5/10/15
-  const rows = [5, 10, 15].map((s) => {
-    const c = quoteV2Credits(def.id as any, { durationSeconds: s });
-    return `| ${s}s | ${c} | $${(c / 100).toFixed(2)} |`;
-  });
-  return `Per-clip (base ${def.pricing.baseCredits} + ${def.pricing.perSecondCredits}/sec):\n\n| Duration | Credits | USD |\n|---|---:|---:|\n${rows.join('\n')}`;
-}
+// Pricing display is intentionally suppressed everywhere — agents and
+// docs should never surface USD or credit numbers. The API debits
+// internally; users get no cost-anxiety prompts. (Server-side allows a
+// soft -10 credit overdraft so a final job never gets rejected on a
+// micro-balance edge case.)
 // ── docs/v2/api-reference.md ──────────────────────────────────────────────
@@ -82,10 +71,6 @@ function renderApiReference(): string {
         '',
         g.description,
         '',
-        '### Pricing',
-        '',
-        fmtPricing(g),
-        '',
         '### Request body',
         '',
         fmtInputSchema(g),
@@ -100,16 +85,7 @@ function renderApiReference(): string {
         '',
         '```json',
         JSON.stringify(
-          {
-            job_id: '<uuid>',
-            status: 'submitted',
-            credits_deducted: g.pricing
-              ? g.pricing.basis === 'one_shot'
-                ? g.pricing.baseCredits
-                : g.pricing.baseCredits + g.pricing.perSecondCredits * 8
-              : 0,
-            generator: g.id,
-          },
+          { job_id: '<uuid>', status: 'submitted', generator: g.id },
           null,
           2,
         ),
@@ -158,390 +134,508 @@ function renderApiReference(): string {
     '- `character_id` — present on jobs that create a v2 character (`char_xxxxxxxxxx`).',
     '- `video_url` — present on completed video jobs.',
     '',
-    '### Shot grammar (Selfie)',
-    '',
-    `Selfie's \`preset\` field accepts one of:`,
-    '',
-    V2_SHOT_PRESETS.map((p) => `- \`${p}\``).join('\n'),
+    '### Selfie pipeline artifacts',
     '',
-    `Or \`custom-scene:<text>\` to compose a new shot ad-hoc.`,
+    'Selfie jobs expose intermediate URLs while processing:',
     '',
-    '### Vibes (Selfie)',
+    '- `portrait_url` — generated actor face portrait, unless reusing a saved character.',
+    '- `character_sheet_url` / `sheet_url` — full-body multi-angle character reference.',
+    '- `wireframe_url` — photographic storyboard/wireframe board with 8-10 frames and captions.',
+    '- `video_url` / `result_url` — final Seedance MP4 after completion.',
     '',
-    V2_VIBES.map((v) => `- \`${v}\``).join('\n'),
+    'Agents should surface each artifact as soon as it appears in status instead of waiting silently for the final video.',
     '',
   ].join('\n');
 }
-// ── skills/agent-media-v2/SKILL.md ─────────────────────────────────────────
-function renderSkill(): string {
+// ─────────────────────────────────────────────────────────────────────────────
+// Multi-file skill emit
+//
+// Layout under skills/agent-media-v2/:
+//   SKILL.md                          — eager-loaded entry, ~2 KB
+//   reference/
+//     conversation-flow.md            — MUST-READ before any CLI call
+//     pricing.md                      — formula + tables
+//     subtitle-styles.md              — 17 subtitle styles
+//     realism-rubric.md               — visual-quality guard
+//     errors.md                       — common error codes + fixes
+//     generators/
+//       selfie.md                     — flags + CLI/MCP/REST + examples
+//       character-create.md           — character_create cheat-sheet
+//       subs.md                       — subs cheat-sheet
+//
+// Adding a new v2 product = a new V2_GENERATORS row + this file emits a
+// fresh reference/generators/<id>.md automatically.
+// ─────────────────────────────────────────────────────────────────────────────
+const SKILL_DIR = resolve(repoRoot, 'skills/agent-media-v2');
+interface EmittedFile {
+  /** path relative to SKILL_DIR */
+  relPath: string;
+  content: string;
+}
+function renderSkillIndex(): string {
   const generators = Object.values(V2_GENERATORS);
-  const generatorBlocks = generators
-    .map((g) => {
-      const cliExample = g.cli?.examples?.[0] ?? `agent-media ${g.cli?.command ?? g.id} …`;
-      const pricingLine = g.pricing
-        ? g.pricing.basis === 'one_shot'
-          ? `Cost: **${g.pricing.baseCredits} credits** ($${(g.pricing.baseCredits / 100).toFixed(2)}).`
-          : `Cost: **${g.pricing.baseCredits} + ${g.pricing.perSecondCredits}/sec** (8s ≈ ${quoteV2Credits(g.id as any, { durationSeconds: 8 })} credits ≈ $${(quoteV2Credits(g.id as any, { durationSeconds: 8 }) / 100).toFixed(2)}).`
-        : '';
-      return [
-        `### ${g.id}`,
-        '',
-        g.description,
-        '',
-        pricingLine,
-        '',
-        '**CLI:**',
-        '',
-        '```bash',
-        cliExample,
-        '```',
-        '',
-        '**MCP tool:** `' + (g.mcp?.toolName ?? '(none)') + '`',
-        '',
-        '**REST:** `' + (g.rest?.method ?? '') + ' ' + (g.rest?.path ?? '(internal)') + '`',
-        '',
-      ].join('\n');
-    })
-    .join('---\n\n');
+  const generatorRows = generators
+    .map(
+      (g) =>
+        `| **${g.cli?.command ?? g.id}** | ${g.summary.replace(/\|/g, '\\|')} | [\`reference/generators/${g.id}.md\`](reference/generators/${g.id}.md) |`,
+    )
+    .join('\n');
   return [
     '---',
     'name: agent-media-v2',
-    'description: AI UGC video production via agent-media v2 — Selfie videos and reusable Characters. Use this skill when the user wants to make TikTok-style "AI person talking to camera" clips or save a character for reuse across multiple generations.',
-    'homepage: https://agent-media.ai/skill',
-    `version: 1.3.0`,
+    // CRITICAL: the description string is what Claude reads when deciding whether to
+    // load this skill AND it's the most-attended-to text once the skill is loaded.
+    // Put the hard gate here, not buried in section 3 of the body.
+    'description: AI UGC video production via agent-media (selfie, character, subs, plus more soon). BEFORE running ANY agent-media command you MUST first Read reference/conversation-flow.md and walk the user through the 4 gates IN ORDER — (1) confirm script OR scene_action; if no speech, also propose background_music, (2) RUN `agent-media character list --json` YOURSELF (don\'t ask the user, don\'t mention char_xxx ids — present saved characters BY NAME if any, otherwise confirm the new description), (3) propose a director\'s brief with setting, lighting, wardrobe, props/product, and action; pass non-default motion/product handling through --scene-action, (4) duration with script-pacing awareness (2-4 words/sec). While jobs run, poll status and open portrait, character sheet, wireframe, and final video as each URL appears. When user says "no subs" → pass --subtitles false. When no script → pass --background-music. NEVER auto-pick a character. NEVER expose char_xxx ids. NEVER mention pricing/credits/USD.',
     '---',
     '',
     GENERATED_NOTE,
     '',
-    '# agent-media — STRICT RULES (read first, every time)',
+    '# agent-media — Claude skill',
     '',
-    '## 0. CONVERSATION FLOW — follow this in order',
+    'agent-media is a CLI for AI UGC video generation. This skill tells you how to drive it. **Loaded files are intentionally small** — open the right reference file for the task you have, don\'t try to memorize everything.',
     '',
-    'Before you EVER call the CLI, walk the user through these steps. Ask in batches of 2-3 questions at a time, never one-by-one, never silently default. Use the user\'s answers to populate the CLI args.',
+    '## 🛑 HARD GATE — read this first, every conversation',
     '',
-    '### Step 1 — What\'s the video about?',
+    'Before calling ANY `agent-media` shell command, you MUST:',
     '',
-    'This is the FIRST question, every time. Even if the user typed a full prompt with a script, confirm:',
+    '1. **Read** [`reference/conversation-flow.md`](reference/conversation-flow.md) — the full 4-gate protocol with templates.',
+    '2. **Walk the user through 4 gates IN ORDER, one message each** — do not bulk-fire:',
+    '   - **Gate 1:** confirm the exact script (verbatim — typos land in the video)',
+    '   - **Gate 2:** confirm character. YOU run `agent-media character list --json` (do not ask the user "do you have a saved character?" — they don\'t know that\'s a thing). If the list is empty, just confirm the description from their original prompt. If non-empty, present each saved character BY NAME (not by `char_xxx` id — that format is internal). The user picks by NAME or says "new"; you map name → id internally. 🛑 NEVER auto-pick. NEVER show `char_xxx` ids to the user. Never ask for a photo by default.',
+    '   - **Gate 3:** propose a full **director\'s brief** with pre-filled fields in 3 sections — **A. Intent+Performance**, **B. Scene+Look**, **C. Output**. Put visual direction into `--description` and action/product handling into `--scene-action`. The shot composition and energy are inferred from the brief; you can OPTIONALLY pin them with `--shot-preset` and `--vibe`, or override the realism defaults with `--camera-locked` / `--phone-in-frame` / `--polish` (rare — only when the user explicitly asks for a stable shot, a phone-in-hand composition, or a different polish look). Baseline realism policy: handheld camera stays on, visible phone stays off unless explicitly requested.',
+    '   - **Gate 4:** duration + **script-pacing check**. Count the words in the script and PROPOSE the duration that fits (5s ≈ 10-20 words, 10s ≈ 20-40 words, 15s ≈ 30-60 words at the natural 2-4 words/sec pace).',
+    '3. Only then call the CLI.',
     '',
-    '> *"Got it — quick check before I generate:*',
-    '> *• What\'s the video about?  (the topic / what they\'re selling / what\'s happening in the scene)*',
-    '> *• What\'s the exact line you want them to say?  (the script — 1-3 sentences usually works best)"*',
+    '**The director\'s brief at Gate 3 is non-optional.** It\'s where quality lives. Skipping it = generic output. PROPOSE smart defaults from the script + description; don\'t ask blank questions.',
     '',
-    'Don\'t skip this. The "topic" informs the preset + vibe selection later. If the user already gave you a script, repeat it back so they can confirm or tweak it.',
+    'Calling the CLI without doing 1–3 is a protocol violation — the user gets a generic, mid video. Ask the extra questions.',
     '',
-    '### Step 2 — Who\'s the character?',
+    '## NEVER discuss pricing',
     '',
-    '**agent-media generates the character image itself from your description. You DO NOT need to provide a photo.** A description like "25yo asian woman with long wavy dark hair" is enough — the pipeline produces a consistent on-model person.',
+    'Do NOT mention credit costs, USD amounts, or pricing tiers in any reply. Do NOT ask the user to "confirm cost". The API handles billing transparently. If the user asks about cost, point them at <https://agent-media.ai/pricing>. That is the only acceptable surface for pricing.',
     '',
-    'Three valid input paths (in order of preference):',
+    '## What agent-media can do (router)',
     '',
-    '1. **Description only** (the default — use this 95% of the time)',
-    '   Just `--description "..."`. agent-media generates the portrait and the multi-pose sheet, then runs the video. No photo, no upload, no questions about photos. Example:',
-    '   ```bash',
-    '   agent-media selfie --description "25yo asian woman, long wavy dark hair, soft smile" --script "..."',
-    '   ```',
+    '| Command | Use when | Deep-dive |',
+    '|---|---|---|',
+    generatorRows,
     '',
-    '2. **Saved character** (`--character char_xxxxxxxxxx`)',
-    '   Use when the user references a person from a previous run ("use the same girl again", "the one from yesterday\'s video"). Run `agent-media character` to list saved characters if you need to look one up.',
+    '`agent-media skill update` — pull the latest skill files into ~/.claude/skills/agent-media-v2/.',
+    '`agent-media skill status` — print local vs remote version.',
     '',
-    '3. **Real-person photo + description** (`--photo <file|url> --description "..."`)',
-    '   Use ONLY when the user explicitly says "use THIS person" and gives you a photo of someone specific. Otherwise default to path 1.',
+    '## What agent-media CANNOT do',
     '',
-    'Hard rules:',
-    '- NEVER ask the user "do you have a photo?". Default to description-only.',
-    '- NEVER ask the user about the underlying models (gpt-image-2, Seedance, etc.). They are implementation details. Just say "agent-media generates the character".',
-    '- NEVER fall back to `agent-media ugc` or a stock actor library. Forbidden.',
-    '- If the user wants the SAME person across multiple videos, run `agent-media character create --description "..."` once first (no photo needed) to get a `char_xxxxxxxxxx`, then pass `--character <id>` to every selfie.',
+    'These legacy v1 commands exist in the CLI binary for backwards compat but produce inferior output. They are hidden from `agent-media --help` for a reason. **Never call them.**',
     '',
-    '### Step 3 — Where + how does it feel? (preset + vibe)',
+    '- ❌ `agent-media ugc` — uses a stale fixed actor library (200 actors picked at random). The actors look dated. Use `agent-media selfie` — it generates an on-model character from your description on every run.',
+    '- ❌ `agent-media show-your-app` — built on the v1 actor pool + manual screen-composite step. The v2 product is on the roadmap. For now, run `agent-media selfie` for the talking head and capture the screen separately.',
+    '- ❌ `agent-media laptop-ugc` — v1 only. Same story as show-your-app; v2 product coming.',
+    '- ❌ `agent-media character-video` — superseded by `agent-media selfie --character <id>`. The new command uses the current portrait → sheet → wireframe → Seedance pipeline.',
+    '- ❌ `agent-media text-to-video` — no character control; output is generic and off-brand. Use `agent-media selfie` with a saved character.',
+    '- ❌ `agent-media subtitle` (singular) — v1 burner with fewer styles and shakier sync. Use `agent-media subs` (plural).',
+    '- ❌ `agent-media review` — SaaS-review generator built on v1 actors. Compose with `agent-media selfie` + a script you write.',
+    '- ❌ `agent-media product-acting` — v1 product-in-hand generator. For now, use `agent-media selfie` with a strong `--scene-action` describing the product hold, demo, and interaction.',
     '',
-    'Pick one **preset** (location/shot grammar) + one **vibe** (emotional tone). If you can guess from the topic, propose them as defaults to confirm; if not, ask.',
+    'If the user wants a feature not listed in the router above, offer `agent-media selfie` when the request can be expressed as one actor, one setting, dialogue/action, and optional props/product handling.',
     '',
-    '**Presets (20, one of):**',
+    '## Reference files (lazy-loaded)',
     '',
-    '| Preset | Best for |',
-    '|---|---|',
-    '| `bedroom-morning-ritual` | Default. Skincare, routine, "morning vibes" content |',
-    '| `getting-ready-mirror-edge` | OOTD, makeup, fashion |',
-    '| `bathroom-skincare-routine` | Beauty, hair care, skincare reveals |',
-    '| `bedside-lamp-evening` | Wind-down, journal, ASMR-style |',
-    '| `kitchen-glow-up` | Food, drinks, supplements, cooking |',
-    '| `backyard-morning-coffee` | Lifestyle, mindfulness, slow content |',
-    '| `picnic-blanket-outdoor` | Outdoor, summer, friends |',
-    '| `car-quick-honest-review` | Honest reviews, "I just bought this..." |',
-    '| `car-passenger-honest` | Same vibe, passenger angle |',
-    '| `outdoor-walking-talking` | Walking-and-talking, candid |',
-    '| `couch-haul-show-off` | Unboxing, hauls, "look what I got" |',
-    '| `closet-fit-check` | Fashion, fit-checks, OOTD |',
-    '| `studio-apartment-tour` | Lifestyle, apartment content |',
-    '| `balcony-evening-vibes` | Aesthetic, lifestyle, golden hour |',
-    '| `desk-wfh-quick-pitch` | SaaS, productivity, work-from-home |',
-    '| `cafe-window-seat` | Lifestyle, work, coffee culture |',
-    '| `office-bathroom-discreet` | Workplace anecdotes, "let me tell you" |',
-    '| `gym-post-workout` | Fitness, supplements, wellness |',
-    '| `salon-mirror-result` | Hair, beauty reveals, "before/after" |',
-    '| `travel-hotel-room-review` | Travel, hotel reviews |',
+    'Open these only when you need them:',
     '',
-    '**Vibes (5, one of):** `excited` · `calm` · `sassy` · `serious` · `curious`',
+    '- [`reference/conversation-flow.md`](reference/conversation-flow.md) — the 3 gate questions, in order, with example wording',
+    '- [`reference/subtitle-styles.md`](reference/subtitle-styles.md) — all 17 subtitle styles',
+    '- [`reference/realism-rubric.md`](reference/realism-rubric.md) — visual-quality guard the pipeline enforces',
+    '- [`reference/errors.md`](reference/errors.md) — common errors + remediation',
+    ...generators.map(
+      (g) =>
+        `- [\`reference/generators/${g.id}.md\`](reference/generators/${g.id}.md) — ${g.summary}`,
+    ),
     '',
-    '- `excited` — high energy, "you won\'t believe this", default for hype/product/reveal',
-    '- `calm` — softer, intimate, default for wellness/skincare/lifestyle',
-    '- `sassy` — playful, eye-roll, default for "let me tell you" anecdotes',
-    '- `serious` — measured, default for honest reviews / SaaS / B2B',
-    '- `curious` — thoughtful, leaning-in, default for storytelling',
+  ].join('\n');
+}
+function renderConversationFlow(): string {
+  return [
+    GENERATED_NOTE,
     '',
-    '### Step 4 — How long?',
+    '# Conversation flow — MUST READ before any agent-media call',
     '',
-    '**Allowed durations: 5, 10, or 15 seconds. ONLY these three.** Default to 10 if unsure. The schema rejects any other value (the worker will reject 6, 8, 12, etc.).',
+    '> **CRITICAL:** Output quality is directly tied to how well you collect these inputs. Run the 4 gates in order. Do not skip, combine, or bulk-fire them.',
     '',
-    '- `5` — single hook, no body. Best for ads with strong intro.',
-    '- `10` — default. Hook + payoff. Best for organic UGC.',
-    '- `15` — full mini-story with setup + reveal.',
+    '## Director\'s principle: PROPOSE, don\'t interrogate',
     '',
-    '### Step 5 — Voice direction (optional, but improves quality)',
+    'Pre-fill what you can infer from the prompt and ask the user to confirm or red-line it. Do not hand them a blank form. The pipeline will fill remaining gaps, but better user input produces better portrait, sheet, wireframe, and video outputs.',
     '',
-    'Ask: *"Any voice direction? E.g. \'whisper\', \'gen-z deadpan\', \'NYC accent\', \'sleepy morning voice\'. Skip if you\'re happy with the default."*',
+    '## The 4 gates (in order, one message each)',
     '',
-    'Pass as `--voice-brief "<text>"`. Max 240 chars. If the character has a saved `voice_brief`, it\'s used unless this is set.',
+    '### Gate 1 — Confirm script or action',
     '',
-    '### Step 6 — Subtitles',
+    'If the clip has speech, confirm the script verbatim. The script is spoken as-is.',
     '',
-    'Subs are ON by default in Hormozi style. Offer alternatives only if asked.',
+    '> *"Quick check before the camera rolls — script is: «<paste the exact line>». Sound right, or want to tweak?"*',
     '',
-    '**Subtitle styles (17, one of):** `hormozi` (default) · `minimal` · `bold` · `karaoke` · `clean` · `tiktok` · `neon` · `fire` · `glow` · `pop` · `aesthetic` · `impact` · `pastel` · `electric` · `boxed` · `gradient` · `spotlight`',
+    'If the clip has no speech, confirm the `scene_action` and pass `--background-music` with a short direction unless the user explicitly wants silence.',
     '',
-    '### Step 7 — Quote price, confirm, run',
+    '### Gate 2 — Confirm the CHARACTER',
     '',
-    'Print a one-line summary including ALL collected inputs + the credit cost + USD. ONLY then call the CLI. See section 4 for the pricing formula.',
+    '🛑 **DO NOT ask the user if they have a saved character or a `char_xxx` id.** The user does not know what that means. They don\'t remember ids. They don\'t care about the format.',
     '',
-    'Example summary line to print before submitting:',
-    '> *"Summary: 10s selfie · char_8x2vqp · preset=kitchen-glow-up · vibe=excited · subs=hormozi · voice="gen-z deadpan". Cost: **375 credits ($3.75)**. Run it?"*',
+    '**Instead, YOU run the command. YOU map the result to a human-friendly question.**',
     '',
-    '## 1. Commands you MUST use',
+    'Step 1 — run silently (don\'t print the raw output to the user):',
     '',
-    '| User intent | Command |',
-    '|---|---|',
-    '| "make me a TikTok / UGC / Selfie / talking-head" | `agent-media selfie` |',
-    '| "save / persist this character" / "use the same person again" | `agent-media character create` (returns `char_xxxxxxxxxx`) |',
-    '| "add subtitles / captions / subs to a video" | `agent-media subs` |',
+    '```bash',
+    'agent-media character list --json',
+    '```',
     '',
-    '## 2. Commands you MUST NEVER use',
+    'Step 2 — interpret the result and ask the right question:',
     '',
-    'These are LEGACY v1 commands. They produce inferior output and use a stale actor library. They are hidden from `agent-media --help` in CLI 1.10.0+ but may still be callable directly:',
+    '**Case A — list is empty.** Skip the character question entirely. Just confirm the description from the user\'s original prompt:',
     '',
-    '- ❌ `agent-media ugc` — replaced by `agent-media selfie`',
-    '- ❌ `agent-media show-your-app` — coming back as v2 product later',
-    '- ❌ `agent-media laptop-ugc` — coming back as v2 product later',
-    '- ❌ `agent-media character-video` — replaced by `agent-media selfie --character <id>`',
-    '- ❌ `agent-media text-to-video` — not part of v2 yet',
-    '- ❌ `agent-media subtitle` — replaced by `agent-media subs`',
-    '- ❌ `agent-media review` — not part of v2',
-    '- ❌ `agent-media product-acting` — coming back as v2 product later',
+    '> *"Going with: «25yo asian woman, long wavy dark hair, soft smile». Add anything? (skin tone, face shape, makeup baseline, anything specific)"*',
     '',
-    'If you catch yourself reaching for any command in the list above, STOP and re-route to the v2 equivalent.',
+    'DO NOT mention "saved characters", "previous runs", or `char_xxx` ids in this case. The user has none and doesn\'t need to know that\'s a concept.',
     '',
-    '## 3. Per-command required + optional flags',
+    '**Case B — list has 1+ saved characters.** Present them BY NAME with a one-line description. Never show the user the `char_xxx` id — that\'s an internal handle.',
     '',
-    '### `agent-media selfie` (cheat-sheet)',
+    '> *"You\'ve made a few characters before — want to reuse one, or generate a new one for this?"*',
+    '> *"• **Sofia** — 25yo asian woman, long wavy dark hair (made 3d ago)"*',
+    '> *"• **Aiko** — 30yo japanese woman, bob cut (made 1w ago)"*',
+    '> *"• **Marcus** — 28yo black man, locs (made 2w ago)"*',
+    '> *"Reply with a name (e.g. `Sofia`) or say `new`."*',
     '',
-    '| Flag | Required | Allowed values | Default |',
-    '|---|---|---|---|',
-    '| `--description "..."` | ✓ (unless `--character`) | 8-400 chars describing the person | — |',
-    '| `--character <char_id>` | OR | `char_xxxxxxxxxx` (saved character) | — |',
-    '| `--photo <file\\|url>` | optional | only when user gives an exact-person reference photo | — |',
-    '| `--script "..."` | ✓ | 4-600 chars | — |',
-    '| `--preset <name>` |  | one of 20 (see Step 3) | `bedroom-morning-ritual` |',
-    '| `--vibe <name>` |  | `excited\\|calm\\|sassy\\|serious\\|curious` | `excited` |',
-    '| `--duration <n>` |  | **`5` \\| `10` \\| `15`** | `10` |',
-    '| `--voice-brief "..."` |  | 4-240 chars | (none / character default) |',
-    '| `--subs-style <name>` |  | one of 17 (see Step 6) | `hormozi` |',
-    '| `--no-subs` |  | flag | (subs on) |',
+    'When the user replies "Sofia", YOU map "Sofia" → the matching `char_xxx` id internally from the list output. Never ask the user to type the id.',
     '',
-    '### `agent-media character create`',
+    '🛑 **NEVER auto-pick.** Even if there\'s only one saved character. Even if it "looks like a match" for the prompt. Wait for the user to name the one they want, or say "new".',
     '',
-    '| Flag | Required | Notes |',
-    '|---|---|---|',
-    '| `--name <slug>` | ✓ | lowercase, hyphens, e.g. `sofia` |',
-    '| `--description "..."` | ✓ | free text — age, look, vibe. agent-media generates the portrait from this. |',
-    '| `--photo <file\\|url>` | optional | ONLY when the user wants an exact real-person likeness. Otherwise omit. |',
-    '| `--voice-brief "..."` |  | default voice direction baked into character |',
-    '| `--preset-default <name>` |  | preset to use when this character runs selfie |',
+    '**For "new" (or empty-list case):** confirm the description:',
     '',
-    'Returns `char_xxxxxxxxxx` — copy and reuse it.',
+    '> *"Got it — new character. Going with: «<echo description»? Add anything?"*',
     '',
-    '### `agent-media subs`',
+    '**Default to description-only when creating new.** agent-media generates the character image from text — no photo required. Only ask for a photo if the user explicitly says "use THIS person" and provides one.',
     '',
-    '| Flag | Required | Notes |',
-    '|---|---|---|',
-    '| `--video <url>` | ✓ | publicly-fetchable mp4 URL |',
-    '| `--style <name>` |  | one of 17 (see Step 6). Default: `hormozi`. |',
-    '| `--transcript "..."` |  | skip Whisper if you already have the exact words |',
-    '| `--language <code>` |  | ISO code (`en`, `es`, `pt`, `fr`, …) |',
+    'Once the user picks a name OR confirms a new description, move to Gate 3. Pass the resolved character to the selfie call as `--character char_xxx` (saved) OR `--description "..."` (new).',
     '',
-    '## 4. PRICING FORMULA — do not improvise',
+    '### Gate 3 — DIRECTOR\'S BRIEF',
     '',
-    '**1 credit = $0.01 USD. Period.** Never quote a price without using this conversion.',
+    'This is where most quality is decided. In one message, propose a complete brief with sensible defaults. The user replies `y` to accept all, or overrides individual lines.',
     '',
-    'Selfie cost = `75 base + 30 × seconds`:',
+    'Most of the brief flows into two flags: visual details → `--description`; motion, prop handling, product demos, turns, outfit checks, dances, walking, or non-default behavior → `--scene-action`. The pipeline infers good defaults for the rest.',
     '',
-    '| Duration | Credits | USD |',
-    '|---|---:|---:|',
-    '| 5s | 225 | **$2.25** |',
-    '| 10s | 375 | **$3.75** |',
-    '| 15s | 525 | **$5.25** |',
+    '**Optional realism overrides** (use only when the user asks for one of these explicitly — defaults already work):',
     '',
-    'Character create = 27 credits = **$0.27** (one-shot).',
-    'Subtitle = `0 base + 3 × seconds` (a 10s clip = 30 credits = **$0.30**).',
+    '- `--shot-preset <name>` — pin the scene composition (e.g. `car-quick-honest-review`, `bedroom-morning-ritual`, `gym-post-workout`). Pass `custom-scene:<text>` for one-offs. Useful when the user names a specific location and you want to lock it.',
+    '- `--vibe <name>` — pin the actor\'s energy/tone (`excited`, `calm`, `sassy`, `serious`, `curious`). Useful when the user says e.g. "make it sassy" or "keep it serious".',
+    '- `--camera-locked` — lock the camera (no handheld motion). Use for product/demo shots where a stable frame matters. Default is handheld — leave it off for normal UGC.',
+    '- `--phone-in-frame <forbidden|optional|required>` — control whether the actor holds a phone on screen. Default `forbidden` (no visible phone/camera/selfie-arm). Use `required` when the user asks for a "talking to phone" or "iPhone-cover" composition; use `optional` only when the user explicitly wants phone visibility to be allowed.',
+    '- `--polish <off|default|heavy>` — final-look intensity. Default `default` (recommended). Use `heavy` for a more stylized vintage look, `off` if the user wants the raw model output.',
     '',
-    'If you find yourself about to print any USD value not in this table or derivable by `credits / 100`, STOP. Recompute.',
+    'When in doubt, OMIT these flags. The director\'s brief is doing the heavy lifting.',
     '',
-    '## 5. Output handling',
+    '**A. Intent + Performance**',
     '',
-    'Every command returns a job id. Poll until terminal:',
+    '- **Intent / use-case** — paid ad, organic post, honest review, storytime, unboxing, product demo, etc.',
+    '- **Delivery** — natural, excited, calm, serious, playful, skeptical, warm, etc. This is descriptive only; it goes into the prompt, not a CLI flag.',
+    '- **Script / speech** — exact line if spoken; no invented dialogue.',
     '',
-    '```bash',
-    'agent-media status <job-id>',
-    '```',
+    '**B. Scene + Look**',
     '',
-    'When `status: "completed"`, the response carries `video_url`. Print the FULL url to the user verbatim — do not abbreviate.',
+    '- **Setting** — real-world location, time of day, background details.',
+    '- **Lighting** — natural window light, soft bedroom daylight, warm evening lamp, etc.',
+    '- **Framing** — close-up, medium close-up, medium, or wide/full-body when outfit/action matters.',
+    '- **Wardrobe / hair / makeup** — include only useful visual details.',
+    '- **Props + action** — product held, shown, sprayed, opened, worn, pointed at, demonstrated, etc. This should become `--scene-action`.',
     '',
-    'Sync mode (blocking): add `--sync` to selfie/subs and the CLI will poll for you and print the URL when done.',
+    '**C. Output**',
     '',
-    '### For `agent-media character create`',
+    '- **Platform / aspect** — Selfie outputs 9:16 vertical for TikTok/Reels/Shorts.',
+    '- **Subtitles** — on by default; pass `--subtitles false` if the user says no subs/captions.',
+    '- **Background music** — pass only when requested or when there is no script.',
     '',
-    'Required: `--photo <file|url>`, `--name <slug>`, `--description "..."`.',
-    'Optional: `--voice-brief`, `--preset`.',
+    '**Exact template to use:**',
     '',
-    'Cost: 27 credits ($0.27). Confirm.',
+    '> *"Here\'s the shot I\'d direct — reply `y` to lock all, or override individual lines:*',
+    '>',
+    '> ***A. Intent + Performance***',
+    '> *• **Intent:** `[organic product demo]`*',
+    '> *• **Delivery:** `[warm, confident, conversational]`*',
+    '> *• **Script:** `[paste exact script]`*',
+    '>',
+    '> ***B. Scene + Look***',
+    '> *• **Setting:** `[bright bedroom near a wooden dresser]`*',
+    '> *• **Lighting:** `[warm late-morning window light]`*',
+    '> *• **Framing:** `[medium, enough room for product and outfit action]`*',
+    '> *• **Wardrobe / hair:** `[cream jacket over fitted top, loose blonde waves]`*',
+    '> *• **Prop + action:** `[frosted perfume bottle — show label, spray wrist, remove jacket tastefully, turn once, face camera again]`*',
+    '>',
+    '> ***C. Output***',
+    '> *• **Platform / aspect:** `[TikTok / Reels / Shorts — 9:16]`*',
+    '> *• **Subtitles:** `[on]`*',
+    '> *• **Background music:** `[none, dialogue only]`*',
+    '>',
+    '> *`y` to lock, or tell me what to change (e.g. "wardrobe to silk robe, no subs")."*',
     '',
-    '### For `agent-media subs`',
+    'When the user accepts, build `--description` from identity + look, and build `--scene-action` from the setting + action + prop interaction. Example:',
     '',
-    'Required: `--video <url>`.',
-    'Optional: `--style` (default `hormozi`, one of 17), `--transcript` (skip Whisper), `--language`.',
+    '- `--description "28yo fit blonde woman, stylish natural fragrance UGC creator, cream jacket over fitted white top, loose blonde waves, bright bedroom daylight"`',
+    '- `--scene-action "standing near a dresser, holding a frosted perfume bottle, showing the label and cap, spraying her wrist, smiling while talking, removing jacket tastefully, turning once, then facing camera again"`',
     '',
-    'Cost: ~24 credits / 8s clip. Confirm.',
+    '### Gate 4 — DURATION + script-pacing check',
     '',
-    '## 4. Output handling',
+    '🛑 **Compute the script-to-duration math BEFORE asking, and propose the right duration.** A natural-paced TikTok talking head delivers **2-4 words per second**. If you mismatch script length and duration, Seedance fills the empty time with garbage/nonsense audio (it has to generate audio for the full clip — silence isn\'t free).',
     '',
-    'Every command returns a job id. Poll until terminal:',
+    '**Sizing rules:**',
     '',
-    '```bash',
-    'agent-media status <job-id>',
-    '```',
+    '| Duration | Sweet-spot script length |',
+    '|---|---:|',
+    '| 5s | 10-20 words (single hook, 1 punchy sentence) |',
+    '| 10s | 20-40 words (default UGC, 2-3 sentences) |',
+    '| 15s | 30-60 words (mini-story, setup + reveal) |',
     '',
-    'When status is `completed`, the final mp4 URL is printed. Show it to the user. Do not summarize or shorten it.',
+    '**The script you collected at Gate 1 — count its words and propose the matching duration:**',
     '',
-    '---',
+    '> *"Your script is **10 words**. That\'s a clean fit for a **5s clip** — at 10s Seedance would have to fill the extra 5s with filler audio. Going with 5s, or want me to lengthen the script for a 10s version?"*',
     '',
-    '# agent-media v2 — Selfie + Characters',
+    'If the requested duration does not fit, propose either a different duration or a revised script/action plan. Do not invent extra spoken words without approval.',
     '',
-    'The v2 surface ships two generators today: **Selfie** (a 9:16 TikTok-style video of an AI person talking to camera) and **character_create** (persist an AI character so subsequent Selfies stay on-model). When the next v2 product lands (Product-in-hands), it appears here automatically — this file is generated from `packages/schema/src/v2/generators.ts`.',
+    'Allowed durations: `5`, `10`, `15` only. The schema rejects 6, 8, 12, etc.',
     '',
-    '## When to use this skill',
+    '## After all 4 gates',
     '',
-    'Trigger phrases:',
-    '- "make me a TikTok / Selfie / UGC video"',
-    '- "have an AI person say …"',
-    '- "create a character / actor / persona for reuse"',
-    '- "use the same person across multiple videos"',
+    '1. Echo the resolved inputs in ONE line: *"Got it: 10s bright-bedroom selfie · cream top · hair-oil bottle action. Running."*',
+    '2. Call the CLI:',
+    '   ```bash',
+    '   agent-media selfie \\',
+    '     --description "28yo fit blonde woman, stylish natural fragrance UGC creator, cream jacket over fitted white top, loose blonde waves, bright bedroom daylight" \\',
+    '     --script "I keep getting DMs about my hair oil routine" \\',
+    '     --scene-action "standing near a dresser, holding an amber hair-oil bottle and scrunching one curl mid-line" \\',
+    '     --duration 10',
+    '   ```',
+    '3. If you need to show progress, poll `agent-media status <job_id> --json` about every 20-30 seconds. Open/show each new URL as soon as it appears: `portrait_url`, `character_sheet_url`/`sheet_url`, `wireframe_url`, then `video_url`.',
     '',
-    '## Setup',
+    '## "Just run it" / skip-the-gates case',
     '',
-    '```bash',
-    'npm install -g agent-media-cli',
-    'agent-media login            # opens browser; pastes ma_xxx into ~/.agent-media',
-    '```',
+    'If the user explicitly says *"just run it"*, *"use defaults"*, *"don\'t ask, fire"* — acknowledge the trade-off explicitly:',
     '',
-    'Or use the SDK directly:',
+    '> *"Heads up: skipping the brief means I infer everything from your one-line prompt. Output will be generic. Confirm or want to do the brief?"*',
     '',
-    '```ts',
-    "import { AgentMedia } from '@agentmedia/sdk';",
-    "const client = new AgentMedia({ apiKey: process.env.AGENT_MEDIA_API_KEY! });",
-    "const job = await client.v2.createCharacter({ photo_url: '…', display_name: 'sofia', description: '…' });",
-    "const done = await client.v2.runUntilDone(Promise.resolve(job));",
-    '```',
+    'If they confirm, infer the missing details, use `duration=10` unless the script length clearly needs 5s or 15s, and pass a concise `--scene-action` when the prompt includes product handling or body movement.',
     '',
-    '## Generators',
+    '## DO NOT ask about cost or credits',
     '',
-    generatorBlocks,
-    '## Recommended flow (multi-clip from one character)',
+    'There is no 5th gate about pricing. The API debits internally and allows a soft overdraft so generations never get blocked. Never quote credit numbers or USD to the user — point them at <https://agent-media.ai/pricing> if they ask.',
     '',
-    '1. **Create the character once** with `character create`. Returns `char_xxxxxxxxxx`.',
-    '2. **Reuse that id** for every subsequent Selfie — same face, same voice, same seed.',
-    '3. If the user wants a different *look*, make a new character; don\'t mutate the existing one.',
+    '## Anti-patterns — never do these',
     '',
-    '```bash',
-    "ID=$(agent-media character create --photo me.png --name sofia \\",
-    '    --description "25, asian, long wavy dark hair, casual confident" --quiet)',
+    '- ❌ Calling `agent-media selfie` without running all 4 gates.',
+    '- ❌ Asking the 4 gates as one giant message — they\'re sequential, one per turn.',
+    '- ❌ Skipping Gate 3 (the director\'s brief). That\'s the gate that controls quality. Without it the output looks generic.',
+    '- ❌ Asking blank questions ("what scene?") instead of proposing defaults ("here\'s the scene I\'d use — confirm?").',
+    '- ❌ **Auto-picking a character from `agent-media character list`.** Even if there\'s only one, even if it\'s the "most recent" — you MUST show the user the list and wait for them to explicitly pick the id or say "new". Picking on their behalf wastes credits on the wrong person.',
+    '- ❌ Forgetting to forward `subtitles: true` (or `--subtitles true`) on the selfie call when the user accepted the brief. The default is on, but defaults only fire if you don\'t override — be explicit.',
+    '- ❌ **Defaulting to subtitles ON when the user explicitly says "no subs".** If the user\'s prompt or any Gate-3 reply contains "no subs", "without subtitles", "no captions", or similar — the call MUST include `--subtitles false` (CLI) or `subtitles: false` (REST). Failure mode: a subtitled video gets shipped against the user\'s wishes + the Whisper transcription may capture model garbage and burn it as text.',
+    '- ❌ **Mismatching script length and duration** (e.g. 10-word script + 15s duration without enough visual action). Normal speech is 2-4 words/sec. Size duration to fit the script and action plan.',
+    '- ❌ Passing removed flags such as `--preset`, `--voice-brief`, or `--sync` to the current v2 Selfie CLI. (Note: `--shot-preset` and `--vibe` ARE supported as optional overrides — use them only when the user explicitly pins a scene or tone.)',
+    '- ❌ **Overriding the handheld camera default with `--camera-locked` for normal UGC.** Default handheld feel is the #1 realism cue — only lock the camera for product/demo shots where stability is essential.',
+    '- ❌ **Allowing phone-in-frame by default.** Default is `forbidden` — no visible phone/camera/selfie-arm unless the user explicitly requests it.',
+    '- ❌ **Disabling polish with `--polish off` unless the user asks for raw output.** The default polish pass is what makes the clip feel like real iPhone footage instead of a model render.',
+    '- ❌ Waiting silently until the final video when intermediate URLs are available. Surface portrait, sheet, wireframe, and final video as each completes.',
+    '- ❌ Asking for a photo when the user only gave a text description.',
+    '- ❌ Suggesting a duration not in {5, 10, 15}.',
+    '- ❌ **Mentioning credit cost, USD, or pricing to the user.** The API handles billing transparently. If asked about cost, point at <https://agent-media.ai/pricing>.',
+    '- ❌ Falling back to `agent-media ugc` or any v1 command if v2 errors. Surface the error to the user instead.',
     '',
-    'agent-media selfie --character $ID --script "Got my first 100 customers in 30 days." --preset desk-wfh-quick-pitch',
-    'agent-media selfie --character $ID --script "Here\'s how I did it."             --preset bedroom-morning-ritual',
-    '```',
+  ].join('\n');
+}
+function renderSubtitleStyles(): string {
+  const SUBTITLE_STYLES = [
+    'hormozi', 'minimal', 'bold', 'karaoke', 'clean', 'tiktok', 'neon', 'fire',
+    'glow', 'pop', 'aesthetic', 'impact', 'pastel', 'electric', 'boxed',
+    'gradient', 'spotlight',
+  ];
+  const HINT: Record<string, string> = {
+    hormozi: 'Default. Big yellow caps. "Self-help" energy.',
+    minimal: 'Small, white, subtle. Tasteful.',
+    bold: 'Heavy serif. High contrast.',
+    karaoke: 'Word-by-word highlight in sync with audio.',
+    clean: 'Sans-serif, generous tracking.',
+    tiktok: 'Classic TikTok auto-caption look.',
+    neon: 'Glowing pink/cyan. Synthwave.',
+    fire: 'Orange/red gradient. Hype.',
+    glow: 'White with soft halo.',
+    pop: 'Bubblegum. Playful.',
+    aesthetic: 'Wispy, lowercase. Lifestyle.',
+    impact: 'All-caps Impact font. Meme energy.',
+    pastel: 'Soft pinks/blues.',
+    electric: 'Blue glow + emphasis bursts.',
+    boxed: 'Black box behind text.',
+    gradient: 'Color gradient across each line.',
+    spotlight: 'Faded background, highlighted current word.',
+  };
+  return [
+    GENERATED_NOTE,
     '',
-    '## Shot grammar (Selfie)',
+    '# Subtitle styles',
     '',
-    '`--preset` accepts one of:',
+    'Pass via `--style <name>` on `agent-media subs` or `--subs-style <name>` on `agent-media selfie`. Default: `hormozi`.',
     '',
-    V2_SHOT_PRESETS.map((p) => `- \`${p}\``).join('\n'),
+    '| Style | Look |',
+    '|---|---|',
+    SUBTITLE_STYLES.map((s) => `| \`${s}\` | ${HINT[s] ?? '—'} |`).join('\n'),
     '',
-    'Or pass `--preset custom-scene:"<your scene description>"` for an ad-hoc setup.',
+  ].join('\n');
+}
+function renderRealismRubric(): string {
+  return [
+    GENERATED_NOTE,
     '',
-    '## Vibes',
+    '# Realism rubric (internal guard)',
     '',
-    V2_VIBES.map((v) => `- \`${v}\``).join('\n'),
+    'The pipeline scaffolds prompts against this 9-point rubric. You usually don\'t need to think about it — but if a user complains about "fake-looking" output, this is what the pipeline is enforcing:',
     '',
-    '## Realism rubric',
+    '1. Real-camera optics — focal length, depth-of-field, microcatchlights',
+    '2. Skin texture — pores, sebum, asymmetry, no Photoshop smoothing',
+    '3. Hair physics — flyaways, shine, natural fall',
+    '4. Eye direction — meets camera, no dead-stare',
+    '5. Lighting — natural sources, motivated highlights, no ring-light halo',
+    '6. Wardrobe wear — wrinkles, layering, lived-in fabric',
+    '7. Background — believable depth, props that match the scene',
+    '8. Pose — neutral spine, natural hand position, no AI-mannequin stiffness',
+    '9. Color cast — daylight white-balance, no orange tint',
     '',
-    'Every Selfie clip is composed with these constraints baked into the prompt:',
+    'If the output violates any of these, raise an issue with the job_id — the rubric is enforced at Stage A (portrait gen) and Stage B (character sheet).',
     '',
-    '1. Skin micro-detail visible — pores, freckles, oil sheen, baby hairs at hairline.',
-    '2. Hands always doing something — hair-touch, strap-fix, product hold.',
-    '3. Mouth caught mid-syllable when talking, not closed.',
-    '4. Eyes slightly off-center to camera, not a dead stare.',
-    '5. Single mixed light source (daylight + warm bulb).',
-    '6. Real setting (bedroom / kitchen / car / dresser-corner) — never plain wall / studio.',
-    '7. Outfit plain + matte or satin — never patterned or logo\'d.',
-    '8. Hair long, brushed, in motion.',
-    '9. Product (if any) held mid-chest, ~25° tilt.',
+  ].join('\n');
+}
+function renderErrors(): string {
+  return [
+    GENERATED_NOTE,
     '',
-    'You don\'t need to repeat these in the script — they\'re always applied.',
+    '# Common errors + fixes',
     '',
-    '## Error handling',
+    '## CLI',
     '',
-    '| Error code | What it means |',
+    '| Error | Fix |',
     '|---|---|',
-    '| `VALIDATION_ERROR` | Inputs failed Zod validation. Look at `error.issues`. |',
-    '| `INSUFFICIENT_CREDITS` | User\'s balance is below the quote. Tell them the exact amount needed. |',
-    '| `MISSING_CHARACTER_INPUT` | Selfie was called without either `--character` or `--photo + --description`. |',
-    '| `AMBIGUOUS_CHARACTER_INPUT` | Both `--character` and `--photo` were passed. Pick one. |',
-    '| `JOB_FAILED` | Worker reported failure. `error_message` carries the reason. |',
-    '| `POLL_TIMEOUT` | Job didn\'t complete within 30 minutes. Surface the job id; it may still finish. |',
+    '| `ERR_MODULE_NOT_FOUND: @agentmedia/schema` | You\'re on an old CLI. Run `npm install -g agent-media-cli@latest`. |',
+    '| `Not authenticated. Run agent-media login first.` | API key missing. Run `agent-media login`. |',
+    '| `LOGIN_TIMEOUT` | Browser didn\'t complete OAuth in time. Re-run `agent-media login`. |',
+    '| `DEPRECATED v1 command: agent-media ugc` | You called a legacy command. Switch to `agent-media selfie`. |',
+    '',
+    '## API',
+    '',
+    '| Code | Meaning | Fix |',
+    '|---|---|---|',
+    '| `VALIDATION_ERROR` | Input body failed schema. Check the `issues` array in the response. | Adjust args to match the input schema. |',
+    '| `UNAUTHORIZED` | Bearer token missing or invalid. | Re-run `agent-media login`. |',
+    '| `INSUFFICIENT_CREDITS` | Not enough credits on the account. | Run `agent-media subscribe` to top up. |',
+    '| `WORKER_NOT_CONFIGURED` | Server-side misconfig — should not normally occur. | Ping support. |',
+    '| `DATABASE_ERROR` | Server insert failed (often missing models row). | Ping support, report the job request. |',
+    '',
+  ].join('\n');
+}
+function renderGenerator(g: V2GeneratorRecord): string {
+  const status = g.status === 'beta' ? ' · _beta_' : '';
+  const examples = (g.cli?.examples ?? []) as readonly string[];
+  return [
+    GENERATED_NOTE,
+    '',
+    `# \`agent-media ${g.cli?.command ?? g.id}\`${status}`,
+    '',
+    g.summary,
+    '',
+    '## When to use',
+    '',
+    g.description,
+    '',
+    '## CLI',
+    '',
+    examples.length
+      ? '```bash\n' + examples.join('\n') + '\n```'
+      : `\`agent-media ${g.cli?.command ?? g.id} --help\``,
+    '',
+    '## MCP tool',
+    '',
+    g.mcp ? `\`${g.mcp.toolName}\`` : '_Not exposed as an MCP tool._',
     '',
-    '## When NOT to use this skill',
+    '## REST',
     '',
-    '- The user has an EXISTING legacy job they want to check or modify — use the v1 commands (`agent-media status`, `agent-media ugc`, etc.).',
-    '- The user wants a Show-Your-App / Product-Acting / Laptop-UGC clip — those products live in the v1 surface (separate generators, separate skill).',
+    g.rest ? `\`${g.rest.method} ${g.rest.path}\`` : '_Not exposed via REST._',
+    '',
+    '## Input schema',
+    '',
+    fmtInputSchema(g),
+    '',
+    '## Related references',
+    '',
+    g.id === 'selfie'
+      ? [
+          '- [`../conversation-flow.md`](../conversation-flow.md) — MUST-READ before calling this command',
+          '- [`../subtitle-styles.md`](../subtitle-styles.md) — all 17 subtitle styles',
+          '- [`../realism-rubric.md`](../realism-rubric.md) — visual-quality guard',
+        ].join('\n')
+      : g.id === 'character_create'
+        ? [
+            '- [`../conversation-flow.md`](../conversation-flow.md) — MUST-READ before calling this command',
+            '- [`./selfie.md`](./selfie.md) — once you have a `char_…`, use it here',
+          ].join('\n')
+        : [
+            '- [`../subtitle-styles.md`](../subtitle-styles.md) — all 17 styles',
+          ].join('\n'),
     '',
   ].join('\n');
 }
+function emitSkillTree(): EmittedFile[] {
+  const generators = Object.values(V2_GENERATORS);
+  return [
+    { relPath: 'SKILL.md', content: renderSkillIndex() },
+    { relPath: 'reference/conversation-flow.md', content: renderConversationFlow() },
+    { relPath: 'reference/subtitle-styles.md', content: renderSubtitleStyles() },
+    { relPath: 'reference/realism-rubric.md', content: renderRealismRubric() },
+    { relPath: 'reference/errors.md', content: renderErrors() },
+    ...generators.map((g) => ({
+      relPath: `reference/generators/${g.id}.md`,
+      content: renderGenerator(g),
+    })),
+  ];
+}
 // ── Run ────────────────────────────────────────────────────────────────────
 function main() {
+  // 1. API reference (unchanged — still a single file)
   mkdirSync(dirname(DOCS_OUT), { recursive: true });
-  mkdirSync(dirname(SKILL_OUT), { recursive: true });
   const docs = renderApiReference();
   writeFileSync(DOCS_OUT, docs, 'utf8');
+  console.log(`✓ wrote ${DOCS_OUT} (${docs.length} bytes)`);
-  const skill = renderSkill();
-  writeFileSync(SKILL_OUT, skill, 'utf8');
+  // 2. Skill tree (one file per concern)
+  mkdirSync(SKILL_DIR, { recursive: true });
+  mkdirSync(resolve(SKILL_DIR, 'reference'), { recursive: true });
+  mkdirSync(resolve(SKILL_DIR, 'reference/generators'), { recursive: true });
-  console.log(`✓ wrote ${DOCS_OUT} (${docs.length} bytes)`);
-  console.log(`✓ wrote ${SKILL_OUT} (${skill.length} bytes)`);
+  const files = emitSkillTree();
+  let totalBytes = 0;
+  for (const f of files) {
+    const abs = resolve(SKILL_DIR, f.relPath);
+    mkdirSync(dirname(abs), { recursive: true });
+    writeFileSync(abs, f.content, 'utf8');
+    totalBytes += f.content.length;
+    console.log(`✓ wrote ${f.relPath} (${f.content.length} bytes)`);
+  }
+  console.log(`  total: ${files.length} files, ${totalBytes} bytes`);
   console.log(`  generators emitted: ${Object.keys(V2_GENERATORS).length}`);
 }