npm - @writepanda/mcp - Versions diffs - 1.34.0 → 1.38.0 - Mend

@writepanda/mcp 1.34.0 → 1.38.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/bin/server.mjs +152 -7
package/package.json +1 -1

package/bin/server.mjs CHANGED Viewed

@@ -162,6 +162,37 @@ const TOOLS = [
 		inputSchema: { type: "object", properties: {} },
 		command: "system.list",
 	},
+	{
+		name: "system_get_transcription_language",
+		description:
+			"Read the active transcription engine selection for the current workspace. Returns { language } where language is one of: 'auto' (Parakeet TDT v3, default — auto-detects English + 25 European languages including Russian/Ukrainian), 'chinese' / 'japanese' / 'korean' / 'hindi' / 'arabic' / 'thai' (each routes to Whisper Large-v3-turbo). Use this when surfacing the active engine to the user or before recommending a switch.",
+		inputSchema: { type: "object", properties: {} },
+		command: "system.getTranscriptionLanguage",
+	},
+	{
+		name: "system_set_transcription_language",
+		description:
+			"Switch the transcription engine for the current workspace. Default 'auto' uses Parakeet (English + 25 European languages, auto-detected, word-level timestamps native). Non-'auto' values route to Whisper Large-v3-turbo with that language locked in. **Important**: non-'auto' choices require a one-time ~1.1 GB Whisper model download — call `system_is_whisper_model_downloaded` first, and surface the download requirement to the user before switching. Use this when the user explicitly asks for a non-European transcription language (e.g., 'transcribe this in Chinese'), or when project content clearly indicates a different language than the current setting.",
+		inputSchema: {
+			type: "object",
+			properties: {
+				language: {
+					type: "string",
+					enum: ["auto", "chinese", "japanese", "korean", "hindi", "arabic", "thai"],
+					description: "Target language. 'auto' = Parakeet (default); the others route to Whisper.",
+				},
+			},
+			required: ["language"],
+		},
+		command: "system.setTranscriptionLanguage",
+	},
+	{
+		name: "system_is_whisper_model_downloaded",
+		description:
+			"Check whether the Whisper Large-v3-turbo model has been downloaded yet. Returns { downloaded: boolean }. ALWAYS call this before `system_set_transcription_language` to a non-'auto' value — Whisper transcription fails with a structured error if the model isn't on disk, and surprising the user with a 1.1 GB download mid-flow is bad UX.",
+		inputSchema: { type: "object", properties: {} },
+		command: "system.isWhisperModelDownloaded",
+	},
 	// ── workspaces (v1.19) ──────────────────────────────────────────
 	// Multi-workspace isolation: each workspace has its own projects,
@@ -436,7 +467,7 @@ const TOOLS = [
 	{
 		name: "project_read",
 		description:
-			"Read a project's full JSON. Returns { path, project, clipStates, workspaceId, workspaceName, isInActiveWorkspace }. `clipStates` is a per-clip summary: { clipId, mediaPath, durationMs, transcribed, wordCount, audioCleaned, cleanedAudioPath? } — use it to decide whether to call transcript_transcribe or audio_clean before editing. **Workspace fields:** every read includes the project's owning workspace; if `isInActiveWorkspace` is false, the YouTube account and Replicate key in scope are NOT the ones that own this project — surface the mismatch to the user before any export or publish. Pass `project.revision` back as `expectedRevision` on subsequent writes for conflict-safe edits. **Performance tip:** pass `includeTranscript: false` after your first read to drop the per-clip transcript words from the response — they're typically 600+ KB on a 5-minute recording and most agent flows don't need them after pacing is done. clipStates always tells you the transcribed/wordCount status either way.",
+			"Read a project's full JSON. Returns { path, project, clipStates, workspaceId, workspaceName, isInActiveWorkspace }. `clipStates` is a per-clip summary: { clipId, mediaPath, durationMs, transcribed, wordCount, audioCleaned, cleanedAudioPath? } — use it to decide whether to call transcript_transcribe or audio_clean before editing. **Workspace fields:** every read includes the project's owning workspace; if `isInActiveWorkspace` is false, the YouTube account and Replicate key in scope are NOT the ones that own this project — surface the mismatch to the user before any export or publish. Pass `project.revision` back as `expectedRevision` on subsequent writes for conflict-safe edits. **Performance tip:** pass `includeTranscript: false` after your first read to drop the per-clip transcript words from the response — they're typically 600+ KB on a 5-minute recording and most agent flows don't need them after pacing is done. clipStates always tells you the transcribed/wordCount status either way. Clips at project.mainTrack.clips[], overlays at project.editor.mediaOverlayRegions[]. Response includes editedDurationMs, sourceDurationMs, totalTrimmedMs, trimCount.",
 		inputSchema: {
 			type: "object",
 			properties: {
@@ -507,16 +538,21 @@ const TOOLS = [
 	{
 		name: "project_add_motion_graphic",
 		description:
-			"Drop a motion-graphic MP4 onto the timeline. The `file` argument MUST be the exact `outputPath` returned by a prior motion_render_html / motion_generate / motion_concat / motion_screenshot job — NEVER hand-author or guess this path. Optional SFX plays when it appears.",
+			"Drop a motion-graphic MP4/WebM onto the timeline. PREFERRED: pass `fromJob` (the jobId from motion_render_html / motion_generate / motion_concat) — the server resolves the outputPath internally, so you never handle the path string at all. Fallback: pass `file` (an absolute path) only for external/uploaded files. Optional SFX plays when it appears.",
 		inputSchema: {
 			type: "object",
 			properties: {
 				id: { type: "string" },
 				path: { type: "string" },
+				fromJob: {
+					type: "string",
+					description:
+						"PREFERRED for render outputs. The jobId returned by motion_render_html / motion_generate / motion_concat. The server reads the outputPath the job produced — you never construct or pass a path, eliminating the path-truncation failure mode entirely. The job must have succeeded (call job_wait first). Mutually exclusive with `file`.",
+				},
 				file: {
 					type: "string",
 					description:
-						"Absolute path to the rendered MP4/WebM. MUST be the exact `outputPath` returned by motion_render_html (or motion_generate / motion_concat / motion_screenshot). Do NOT construct paths manually — guessed paths get truncated at whitespace (e.g. `/Users/.../Library/Application` from `Application Support`) and the overlay flickers and disappears in preview. If you don't have an outputPath, render one first.",
+						"Absolute path to an external MP4/WebM (e.g. a user upload). For RENDER outputs use `fromJob` instead. If you must use `file`, pass the exact `outputPath` from a render job — never construct paths manually (they get truncated at the space in `Application Support` and the overlay silently fails). One of `fromJob` or `file` is required.",
 				},
 				durationMs: { type: "number" },
 				atMs: { type: "number", description: "Default: end of timeline" },
@@ -551,10 +587,71 @@ const TOOLS = [
 				},
 				expectedRevision: { type: "number" },
 			},
-			required: ["file", "durationMs"],
+			required: ["durationMs"],
 		},
 		command: "project.add-motion-graphic",
 	},
+	{
+		name: "project_add_designed_segment",
+		description:
+			"Create a 'designed segment' — the YouTube split where the host stays LIVE on one half and a motion-graphic panel fills the other (host right / panel left, like a Vox or MKBHD explainer beat). ONE atomic call places both pieces over the same time range with the same transition and source anchor, so they can't drift or mismatch: the camera is repositioned + cover-cropped into its half (a full-bleed split clip-transform) and a full-frame transparent panel graphic is composited on top. Stays in the live compositor — camera is full-quality and scrubbable, nothing baked. IMPORTANT: author the panel graphic as a FULL-FRAME (1920×1080) TRANSPARENT render via motion_render_html --transparent — paint the opaque panel + content on the panel side, leave the camera's half fully transparent (it reveals the repositioned host). See SKILL.md 'Designed segments'.",
+		inputSchema: {
+			type: "object",
+			properties: {
+				id: { type: "string" },
+				path: { type: "string" },
+				fromJob: {
+					type: "string",
+					description:
+						"PREFERRED. The jobId from the transparent motion_render_html job (the full-frame panel graphic with the camera half transparent). Server resolves the outputPath internally — no shell, no path truncation. Mutually exclusive with `file`.",
+				},
+				file: {
+					type: "string",
+					description:
+						"Absolute path to the transparent panel graphic (WebM/MOV with alpha). Prefer `fromJob`; if used, pass a render job's exact outputPath — never hand-construct (truncates at the space in 'Application Support').",
+				},
+				durationMs: { type: "number" },
+				atMs: { type: "number", description: "Default: end of timeline" },
+				cameraSide: {
+					type: "string",
+					enum: ["left", "right"],
+					description:
+						"Which half the CAMERA fills; the panel graphic fills the opposite half. 'right' is the canonical reference (host right, panel left).",
+				},
+				cameraRatio: {
+					type: "number",
+					enum: [50, 55],
+					description:
+						"Camera's share of the frame width: 55 (default, the reference split) or 50 (balanced). Panel gets the remaining 45 or 50. Author the panel's opaque width to match (e.g. left 45% for cameraSide=right, cameraRatio=55).",
+				},
+				transitionMs: {
+					type: "number",
+					description: "Slide-in/out window at each edge in ms. Default 320.",
+				},
+				soundUrl: {
+					type: "string",
+					description:
+						"Optional SFX when the segment appears. Bundled id (bundled:sound/<id>), absolute path, or file:// URL. Use asset_list_sounds to discover.",
+				},
+				soundVolume: {
+					type: "number",
+					description: "Sound volume 0–1. Default 1 when soundUrl is set.",
+				},
+				anchorSourceMs: {
+					type: "number",
+					description:
+						"Anchor BOTH regions to a SOURCE-time moment (transcript word startMs). Pass when atMs was derived from a transcript word so the whole segment stays glued across later transcript edits. Omit for free-floating placement.",
+				},
+				anchorSourceEndMs: {
+					type: "number",
+					description: "Optional anchor end (source ms) for ranged anchoring.",
+				},
+				expectedRevision: { type: "number" },
+			},
+			required: ["durationMs", "cameraSide"],
+		},
+		command: "project.add-designed-segment",
+	},
 	{
 		name: "project_set_overlay_backdrop_blur",
 		description:
@@ -1413,13 +1510,26 @@ const TOOLS = [
 	{
 		name: "caption_set_template",
 		description:
-			"Pick a caption template: classic, modern, minimal, bold, spotlight, boxed, neon, or colored.",
+			"Pick a caption template: classic, modern, minimal, bold, spotlight, boxed, neon, colored, or texture. `texture` fills large uppercase words with a flowing texture mask (lava/marble/metal/wood/concrete/rock) — pick the texture via caption_set_style `texture` (defaults to lava).",
 		inputSchema: {
 			type: "object",
 			properties: {
 				id: { type: "string" },
 				path: { type: "string" },
-				templateId: { type: "string" },
+				templateId: {
+					type: "string",
+					enum: [
+						"classic",
+						"modern",
+						"minimal",
+						"bold",
+						"spotlight",
+						"boxed",
+						"neon",
+						"colored",
+						"texture",
+					],
+				},
 				expectedRevision: { type: "number" },
 			},
 			required: ["templateId"],
@@ -1454,6 +1564,11 @@ const TOOLS = [
 				strokeColor: { type: "string", description: "Text stroke/outline color" },
 				strokeWidth: { type: "number", description: "Text stroke width in px" },
 				fontSize: { type: "string", description: "CSS font-size value, e.g. '28px'" },
+				texture: {
+					type: "string",
+					enum: ["lava", "marble", "metal", "wood", "concrete", "rock"],
+					description: "Texture for the 'texture' caption template. Ignored by other templates.",
+				},
 				expectedRevision: { type: "number" },
 			},
 		},
@@ -1868,6 +1983,19 @@ const TOOLS = [
 	},
 	// ── async jobs ─────────────────────────────────────────────────
+	{
+		name: "job_cancel",
+		description:
+			"Cancel a running or queued job. Idempotent — already-terminal jobs are returned as-is.",
+		inputSchema: {
+			type: "object",
+			properties: {
+				id: { type: "string", description: "Job id" },
+			},
+			required: ["id"],
+		},
+		command: "job.cancel",
+	},
 	{
 		name: "job_wait",
 		description:
@@ -1896,6 +2024,23 @@ const TOOLS = [
 		command: "job.get",
 	},
+	// ── timeline helpers ────────────────────────────────────────────
+	{
+		name: "timeline_source_to_edited",
+		description:
+			"Convert source-time ms to edited-timeline ms, accounting for trims and speed regions. Returns null if inside a trimmed region.",
+		inputSchema: {
+			type: "object",
+			properties: {
+				id: { type: "string" },
+				path: { type: "string" },
+				sourceMs: { type: "number", description: "Source-time position in ms" },
+			},
+			required: ["sourceMs"],
+		},
+		command: "timeline.source-to-edited",
+	},
 	// ── escape hatch ────────────────────────────────────────────────
 	{
 		name: "pandastudio_call",
@@ -1918,7 +2063,7 @@ const TOOLS = [
 const server = new Server(
 	{
 		name: "pandastudio",
-		version: "1.17.0",
+		version: "1.19.0",
 	},
 	{
 		capabilities: {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
 	"name": "@writepanda/mcp",
-	"version": "1.34.0",
+	"version": "1.38.0",
 	"description": "Model Context Protocol server for PandaStudio. Exposes the desktop video editor's automation surface to Cursor, Continue, Cline, Claude Desktop, and any MCP-compliant client.",
 	"keywords": [
 		"pandastudio",