npm - @mindstudio-ai/remy - Versions diffs - 0.1.20 → 0.1.22 - Mend

@mindstudio-ai/remy 0.1.20 → 0.1.22

This diff shows the changes between publicly available versions of the package as released to one of the supported registries. It is provided for informational purposes only and reflects the differences between package versions as they appear in their respective public registries.

Files changed (21) hide show

package/dist/compiled/design.md +2 -1
package/dist/compiled/msfm.md +1 -0
package/dist/headless.js +172 -113
package/dist/index.js +186 -115
package/dist/prompt/.notes.md +1 -1
package/dist/prompt/compiled/design.md +2 -1
package/dist/prompt/compiled/msfm.md +1 -0
package/dist/prompt/sources/frontend-design-notes.md +1 -0
package/dist/prompt/static/authoring.md +4 -4
package/dist/prompt/static/team.md +7 -3
package/dist/static/authoring.md +4 -4
package/dist/static/team.md +7 -3
package/dist/subagents/codeSanityCheck/prompt.md +12 -0
package/dist/subagents/designExpert/.notes.md +3 -2
package/dist/subagents/designExpert/data/compile-inspiration.sh +2 -2
package/dist/subagents/designExpert/prompts/frontend-design-notes.md +1 -0
package/dist/subagents/designExpert/prompts/identity.md +3 -3
package/dist/subagents/designExpert/prompts/images.md +3 -2
package/dist/subagents/designExpert/prompts/layout.md +1 -1
package/dist/subagents/productVision/prompt.md +1 -1
package/package.json +1 -1

package/dist/compiled/design.md CHANGED Viewed

@@ -43,7 +43,7 @@ Derive additional implementation colors (borders, focus states, hover states, di
 ### Typography block format
-A `` ```typography `` fenced block in a `type: design/typography` spec file declares fonts (with source URLs) and one or two anchor styles (typically Display and Body). Derive additional styles (labels, buttons, captions, overlines) from these anchors:
+A `` ```typography `` fenced block in a `type: design/typography` spec file declares fonts (with source URLs) and one or two anchor styles (typically Display and Body). Styles can include an optional `case` field (`uppercase`, `lowercase`, `capitalize`) for text-transform. Derive additional styles (labels, buttons, captions, overlines) from these anchors:
 ```typography
 fonts:
@@ -59,6 +59,7 @@ styles:
     weight: 600
     letterSpacing: -0.03em
     lineHeight: 1.1
+    case: uppercase
     description: Page titles and hero text
   Body:
     font: Satoshi

package/dist/compiled/msfm.md CHANGED Viewed

@@ -181,6 +181,7 @@ styles:
     weight: 600
     letterSpacing: -0.03em
     lineHeight: 1.1
+    case: uppercase
     description: Page titles and hero text
   Body:
     font: Satoshi

package/dist/headless.js CHANGED Viewed

@@ -1242,8 +1242,32 @@ var confirmDestructiveActionTool = {
   }
 };
-// src/subagents/sdkConsultant/index.ts
+// src/subagents/common/runCli.ts
 import { exec } from "child_process";
+function runCli(cmd, options) {
+  return new Promise((resolve) => {
+    exec(
+      cmd,
+      {
+        timeout: options?.timeout ?? 6e4,
+        maxBuffer: options?.maxBuffer ?? 1024 * 1024
+      },
+      (err, stdout, stderr) => {
+        if (stdout.trim()) {
+          resolve(stdout.trim());
+          return;
+        }
+        if (err) {
+          resolve(`Error: ${stderr.trim() || err.message}`);
+          return;
+        }
+        resolve("(no response)");
+      }
+    );
+  });
+}
+// src/subagents/sdkConsultant/index.ts
 var askMindStudioSdkTool = {
   definition: {
     name: "askMindStudioSdk",
@@ -1261,28 +1285,13 @@ var askMindStudioSdkTool = {
   },
   async execute(input) {
     const query = input.query;
-    return new Promise((resolve) => {
-      exec(
-        `mindstudio ask ${JSON.stringify(query)}`,
-        { timeout: 6e4, maxBuffer: 512 * 1024 },
-        (err, stdout, stderr) => {
-          if (stdout.trim()) {
-            resolve(stdout.trim());
-            return;
-          }
-          if (err) {
-            resolve(`Error: ${stderr.trim() || err.message}`);
-            return;
-          }
-          resolve("(no response)");
-        }
-      );
+    return runCli(`mindstudio ask ${JSON.stringify(query)}`, {
+      maxBuffer: 512 * 1024
     });
   }
 };
 // src/tools/common/fetchUrl.ts
-import { exec as exec2 } from "child_process";
 var fetchUrlTool = {
   definition: {
     name: "scapeWebUrl",
@@ -1309,29 +1318,13 @@ var fetchUrlTool = {
     if (screenshot) {
       pageOptions.screenshot = true;
     }
-    const cmd = `mindstudio scrape-url --url ${JSON.stringify(url)} --page-options ${JSON.stringify(JSON.stringify(pageOptions))} --no-meta`;
-    return new Promise((resolve) => {
-      exec2(
-        cmd,
-        { timeout: 6e4, maxBuffer: 1024 * 1024 },
-        (err, stdout, stderr) => {
-          if (stdout.trim()) {
-            resolve(stdout.trim());
-            return;
-          }
-          if (err) {
-            resolve(`Error: ${stderr.trim() || err.message}`);
-            return;
-          }
-          resolve("(no response)");
-        }
-      );
-    });
+    return runCli(
+      `mindstudio scrape-url --url ${JSON.stringify(url)} --page-options ${JSON.stringify(JSON.stringify(pageOptions))} --no-meta`
+    );
   }
 };
 // src/tools/common/searchGoogle.ts
-import { exec as exec3 } from "child_process";
 var searchGoogleTool = {
   definition: {
     name: "searchGoogle",
@@ -1349,24 +1342,10 @@ var searchGoogleTool = {
   },
   async execute(input) {
     const query = input.query;
-    const cmd = `mindstudio search-google --query ${JSON.stringify(query)} --export-type json --output-key results --no-meta`;
-    return new Promise((resolve) => {
-      exec3(
-        cmd,
-        { timeout: 6e4, maxBuffer: 512 * 1024 },
-        (err, stdout, stderr) => {
-          if (stdout.trim()) {
-            resolve(stdout.trim());
-            return;
-          }
-          if (err) {
-            resolve(`Error: ${stderr.trim() || err.message}`);
-            return;
-          }
-          resolve("(no response)");
-        }
-      );
-    });
+    return runCli(
+      `mindstudio search-google --query ${JSON.stringify(query)} --export-type json --output-key results --no-meta`,
+      { maxBuffer: 512 * 1024 }
+    );
   }
 };
@@ -1691,7 +1670,7 @@ ${unifiedDiff(input.path, content, updated)}`;
 };
 // src/tools/code/bash.ts
-import { exec as exec4 } from "child_process";
+import { exec as exec2 } from "child_process";
 var DEFAULT_TIMEOUT_MS = 12e4;
 var DEFAULT_MAX_LINES3 = 500;
 var bashTool = {
@@ -1725,7 +1704,7 @@ var bashTool = {
     const maxLines = input.maxLines === 0 ? Infinity : input.maxLines || DEFAULT_MAX_LINES3;
     const timeoutMs = input.timeout ? input.timeout * 1e3 : DEFAULT_TIMEOUT_MS;
     return new Promise((resolve) => {
-      exec4(
+      exec2(
         input.command,
         {
           timeout: timeoutMs,
@@ -1765,7 +1744,7 @@ var bashTool = {
 };
 // src/tools/code/grep.ts
-import { exec as exec5 } from "child_process";
+import { exec as exec3 } from "child_process";
 var DEFAULT_MAX = 50;
 function formatResults(stdout, max) {
   const lines = stdout.trim().split("\n");
@@ -1812,12 +1791,12 @@ var grepTool = {
     const rgCmd = `rg -n --no-heading --max-count=${max}${globFlag} '${escaped}' ${searchPath}`;
     const grepCmd = `grep -rn --max-count=${max} '${escaped}' ${searchPath} --include='*.ts' --include='*.tsx' --include='*.js' --include='*.json' --include='*.md'`;
     return new Promise((resolve) => {
-      exec5(rgCmd, { maxBuffer: 512 * 1024 }, (err, stdout) => {
+      exec3(rgCmd, { maxBuffer: 512 * 1024 }, (err, stdout) => {
         if (stdout?.trim()) {
           resolve(formatResults(stdout, max));
           return;
         }
-        exec5(grepCmd, { maxBuffer: 512 * 1024 }, (_err, grepStdout) => {
+        exec3(grepCmd, { maxBuffer: 512 * 1024 }, (_err, grepStdout) => {
           if (grepStdout?.trim()) {
             resolve(formatResults(grepStdout, max));
           } else {
@@ -2049,17 +2028,38 @@ var runMethodTool = {
 };
 // src/tools/code/screenshot.ts
+var DEFAULT_PROMPT = "Describe this app screenshot for a developer who cannot see it. What is visible on screen: the layout, content, interactive elements, any loading or error states. Be concise and factual.";
 var screenshotTool = {
   definition: {
     name: "screenshot",
-    description: "Capture a screenshot of the app preview. Returns a CDN URL with dimensions. Useful for visually checking the current state after UI changes or when debugging layout issues.",
+    description: "Capture a screenshot of the app preview and get a description of what's on screen. Optionally provide a specific question about what you're looking for.",
     inputSchema: {
       type: "object",
-      properties: {}
+      properties: {
+        prompt: {
+          type: "string",
+          description: "Optional question about the screenshot. If omitted, returns a general description of what's visible."
+        }
+      }
     }
   },
-  async execute() {
-    return "ok";
+  async execute(input) {
+    try {
+      const { url } = await sidecarRequest(
+        "/screenshot",
+        {},
+        { timeout: 3e4 }
+      );
+      const analysisPrompt = input.prompt || DEFAULT_PROMPT;
+      const analysis = await runCli(
+        `mindstudio analyze-image --prompt ${JSON.stringify(analysisPrompt)} --image-url ${JSON.stringify(url)} --output-key analysis --no-meta`
+      );
+      return `Screenshot: ${url}
+${analysis}`;
+    } catch (err) {
+      return `Error taking screenshot: ${err.message}`;
+    }
   }
 };
@@ -2413,7 +2413,6 @@ var browserAutomationTool = {
 };
 // src/subagents/designExpert/tools.ts
-import { exec as exec6 } from "child_process";
 var DESIGN_REFERENCE_PROMPT = `Analyze this website/app screenshot as a design reference. Assess:
 1) Mood/aesthetic
 2) Color palette with approximate hex values and palette strategy
@@ -2421,7 +2420,7 @@ var DESIGN_REFERENCE_PROMPT = `Analyze this website/app screenshot as a design r
 4) Layout composition (symmetric/asymmetric, grid structure, whitespace usage, content density)
 5) What makes it distinctive and interesting vs generic AI-generated interfaces
 Be specific and concise.`;
-var DESIGN_RESEARCH_TOOLS = [
+var DESIGN_EXPERT_TOOLS = [
   {
     name: "searchGoogle",
     description: "Search Google for web results. Use for finding design inspiration, font recommendations, UI patterns, real products in a domain, and reference material.",
@@ -2496,7 +2495,7 @@ var DESIGN_RESEARCH_TOOLS = [
   },
   {
     name: "generateImages",
-    description: "Generate images using AI (Seedream). Returns CDN URLs. Produces high-quality results for both photorealistic images and abstract/creative visuals. Pass multiple prompts to generate in parallel.",
+    description: "Generate images using AI (Seedream). Returns CDN URLs with a quality analysis for each image. Produces high-quality results for both photorealistic images and abstract/creative visuals. Pass multiple prompts to generate in parallel. No need to analyze images separately after generating \u2014 the analysis is included.",
     inputSchema: {
       type: "object",
       properties: {
@@ -2520,27 +2519,26 @@ var DESIGN_RESEARCH_TOOLS = [
     }
   }
 ];
-function runCli(cmd) {
-  return new Promise((resolve) => {
-    exec6(
-      cmd,
-      { timeout: 6e4, maxBuffer: 1024 * 1024 },
-      (err, stdout, stderr) => {
-        if (stdout.trim()) {
-          resolve(stdout.trim());
-          return;
-        }
-        if (err) {
-          resolve(`Error: ${stderr.trim() || err.message}`);
-          return;
-        }
-        resolve("(no response)");
-      }
-    );
-  });
-}
-async function executeDesignTool(name, input) {
+async function executeDesignExpertTool(name, input) {
   switch (name) {
+    case "screenshot": {
+      try {
+        const { url } = await sidecarRequest(
+          "/screenshot",
+          {},
+          { timeout: 3e4 }
+        );
+        const analysisPrompt = input.prompt || "Describe this app screenshot for a visual designer reviewing the current state. What is visible: layout, typography, colors, spacing, imagery. Note anything that looks broken or off. Be concise.";
+        const analysis = await runCli(
+          `mindstudio analyze-image --prompt ${JSON.stringify(analysisPrompt)} --image-url ${JSON.stringify(url)} --output-key analysis --no-meta`
+        );
+        return `Screenshot: ${url}
+${analysis}`;
+      } catch (err) {
+        return `Error taking screenshot: ${err.message}`;
+      }
+    }
     case "searchGoogle":
       return runCli(
         `mindstudio search-google --query ${JSON.stringify(input.query)} --export-type json --output-key results --no-meta`
@@ -2585,6 +2583,8 @@ ${analysis}`;
       const prompts = input.prompts;
       const width = input.width || 2048;
       const height = input.height || 2048;
+      const ANALYZE_PROMPT = "You are reviewing this image for a visual designer sourcing assets for a project. Describe: what the image depicts, the mood and color palette, how the lighting and composition work, whether there are any issues (unwanted text, artifacts, distortions), and how it could be used in a layout (hero background, feature section, card texture, etc). Be concise and practical.";
+      let imageUrls;
       if (prompts.length === 1) {
         const step = JSON.stringify({
           prompt: prompts[0],
@@ -2593,21 +2593,47 @@ ${analysis}`;
             config: { width, height }
           }
         });
-        return runCli(
+        const url = await runCli(
           `mindstudio generate-image '${step}' --output-key imageUrl --no-meta`
         );
-      }
-      const steps = prompts.map((prompt) => ({
-        stepType: "generateImage",
-        step: {
-          prompt,
-          imageModelOverride: {
-            model: "seedream-4.5",
-            config: { width, height }
+        imageUrls = [url];
+      } else {
+        const steps = prompts.map((prompt) => ({
+          stepType: "generateImage",
+          step: {
+            prompt,
+            imageModelOverride: {
+              model: "seedream-4.5",
+              config: { width, height }
+            }
           }
+        }));
+        const batchResult = await runCli(
+          `mindstudio batch '${JSON.stringify(steps)}' --no-meta`
+        );
+        try {
+          const parsed = JSON.parse(batchResult);
+          imageUrls = parsed.results.map(
+            (r) => r.output?.imageUrl ?? `Error: ${r.error}`
+          );
+        } catch {
+          return batchResult;
         }
-      }));
-      return runCli(`mindstudio batch '${JSON.stringify(steps)}' --no-meta`);
+      }
+      const analyses = await Promise.all(
+        imageUrls.map(async (url, i) => {
+          if (url.startsWith("Error")) {
+            return `Image ${i + 1}: ${url}`;
+          }
+          const analysis = await runCli(
+            `mindstudio analyze-image --prompt ${JSON.stringify(ANALYZE_PROMPT)} --image-url ${JSON.stringify(url)} --output-key analysis --no-meta`
+          );
+          return `**Image ${i + 1}:** ${url}
+Prompt: ${prompts[i]}
+Analysis: ${analysis}`;
+        })
+      );
+      return analyses.join("\n\n");
     }
     default:
       return `Error: unknown tool "${name}"`;
@@ -2757,7 +2783,7 @@ function sample(arr, n) {
   }
   return copy.slice(0, n);
 }
-function getDesignResearchPrompt() {
+function getDesignExpertPrompt() {
   const fonts = sample(fontData.fonts, 30);
   const pairings = sample(fontData.pairings, 20);
   const images = sample(inspirationImages, 15);
@@ -2811,7 +2837,7 @@ ${specContext}`;
 // src/subagents/designExpert/index.ts
 var DESCRIPTION = `
-Visual design expert. Handles fonts, colors, palettes, gradients, layouts, imagery, icons, and visual direction. Can answer from expertise alone or research the web. Returns concrete resources: hex values, font names with CSS URLs, image URLs, layout descriptions. Include app context in your task \u2014 the agent cannot see your conversation with the user.
+Visual design expert. Describe the situation and what you need \u2014 the agent decides what to deliver. It reads the spec files automatically. Include relevant user requirements and context it can't get from the spec, but do not list specific deliverables or tell it how to do its job.
 `.trim();
 var designExpertTool = {
   definition: {
@@ -2830,17 +2856,17 @@ var designExpertTool = {
   },
   async execute(input, context) {
     if (!context) {
-      return "Error: design research requires execution context";
+      return "Error: visual design expert requires execution context";
     }
     const result = await runSubAgent({
-      system: getDesignResearchPrompt(),
+      system: getDesignExpertPrompt(),
       task: input.task,
-      tools: DESIGN_RESEARCH_TOOLS,
-      externalTools: /* @__PURE__ */ new Set(["screenshot"]),
-      executeTool: executeDesignTool,
+      tools: DESIGN_EXPERT_TOOLS,
+      externalTools: /* @__PURE__ */ new Set(),
+      executeTool: executeDesignExpertTool,
       apiConfig: context.apiConfig,
       model: context.model,
-      subAgentId: "designExpert",
+      subAgentId: "visualDesignExpert",
       signal: context.signal,
       parentToolId: context.toolCallId,
       onEvent: context.onEvent,
@@ -3709,7 +3735,6 @@ var EXTERNAL_TOOLS = /* @__PURE__ */ new Set([
   "runScenario",
   "runMethod",
   "browserCommand",
-  "screenshot",
   "setProjectName"
 ]);
 function createAgentState() {
@@ -3753,6 +3778,12 @@ async function runTurn(params) {
     });
   }
   state.messages.push(userMsg);
+  const STATUS_EXCLUDED_TOOLS = /* @__PURE__ */ new Set([
+    "setProjectOnboardingState",
+    "setProjectName",
+    "clearSyncStatus",
+    "editsFinished"
+  ]);
   let lastCompletedTools = "";
   let lastCompletedResult = "";
   while (true) {
@@ -3841,7 +3872,7 @@ async function runTurn(params) {
       apiConfig,
       getContext: () => ({
         assistantText: getTextContent(contentBlocks).slice(-500),
-        lastToolName: getToolCalls(contentBlocks).at(-1)?.name || lastCompletedTools || void 0,
+        lastToolName: getToolCalls(contentBlocks).filter((tc) => !STATUS_EXCLUDED_TOOLS.has(tc.name)).at(-1)?.name || lastCompletedTools || void 0,
         lastToolResult: lastCompletedResult || void 0
       }),
       onStatus: (label) => onEvent({ type: "status", message: label }),
@@ -4000,6 +4031,28 @@ async function runTurn(params) {
       count: toolCalls.length,
       tools: toolCalls.map((tc) => tc.name)
     });
+    let subAgentText = "";
+    const origOnEvent = onEvent;
+    const wrappedOnEvent = (e) => {
+      if ("parentToolId" in e && e.parentToolId) {
+        if (e.type === "text") {
+          subAgentText = e.text;
+        } else if (e.type === "tool_start") {
+          subAgentText = `Using ${e.name}`;
+        }
+      }
+      origOnEvent(e);
+    };
+    const toolStatusWatcher = startStatusWatcher({
+      apiConfig,
+      getContext: () => ({
+        assistantText: subAgentText || getTextContent(contentBlocks).slice(-500),
+        lastToolName: toolCalls.filter((tc) => !STATUS_EXCLUDED_TOOLS.has(tc.name)).map((tc) => tc.name).join(", ") || void 0,
+        lastToolResult: lastCompletedResult || void 0
+      }),
+      onStatus: (label) => origOnEvent({ type: "status", message: label }),
+      signal
+    });
     const subAgentMessages = /* @__PURE__ */ new Map();
     const results = await Promise.all(
       toolCalls.map(async (tc) => {
@@ -4025,7 +4078,7 @@ async function runTurn(params) {
               apiConfig,
               model,
               signal,
-              onEvent,
+              onEvent: wrappedOnEvent,
               resolveExternalTool,
               toolCallId: tc.id,
               subAgentMessages
@@ -4059,15 +4112,21 @@ async function runTurn(params) {
         }
       })
     );
-    for (const [toolId, msgs] of subAgentMessages) {
+    toolStatusWatcher.stop();
+    for (const r of results) {
       const block = contentBlocks.find(
-        (b) => b.type === "tool" && b.id === toolId
+        (b) => b.type === "tool" && b.id === r.id
       );
       if (block?.type === "tool") {
-        block.subAgentMessages = msgs;
+        block.result = r.result;
+        block.isError = r.isError;
+        const msgs = subAgentMessages.get(r.id);
+        if (msgs) {
+          block.subAgentMessages = msgs;
+        }
       }
     }
-    lastCompletedTools = toolCalls.map((tc) => tc.name).join(", ");
+    lastCompletedTools = toolCalls.filter((tc) => !STATUS_EXCLUDED_TOOLS.has(tc.name)).map((tc) => tc.name).join(", ");
     lastCompletedResult = results.at(-1)?.result ?? "";
     for (const r of results) {
       state.messages.push({