npm - @mindstudio-ai/remy - Versions diffs - 0.1.198 → 0.1.199 - Mend

@mindstudio-ai/remy 0.1.198 → 0.1.199

This diff shows the differences between two publicly available versions of a package, each of which has been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (4) hide show

package/dist/headless.js +28 -6
package/dist/index.js +28 -6
package/dist/subagents/designExpert/tools/images/enhance-image-prompt.md +1 -0
package/package.json +1 -1

package/dist/headless.js CHANGED Viewed

@@ -4232,7 +4232,15 @@ var SYSTEM_PROMPT = readAsset(
   "subagents/designExpert/tools/images/enhance-image-prompt.md"
 );
 async function enhanceImagePrompt(params) {
-  const { brief, width, height, transparentBackground, onLog, model } = params;
+  const {
+    brief,
+    width,
+    height,
+    transparentBackground,
+    hasReferenceImage,
+    onLog,
+    model
+  } = params;
   const contextParts = [
     `Dimensions: ${width}x${height}${width > height ? " (landscape)" : width < height ? " (portrait)" : " (square)"}`
   ];
@@ -4241,6 +4249,11 @@ async function enhanceImagePrompt(params) {
       "Transparent background: yes \u2014 the background will be removed. Focus on the subject as an isolated element."
     );
   }
+  if (hasReferenceImage) {
+    contextParts.push(
+      "Reference image: yes \u2014 a reference image is provided to the generation model alongside this prompt to guide style, subject, or composition. Complement it; don't re-describe what it already carries."
+    );
+  }
   const context = `<context>
 ${contextParts.join("\n")}
 </context>`;
@@ -4271,6 +4284,7 @@ async function generateImageAssets(opts) {
     prompts,
     sourceImages,
     transparentBackground,
+    enhancePrompts,
     onLog,
     imageGenerationModel: genModel,
     imageAnalysisModel,
@@ -4289,19 +4303,20 @@ async function generateImageAssets(opts) {
     config.source_image = firstImage;
     config.source = firstImage;
   }
-  const isEdit = !!sourceImages?.length;
-  const enhancedPrompts = isEdit ? prompts : await Promise.all(
+  const hasReference = !!sourceImages?.length;
+  const enhancedPrompts = enhancePrompts ? await Promise.all(
     prompts.map(
       (brief) => enhanceImagePrompt({
         brief,
         width,
         height,
         transparentBackground,
+        hasReferenceImage: hasReference,
         onLog,
         model: imagePromptEnhancerModel
       })
     )
-  );
+  ) : prompts;
   let imageUrls;
   if (enhancedPrompts.length === 1) {
     const step = JSON.stringify({
@@ -4371,7 +4386,7 @@ async function generateImageAssets(opts) {
       if (url.startsWith("Error")) {
         return {
           prompt: prompts[i],
-          ...!isEdit && { enhancedPrompt: enhancedPrompts[i] },
+          ...enhancePrompts && { enhancedPrompt: enhancedPrompts[i] },
           error: url
         };
       }
@@ -4384,7 +4399,7 @@ async function generateImageAssets(opts) {
       return {
         url,
         prompt: prompts[i],
-        ...!isEdit && { enhancedPrompt: enhancedPrompts[i] },
+        ...enhancePrompts && { enhancedPrompt: enhancedPrompts[i] },
         analysis,
         width,
         height
@@ -4409,6 +4424,10 @@ var definition6 = {
         },
         description: "One or more image briefs describing what you want. Focus on subject, mood, style, and intended use \u2014 the tool optimizes your brief into a model-ready prompt automatically. Multiple briefs run in parallel."
       },
+      referenceImage: {
+        type: "string",
+        description: "Optional URL of a single reference image to guide the generation \u2014 for style, subject, character consistency, or composition. Your prompt still describes the desired result; the reference conditions it. Applies to every prompt in the batch."
+      },
       width: {
         type: "number",
         description: "Image width in pixels. Default 2048. Range: 2048-4096."
@@ -4431,6 +4450,8 @@ async function execute6(input, onLog, context) {
     width: input.width,
     height: input.height,
     transparentBackground: input.transparentBackground,
+    sourceImages: input.referenceImage ? [input.referenceImage] : void 0,
+    enhancePrompts: true,
     onLog,
     imageGenerationModel: resolveModel(
       "imageGeneration",
@@ -4500,6 +4521,7 @@ async function execute7(input, onLog, context) {
     width: input.width,
     height: input.height,
     transparentBackground: input.transparentBackground,
+    enhancePrompts: false,
     onLog,
     imageGenerationModel: resolveModel(
       "imageGeneration",

package/dist/index.js CHANGED Viewed

@@ -4957,7 +4957,15 @@ var init_screenshot3 = __esm({
 // src/subagents/designExpert/tools/images/enhancePrompt.ts
 async function enhanceImagePrompt(params) {
-  const { brief, width, height, transparentBackground, onLog, model } = params;
+  const {
+    brief,
+    width,
+    height,
+    transparentBackground,
+    hasReferenceImage,
+    onLog,
+    model
+  } = params;
   const contextParts = [
     `Dimensions: ${width}x${height}${width > height ? " (landscape)" : width < height ? " (portrait)" : " (square)"}`
   ];
@@ -4966,6 +4974,11 @@ async function enhanceImagePrompt(params) {
       "Transparent background: yes \u2014 the background will be removed. Focus on the subject as an isolated element."
     );
   }
+  if (hasReferenceImage) {
+    contextParts.push(
+      "Reference image: yes \u2014 a reference image is provided to the generation model alongside this prompt to guide style, subject, or composition. Complement it; don't re-describe what it already carries."
+    );
+  }
   const context = `<context>
 ${contextParts.join("\n")}
 </context>`;
@@ -5006,6 +5019,7 @@ async function generateImageAssets(opts) {
     prompts,
     sourceImages,
     transparentBackground,
+    enhancePrompts,
     onLog,
     imageGenerationModel: genModel,
     imageAnalysisModel,
@@ -5024,19 +5038,20 @@ async function generateImageAssets(opts) {
     config.source_image = firstImage;
     config.source = firstImage;
   }
-  const isEdit = !!sourceImages?.length;
-  const enhancedPrompts = isEdit ? prompts : await Promise.all(
+  const hasReference = !!sourceImages?.length;
+  const enhancedPrompts = enhancePrompts ? await Promise.all(
     prompts.map(
       (brief) => enhanceImagePrompt({
         brief,
         width,
         height,
         transparentBackground,
+        hasReferenceImage: hasReference,
         onLog,
         model: imagePromptEnhancerModel
       })
     )
-  );
+  ) : prompts;
   let imageUrls;
   if (enhancedPrompts.length === 1) {
     const step = JSON.stringify({
@@ -5106,7 +5121,7 @@ async function generateImageAssets(opts) {
       if (url.startsWith("Error")) {
         return {
           prompt: prompts[i],
-          ...!isEdit && { enhancedPrompt: enhancedPrompts[i] },
+          ...enhancePrompts && { enhancedPrompt: enhancedPrompts[i] },
           error: url
         };
       }
@@ -5119,7 +5134,7 @@ async function generateImageAssets(opts) {
       return {
         url,
         prompt: prompts[i],
-        ...!isEdit && { enhancedPrompt: enhancedPrompts[i] },
+        ...enhancePrompts && { enhancedPrompt: enhancedPrompts[i] },
         analysis,
         width,
         height
@@ -5151,6 +5166,8 @@ async function execute6(input, onLog, context) {
     width: input.width,
     height: input.height,
     transparentBackground: input.transparentBackground,
+    sourceImages: input.referenceImage ? [input.referenceImage] : void 0,
+    enhancePrompts: true,
     onLog,
     imageGenerationModel: resolveModel(
       "imageGeneration",
@@ -5189,6 +5206,10 @@ var init_generateImages = __esm({
             },
             description: "One or more image briefs describing what you want. Focus on subject, mood, style, and intended use \u2014 the tool optimizes your brief into a model-ready prompt automatically. Multiple briefs run in parallel."
           },
+          referenceImage: {
+            type: "string",
+            description: "Optional URL of a single reference image to guide the generation \u2014 for style, subject, character consistency, or composition. Your prompt still describes the desired result; the reference conditions it. Applies to every prompt in the batch."
+          },
           width: {
             type: "number",
             description: "Image width in pixels. Default 2048. Range: 2048-4096."
@@ -5221,6 +5242,7 @@ async function execute7(input, onLog, context) {
     width: input.width,
     height: input.height,
     transparentBackground: input.transparentBackground,
+    enhancePrompts: false,
     onLog,
     imageGenerationModel: resolveModel(
       "imageGeneration",

package/dist/subagents/designExpert/tools/images/enhance-image-prompt.md CHANGED Viewed

@@ -41,6 +41,7 @@ You'll receive context about the generation parameters. Use them:
 - **Dimensions**: If the image is wide (landscape), compose horizontally. If tall (portrait), compose vertically. If square, center the subject.
 - **Transparent background**: The background will be removed after generation and the image will be trimmed to the subject bounds (no extra padding). Don't describe elaborate backgrounds — focus on the subject. Describe it as an isolated element.
+- **Reference image**: When a reference image is provided, the generation model receives it alongside your prompt to guide style, subject, or composition. Write the prompt to *complement* the reference, not duplicate it: describe the scene, action, and anything new or changed, and lean on the reference for what it already establishes (a specific face, product, logo, or art style). Don't exhaustively re-describe those — over-specifying competes with the reference image and can distort it.
 ## Photography prompts

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@mindstudio-ai/remy",
-  "version": "0.1.198",
+  "version": "0.1.199",
   "description": "MindStudio coding agent",
   "repository": {
     "type": "git",