npm - @nomad-e/bluma-cli - Versions diffs - 0.1.58 → 0.1.59 - Mend

@nomad-e/bluma-cli 0.1.58 → 0.1.59

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10) hide show

package/README.md +2 -2
package/dist/config/native_tools.json +3 -3
package/dist/config/skills/git-pr/SKILL.md +1 -1
package/dist/config/skills/pdf/SKILL.md +153 -22
package/dist/config/skills/pdf/scripts/__pycache__/create_report.cpython-312.pyc +0 -0
package/dist/config/skills/pdf/scripts/create_report.py +607 -209
package/dist/config/skills/pdf/scripts/merge_pdfs.py +1 -1
package/dist/config/skills/skill-creator/SKILL.md +1 -1
package/dist/main.js +59 -6
package/package.json +1 -1

package/dist/config/skills/pdf/scripts/merge_pdfs.py CHANGED Viewed

@@ -3,7 +3,7 @@ Merge multiple PDF files into a single output PDF.
 Usage:
     python merge_pdfs.py --output merged.pdf file1.pdf file2.pdf file3.pdf
-    python merge_pdfs.py --output ./artifacts/combined.pdf *.pdf
+    python merge_pdfs.py --output ./.bluma/artifacts/combined.pdf *.pdf
 """
 import argparse
 import sys

package/dist/config/skills/skill-creator/SKILL.md CHANGED Viewed

@@ -193,7 +193,7 @@ Example script header:
 {description of what this script does}
 Usage:
-    python {script_name}.py --input data.csv --output ./artifacts/result.pdf
+    python {script_name}.py --input data.csv --output ./.bluma/artifacts/result.pdf
 """
 import argparse
 ```

package/dist/main.js CHANGED Viewed

@@ -113,6 +113,20 @@ function isPathInsideWorkspace(targetPath, policy = getSandboxPolicy()) {
   const relative = path6.relative(policy.workspaceRoot, resolved);
   return relative === "" || !relative.startsWith("..") && !path6.isAbsolute(relative);
 }
+function redirectTopLevelArtifactsPath(resolvedAbsolute, workspaceRoot) { // Maps <workspaceRoot>/artifacts[/...] to <workspaceRoot>/.bluma/artifacts[/...]; any other path is returned as its resolved absolute form.
+  const wr = path6.resolve(workspaceRoot); // normalized workspace root
+  const abs = path6.resolve(resolvedAbsolute); // normalized target path
+  const rel = path6.relative(wr, abs); // target expressed relative to the workspace root
+  if (rel.startsWith("..") || path6.isAbsolute(rel)) { // relative form climbs out of the root (or is itself absolute): not a remap candidate
+    return abs;
+  }
+  const segments = rel.split(path6.sep).filter((s) => s.length > 0); // path components below the root, empty pieces dropped
+  if (segments.length === 0 || segments[0] !== "artifacts") { // target is the root itself, or its first component is not exactly "artifacts"
+    return abs;
+  }
+  const tail = segments.slice(1); // everything below the top-level "artifacts" directory
+  return tail.length > 0 ? path6.join(wr, ".bluma", "artifacts", ...tail) : path6.join(wr, ".bluma", "artifacts"); // re-root the same tail under .bluma/artifacts
+}
 function resolveWorkspacePath(inputPath, policy = getSandboxPolicy()) {
   const candidate = path6.isAbsolute(inputPath) ? path6.resolve(inputPath) : path6.resolve(policy.workspaceRoot, inputPath);
   if (policy.isSandbox && !isPathInsideWorkspace(candidate, policy)) {
@@ -120,7 +134,7 @@ function resolveWorkspacePath(inputPath, policy = getSandboxPolicy()) {
       `Path "${inputPath}" escapes the sandbox workspace root ${policy.workspaceRoot}`
     );
   }
-  return candidate;
+  return redirectTopLevelArtifactsPath(candidate, policy.workspaceRoot);
 }
 function resolveCommandCwd(cwd, policy = getSandboxPolicy()) {
   const base = cwd ? path6.resolve(cwd) : policy.workspaceRoot;
@@ -8519,10 +8533,16 @@ var AdvancedFeedbackSystem = class {
         score: penalty,
         message: "You are attempting a direct message without a tool_call. All replies must contain tool_call.",
         correction: `
-         ## PROTOCOL VIOLATION \u2014 SERIOUS
-            You are sending a direct response without tool_call, which is strictly prohibited.
-            PENALTY APPLIED: ${penalty.toFixed(1)} points deducted.
-            You MUST always use tool_call without exception.
+## PROTOCOL VIOLATION \u2014 STOP WRITING PLAIN ASSISTANT TEXT
+You streamed or returned **user-visible markdown as assistant content** instead of using the **\`message\` tool**. That is prohibited and **does not end the turn** \u2014 the runtime will loop until timeout.
+Do this **immediately** in your next step (single tool call, no prose outside tools):
+- Call **\`message\`** with **\`message_type\`: \`"result"\`**, put the user-facing summary in **\`content\`**, and put deliverable paths in **\`attachments\`** (absolute paths).
+Do **not** repeat the same summary as plain assistant text again.
+PENALTY APPLIED: ${penalty.toFixed(1)} points deducted.
           `.trim()
       };
     }
@@ -9945,6 +9965,7 @@ The \\\`message\\\` tool has TWO types \u2014 use them CORRECTLY:
 - **Use when**: Task is complete, artifacts ready for delivery
 - **Use ONCE per turn** \u2014 only at the very end
 - **Ends the turn** \u2014 agent waits for next input
+- **CRITICAL:** Plain assistant markdown (streaming or not) **does not** end the worker or close the HTTP job \u2014 only a \\\`message\\\` tool call with \\\`message_type: "result"\\\` does. If you only write text in chat, the process loops until **timeout** (e.g. 300s).
 #### \u274C WRONG: Using "info" to ask questions
 \\\`\\\`\\\`typescript
@@ -10063,6 +10084,7 @@ You (Bluma):
 - **Sandbox is safe** - You can't break the host system
 - **But workspace matters** - Don't pollute /workspace with junk files
+- **Deliverables path** - Never use a top-level \`./artifacts/\` folder in the job root; use \`./.bluma/artifacts/\` (or the \`artifacts_dir\` from \`task_boundary\`). Shell redirects must use that path \u2014 \`file_write\` remaps \`artifacts/...\` to \`.bluma/artifacts/...\` automatically.
 - **Clean up after yourself** - Remove temporary files when done
 - **Respect session boundaries** - Stay in your session workspace
@@ -10288,6 +10310,10 @@ Auto-generated map (may be stale after pull/install). Confirm with tools before
 <<<BLUMA_WORKSPACE_SNAPSHOT_BODY>>>
 </workspace_snapshot>
+<deliverables>
+**Local and sandbox:** generated artifacts (reports, PDFs, exports, plans you attach) must live under \`<workdir>/.bluma/\` \u2014 use \`.bluma/artifacts/\` (or the \`artifacts_dir\` path returned by \`task_boundary\` after starting a task). Do **not** create a top-level \`./artifacts/\` folder in the project root. \`file_write\` / \`edit_tool\` / \`read_file_lines\` automatically remap \`artifacts/...\` \u2192 \`.bluma/artifacts/...\`. For \`shell_command\` redirects (\`>\` / \`>>\`), target \`.bluma/artifacts/...\` explicitly.
+</deliverables>
 <coding_memory>
 Persistent store (~/.bluma/coding_memory.json). Do not invent entries: \`list\` / \`search\` if unsure. \`<coding_memory_snapshot>\` is bootstrap only \u2014 after add/update/remove, list or search again. Operations: add | list | search | update (id) | remove (id), one mutating call at a time.
 </coding_memory>
@@ -10313,7 +10339,7 @@ Output is truncated (~30KB / ~200 lines); use head/tail or write to a file. Use
 The user **only** sees chat content you send through the \`message\` tool (\`content\` as Markdown). Bare assistant text is **not** a substitute \u2014 **you should use \`message\` liberally**.
 **Types**
-- \`message_type: "result"\` \u2014 **ends the turn**: final answer, deliverable, or a **question** that needs a user reply; then the agent waits for the user.
+- \`message_type: "result"\` \u2014 **ends the turn**: final answer, deliverable, or a **question** that needs a user reply; then the agent waits for the user. **Sandbox/worker:** only this stops the job; writing markdown as normal assistant output does **not** finish the task and can cause a **timeout loop**.
 - \`message_type: "info"\` \u2014 **non-terminal**: shown in chat, does **not** end the turn. **Expected behavior:** call \`info\` **multiple times** in a single turn whenever there is something worth saying (even briefly). Under-using \`info\` is a **mistake** in this product.
 **\u26A0\uFE0F CRITICAL: "info" is for INFORMATION ONLY \u2014 NEVER for asking questions**
@@ -11449,6 +11475,8 @@ var BluMaAgent = class {
   factorRouterTurnClosed = false;
   /** Passos seguidos sem tool_calls nem texto visível (só raciocínio) — evita loop lento no mesmo turno. */
   emptyAssistantReplySteps = 0;
+  /** Passos seguidos com texto do assistente sem tool_calls (violação de protocolo) — evita loop até timeout do job. */
+  directTextProtocolSteps = 0;
   constructor(sessionId, eventBus, llm, mcpClient, feedbackSystem) {
     this.sessionId = sessionId;
     this.eventBus = eventBus;
@@ -11592,6 +11620,7 @@ var BluMaAgent = class {
     const userContent = buildUserMessageContent(inputText, process.cwd());
     this.history.push({ role: "user", content: userContent });
     this.emptyAssistantReplySteps = 0;
+    this.directTextProtocolSteps = 0;
     this.eventBus.emit(
       "backend_message",
       buildTurnStartBackendMessage({
@@ -12149,6 +12178,7 @@ ${editData.error.display}`;
     this.history.push(normalizedMessage);
     if (normalizedMessage.tool_calls && normalizedMessage.tool_calls.length > 0) {
       this.emptyAssistantReplySteps = 0;
+      this.directTextProtocolSteps = 0;
       const validToolCalls = normalizedMessage.tool_calls.filter(
         (call) => ToolCallNormalizer.isValidToolCall(call)
       );
@@ -12188,9 +12218,20 @@ ${editData.error.display}`;
       }
     } else if (trimmedText) {
       this.emptyAssistantReplySteps = 0;
+      this.directTextProtocolSteps += 1;
+      const MAX_DIRECT_TEXT_PROTOCOL = 3;
       if (!hasEmittedStart) {
         this.eventBus.emit("backend_message", { type: "assistant_message", content: accumulatedContent });
       }
+      if (this.directTextProtocolSteps >= MAX_DIRECT_TEXT_PROTOCOL) {
+        this.eventBus.emit("backend_message", {
+          type: "error",
+          message: 'Agent kept answering with plain assistant text instead of the `message` tool with message_type "result". Turn forcibly closed to avoid job timeout; fix prompts or model routing.'
+        });
+        await this.notifyFactorTurnEndIfNeeded("protocol_direct_text_exhausted");
+        this.emitTurnCompleted();
+        return;
+      }
       const feedback = this.feedbackSystem.generateFeedback({
         event: "protocol_violation_direct_text",
         details: { violationContent: accumulatedContent }
@@ -12226,6 +12267,7 @@ ${editData.error.display}`;
     this.history.push(message2);
     if (message2.tool_calls && message2.tool_calls.length > 0) {
       this.emptyAssistantReplySteps = 0;
+      this.directTextProtocolSteps = 0;
       const validToolCalls = message2.tool_calls.filter(
         (call) => ToolCallNormalizer.isValidToolCall(call)
       );
@@ -12265,7 +12307,18 @@ ${editData.error.display}`;
       }
     } else if (typeof message2.content === "string" && message2.content.trim()) {
       this.emptyAssistantReplySteps = 0;
+      this.directTextProtocolSteps += 1;
+      const MAX_DIRECT_TEXT_PROTOCOL = 3;
       this.eventBus.emit("backend_message", { type: "assistant_message", content: message2.content });
+      if (this.directTextProtocolSteps >= MAX_DIRECT_TEXT_PROTOCOL) {
+        this.eventBus.emit("backend_message", {
+          type: "error",
+          message: 'Agent kept answering with plain assistant text instead of the `message` tool with message_type "result". Turn forcibly closed to avoid job timeout.'
+        });
+        await this.notifyFactorTurnEndIfNeeded("protocol_direct_text_exhausted");
+        this.emitTurnCompleted();
+        return;
+      }
       const feedback = this.feedbackSystem.generateFeedback({
         event: "protocol_violation_direct_text",
         details: { violationContent: message2.content }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
 	"name": "@nomad-e/bluma-cli",
-	"version": "0.1.58",
+	"version": "0.1.59",
 	"description": "BluMa independent agent for automation and advanced software engineering.",
 	"author": "Alex Fonseca",
 	"license": "Apache-2.0",