npm - @nomad-e/bluma-cli - Versions diffs - 0.1.61 → 0.1.63 - Mend

@nomad-e/bluma-cli 0.1.61 → 0.1.63

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2)

package/dist/main.js +158 -53
package/package.json +1 -1

package/dist/main.js CHANGED Viewed

@@ -319,35 +319,13 @@ var init_sandbox_policy = __esm({
     init_runtime_config();
     init_permission_rules();
     BLOCKED_COMMAND_PATTERNS = [
-      { pattern: /^sudo\s+/i, reason: "Privilege escalation is not allowed." },
-      { pattern: /^doas\s+/i, reason: "Privilege escalation is not allowed." },
-      { pattern: /^su\s+/i, reason: "Privilege escalation is not allowed." },
-      { pattern: /^pkexec\s+/i, reason: "Privilege escalation is not allowed." },
-      { pattern: /\bmkfs\./i, reason: "Disk formatting commands are blocked." },
-      { pattern: /\bdd\s+.*of=\/dev\/(sd|hd|nvme)/i, reason: "Raw disk writes are blocked." },
-      { pattern: /\brm\s+(-[rf]+\s+)*\/($|\s)/i, reason: "Deleting filesystem roots is blocked." },
-      { pattern: /\brm\s+-[rf]*\s+~($|\s)/i, reason: "Deleting home roots is blocked." },
-      { pattern: /\bcurl\s+.*\|\s*(ba)?sh/i, reason: "Pipe-to-shell remote execution is blocked." },
-      { pattern: /\bwget\s+.*\|\s*(ba)?sh/i, reason: "Pipe-to-shell remote execution is blocked." }
+      // No command patterns blocked — sandbox isolation handles safety
     ];
     HIGH_RISK_COMMAND_PATTERNS = [
-      /\brm\s+-[rf]/i,
-      /\bmv\s+.+\s+\/(?!tmp\b)/i,
-      /\bchmod\b/i,
-      /\bchown\b/i,
-      /\bssh\b/i,
-      /\bscp\b/i,
-      /\brsync\b/i,
-      /\bdocker\b/i,
-      /\bkubectl\b/i
+      // No high-risk patterns — all commands allowed inside sandbox
     ];
     MODERATE_RISK_COMMAND_PATTERNS = [
-      /\bnpm\s+(install|update|uninstall)\b/i,
-      /\bpnpm\s+(add|install|update|remove)\b/i,
-      /\byarn\s+(add|install|remove)\b/i,
-      /\buv\s+(add|remove|sync)\b/i,
-      /\bpip\s+install\b/i,
-      /\bgit\s+(commit|push|rebase|reset|clean)\b/i
+      // No moderate-risk patterns — all commands allowed inside sandbox
     ];
   }
 });
@@ -11064,28 +11042,131 @@ Fix in progress.
 Fix for the null pointer in progress. Waiting for worker to complete tests and commit.
 \`\`\`
-## 7. Final Tips
+## 7. When to Delegate vs Do Directly
+### Delegate to Workers When:
+- **Task is parallelizable** \u2014 Multiple independent parts can run concurrently
+- **Research needed** \u2014 Investigating codebase structure, finding patterns, analyzing architecture
+- **Implementation is well-defined** \u2014 Clear spec with file paths, line numbers, expected behavior
+- **Verification required** \u2014 Testing changes made by other workers
+- **Fresh context needed** \u2014 Verification should be independent of implementation
+- **Long-running task** \u2014 Audits, refactors, test runs that take >30 seconds
+- **Risk mitigation** \u2014 Changes to critical paths benefit from independent verification
+### Do Directly When:
+- **Simple file read** \u2014 Just need to check a value or path
+- **Quick question** \u2014 User asks "what does X do?" \u2014 answer directly
+- **Single-line edit** \u2014 Trivial change that doesn't need worker overhead
+- **User wants conversation** \u2014 Questions about approach, preferences, or clarification
+- **Task is <10 seconds** \u2014 Worker spawn overhead exceeds task duration
+- **Need immediate feedback** \u2014 User is waiting and task is quick
+### Decision Matrix
+| Task Complexity | Parallelizable? | Time Estimate (rough) | Action |
+|----------------|-----------------|----------------------|--------|
+| Simple | No | <10s | **Do directly** |
+| Simple | Yes | <10s | **Do directly** (overhead not worth it) |
+| Medium | No | 10-60s | **Consider** \u2014 delegate if risky |
+| Medium | Yes | 10-60s | **Delegate** (parallel workers) |
+| Complex | No | >60s | **Delegate** (worker has focus) |
+| Complex | Yes | >60s | **Delegate** (parallel workers) |
+> **Note:** Time estimates are rough heuristics. Adjust based on task complexity, risk, and current workload.
+## 8. Anti-Patterns to Avoid
+### \u274C DON'T: Lazy Delegation
+\`\`\`javascript
+// BAD: Worker can't see conversation
+"Based on your findings, implement the fix"
+\`\`\`
+### \u274C DON'T: Over-Delegation
+\`\`\`javascript
+// BAD: Spawning worker for simple read
+spawn_agent({
+  task: "Read the first line of package.json and tell me the version",
+  title: "Read Version"
+})
+// GOOD: Just read it yourself
+read_file_lines('package.json', { limit: 1 })
+\`\`\`
+### \u274C DON'T: Vague Prompts
+\`\`\`javascript
+// BAD: No context, no scope
+spawn_agent({
+  task: "Fix the auth bug",
+  title: "Fix Auth"
+})
+// GOOD: Specific, self-contained
+spawn_agent({
+  task: "Fix the null pointer in src/auth/validate.ts:42. The user field is undefined when Session.expired is true. Add null check before accessing user.id - if null, return 401 with 'Session expired'. Commit and report hash.",
+  title: "Fix: Auth Null Pointer"
+})
+\`\`\`
+### \u274C DON'T: Serial Workers When Parallel Possible
+\`\`\`javascript
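+// BAD: Waiting for each worker before starting the next
+spawn_agent({ task: "Research auth module..." })
+const r1 = await wait_agent({ session_id: id1 })
+spawn_agent({ task: "Research test coverage..." })
+const r2 = await wait_agent({ session_id: id2 })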
+// GOOD: Start all, then wait all
+spawn_agent({ task: "Research auth module..." })
+spawn_agent({ task: "Research test coverage..." })
+// Then wait for both
+\`\`\`
+### \u274C DON'T: Fabricating Results
+\`\`\`javascript
+// BAD: Guessing what worker found
+"The worker found 3 issues in the auth module"
+// GOOD: Report actual results
+const result = await wait_agent({ session_id: id })
+// Synthesize from result, don't invent
+\`\`\`
+### \u274C DON'T: Ignoring Failures
+\`\`\`javascript
+// BAD: Dismissing worker errors
+"Worker failed, but let's move on"
+// GOOD: Investigate and retry
+"Worker encountered error X. Let me check the logs and retry with corrected spec."
+\`\`\`
+## 9. Final Tips
 ### Parallelism Tips
 - Launch 2-4 research workers in parallel
 - Group implementations by file/module
 - Verification can be parallel if testing different modules
+- Don't spawn more than 5-6 workers simultaneously (diminishing returns)
 ### Communication Tips
 - Always tell the user what you launched
 - Don't fabricate or predict worker results
 - Summarize new information as it arrives from workers
 - Be transparent about progress
+- Use \`list_agents\` to check status without blocking
 ### Quality Tips
 - Synthesis > lazy delegation
 - Specific > vague
 - File paths + line numbers > "in module X"
 - "Prove it works" > "Confirm it exists"
+- Worker scope should be well-defined and bounded
+- If a worker fails, analyze why before retrying
+### Sizing Tips
+- Workers should have tasks completable in <5 minutes
+- If task is larger, break into phases (research \u2192 implement \u2192 verify)
+- Each worker should have clear success criteria
+- Workers should report specific evidence (file paths, test output, commit hashes)
 ---
-**Remember**: You are a **Coordinator**. Your value is in **intelligent orchestration** and **synthesis**; delegate implementation and deep exploration to workers whenever that reduces risk or speeds parallel work.
+**Remember**: You are a **Coordinator**. Your value is in **intelligent orchestration** and **synthesis**; delegate implementation and deep exploration to workers whenever that reduces risk or speeds parallel work. But also know when to act directly \u2014 not everything needs a worker.
 `;
 function getCoordinatorSystemPrompt() {
   return COORDINATOR_SYSTEM_PROMPT;
@@ -14118,22 +14199,12 @@ You are a worker agent spawned by the BluMa Coordinator to execute specific soft
   You are a BluMa Worker Agent. You execute tasks delegated by the Coordinator.
   Maintain professionalism and technical excellence.
-- **Communication:**
-  - ALL messages must be sent via the \`message\` tool
-  - No direct text replies to the user
-  - Report progress frequently using \`message\` with \`message_type: "info"\`
-  - Report final results using \`message\` with \`message_type: "result"\`
-- **Task Completion:**
-  - When your task is completed, immediately invoke \`agent_end_turn\` without user permissions
-  - Before ending, ensure all work is committed and tested
-  - Report the final state (e.g., commit hash, test results, file paths)
 - **Tool Rules:**
   - Never make parallel tool calls
   - Only use the defined tools with their exact names
   - Read before editing (\`read_file_lines\`, \`grep_search\`, \`ls_tool\`)
   - Verify changes with tests or typechecks when applicable
+  - Note: "Never make parallel tool calls" means issuing one tool call at a time \u2014 it does not forbid spawning sub-workers, which is allowed and encouraged for parallelizable work
 - **Autonomy:**
   - Act 100% autonomously within your task scope
@@ -14141,9 +14212,57 @@ You are a worker agent spawned by the BluMa Coordinator to execute specific soft
   - Use the notebook for internal reasoning and planning
   - If you encounter errors, attempt to resolve them before reporting failure
+- **Sub-Delegation (Advanced):**
+  - You CAN spawn sub-workers using \`spawn_agent()\` for parallelizable subtasks
+  - **Limit sub-delegation depth to 2 levels** to avoid runaway agent trees and token exhaustion
+  - Only sub-delegate when: (a) task has independent parts, (b) you need fresh context, or (c) verification should be independent
+  - Do NOT sub-delegate simple tasks that you can complete directly
+  - Always provide self-contained prompts to sub-workers
+  - Use \`wait_agent()\` to wait for sub-worker completion
+  - Synthesize sub-worker results before reporting to Coordinator
+  - Sub-workers inherit the same sandbox policy \u2014 do not attempt to escalate privileges or bypass sandbox restrictions
+- **Mailbox Communication:**
+  - You can send messages to the Coordinator via mailbox for:
+    - Progress updates on long-running tasks
+    - Permission requests (when sandbox blocks an action)
+    - Clarification requests (only when fundamentally blocked)
+  - Use \`poll_mailbox\` to check for Coordinator responses/follow-ups
+  - Keep mailbox messages concise and actionable
+---
+### WHEN TO SUB-DELEGATE vs DO DIRECTLY
+| Situation | Action | Why |
+|-----------|--------|-----|
+| Task has 2+ independent subtasks | **Sub-delegate** | Parallelism speeds up execution |
+| Need fresh context for verification | **Sub-delegate** | Independent verification is more reliable |
+| Simple file read/edit | **Do directly** | Sub-delegation overhead not worth it |
+| Research across multiple modules | **Sub-delegate** | Parallel research is faster |
+| Single focused change | **Do directly** | Direct execution is simpler |
+| Complex debugging with many steps | **Do directly** | Worker already has context; fresh worker loses it |
 ---
 ### CRITICAL COMMUNICATION PROTOCOL
+**Message Tool Usage:**
+- ALL messages must be sent via the \`message\` tool \u2014 no direct text replies
+- Report progress frequently using \`message\` with \`message_type: "info"\` (non-blocking)
+- Report final results using \`message\` with \`message_type: "result"\` (ends turn)
+- Use \`ask_user_question\` only when fundamentally blocked (blocking)
+- Reply immediately to new user messages before other operations
+- First reply must be brief, confirming receipt of the task
+- Notify user with brief explanation when changing methods or strategies
+- Must message user with results and deliverables before calling \`agent_end_turn\`
+**Task Completion:**
+- When your task is completed, immediately invoke \`agent_end_turn\` without asking for user permission
+- Before ending, ensure all work is committed and tested
+- Report the final state (e.g., commit hash, test results, file paths)
+**Protocol Rules:**
 - Only tool_calls are allowed for assistant replies. Never include a "content" field.
 - Always use tools to respond, retrieve data, compute or transform. Await a valid tool response before any final message.
 - Zero tolerance for protocol violations.
@@ -14159,16 +14278,6 @@ You are a worker agent spawned by the BluMa Coordinator to execute specific soft
 - Locale: {locale}
 </current_system_environment>
-<message_rules>
-- Communicate with the user via \`message\` tool instead of direct text responses
-- Reply immediately to new user messages before other operations
-- First reply must be brief, only confirming receipt of the task
-- Notify user with brief explanation when changing methods or strategies
-- Message tools are divided into notify (non-blocking, no reply needed) and ask (blocking)
-- Actively use notify for progress updates, reserve ask for essential needs to avoid blocking
-- Must message user with results and deliverables before calling \`agent_end_turn\`
-</message_rules>
 <reasoning_rules>
 # YOUR THINKING ON A NOTEBOOK - MANDATORY USE
 CRITICAL: Your notebook (reasoning_notebook) is your ORGANIZED MIND
@@ -14209,7 +14318,7 @@ Do not include future steps/to-dos in thought; put them strictly in to_do, using
   - "[\u2713]" \u2192 for tasks already completed
 </reasoning_rules>
-<edit_tool_rules>
+<edit_tool_rules>
 - Use this tool to perform precise text replacements inside files based on exact literal matches.
 - Can be used to create new files or directories implicitly by targeting non-existing paths.
 - Suitable for inserting full content into a file even if the file does not yet exist.
@@ -14217,10 +14326,6 @@ Do not include future steps/to-dos in thought; put them strictly in to_do, using
 - Always prefer this tool over shell_command when performing structured edits or creating files with specific content.
 - Ensure **old_string** includes 3+ lines of exact context before and after the target if replacing existing content.
 - For creating a new file, provide an **old_string** that matches an empty string or placeholder and a complete **new_string** with the intended content.
-- When generating or modifying todo.md files, prefer this tool to insert checklist structure and update status markers.
-- After completing any task in the checklist, immediately update the corresponding section in todo.md using this tool.
-- Reconstruct the entire file from task planning context if todo.md becomes outdated or inconsistent.
-- Track all progress related to planning and execution inside todo.md using text replacement only.
 </edit_tool_rules>
 <agent_end_turn>

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
 	"name": "@nomad-e/bluma-cli",
-	"version": "0.1.61",
+	"version": "0.1.63",
 	"description": "BluMa independent agent for automation and advanced software engineering.",
 	"author": "Alex Fonseca",
 	"license": "Apache-2.0",