npm - @probelabs/probe - Versions diffs - 0.6.0-rc277 → 0.6.0-rc279 - Mend

@probelabs/probe 0.6.0-rc277 → 0.6.0-rc279

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23)

package/bin/binaries/probe-v0.6.0-rc279-aarch64-apple-darwin.tar.gz +0 -0
package/bin/binaries/probe-v0.6.0-rc279-aarch64-unknown-linux-musl.tar.gz +0 -0
package/bin/binaries/probe-v0.6.0-rc279-x86_64-apple-darwin.tar.gz +0 -0
package/bin/binaries/probe-v0.6.0-rc279-x86_64-pc-windows-msvc.zip +0 -0
package/bin/binaries/{probe-v0.6.0-rc277-x86_64-unknown-linux-musl.tar.gz → probe-v0.6.0-rc279-x86_64-unknown-linux-musl.tar.gz} +0 -0
package/build/agent/ProbeAgent.js +63 -11
package/build/agent/index.js +129 -33
package/build/agent/shared/prompts.js +30 -8
package/build/delegate.js +40 -11
package/build/tools/analyzeAll.js +8 -4
package/build/tools/vercel.js +7 -4
package/cjs/agent/ProbeAgent.cjs +132 -34
package/cjs/index.cjs +129 -33
package/package.json +1 -1
package/src/agent/ProbeAgent.js +63 -11
package/src/agent/shared/prompts.js +30 -8
package/src/delegate.js +40 -11
package/src/tools/analyzeAll.js +8 -4
package/src/tools/vercel.js +7 -4
package/bin/binaries/probe-v0.6.0-rc277-aarch64-apple-darwin.tar.gz +0 -0
package/bin/binaries/probe-v0.6.0-rc277-aarch64-unknown-linux-musl.tar.gz +0 -0
package/bin/binaries/probe-v0.6.0-rc277-x86_64-apple-darwin.tar.gz +0 -0
package/bin/binaries/probe-v0.6.0-rc277-x86_64-pc-windows-msvc.zip +0 -0

package/cjs/index.cjs CHANGED Viewed

@@ -36120,7 +36120,7 @@ ${taskManager.formatTasksForPrompt()}`;
     }
   };
 }
-var taskItemSchema, taskSchema, taskSystemPrompt, taskGuidancePrompt;
+var taskItemSchema, taskSchema, taskSystemPrompt;
 var init_taskTool = __esm({
   "src/agent/tasks/taskTool.js"() {
     "use strict";
@@ -36181,11 +36181,6 @@ Tasks = logical units of work, not files or steps.
 - Circular dependencies are rejected
 - attempt_completion is blocked while tasks remain unresolved
 `;
-    taskGuidancePrompt = `Does this request have MULTIPLE DISTINCT GOALS?
-- "Do A AND B AND C" (multiple goals) \u2192 Create tasks for each goal
-- "Investigate/explain/find X" (single goal) \u2192 Skip tasks, just answer directly
-Multiple internal steps for ONE goal = NO tasks needed.
-If creating tasks, use the task tool with action="create" first.`;
   }
 });
@@ -82671,8 +82666,20 @@ If the solution is clear, you can jump to implementation right away. If not, ask
 - Check imports and existing utilities before creating new helpers \u2014 the project may already have what you need.
 # Task Planning
-- If the task tool is available, use it to break complex work into milestones before starting implementation.
-- Stay flexible \u2014 if your understanding changes mid-task, add, remove, or reorganize tasks as needed. The plan should serve you, not constrain you.
+When the request has **multiple distinct goals** (e.g. "Fix bug A AND add feature B"), use the task tool to track them:
+- Call the task tool with action="create" and a tasks array. Each task must have an "id" field.
+- Update task status to "in_progress" when starting and "completed" when done.
+- All tasks must be completed or cancelled before calling attempt_completion.
+- Stay flexible \u2014 add, remove, or reorganize tasks as your understanding changes.
+Do NOT create tasks for single-goal requests, even complex ones. Multiple internal steps for one goal (search, read, analyze, implement) do not need tasks.
+# Discovering Project Commands
+Before building or testing, determine the project's toolchain:
+- Check for Makefile, package.json (scripts), Cargo.toml, go.mod, pyproject.toml, or similar
+- Look for CI config (.github/workflows/, .gitlab-ci.yml) to see what commands CI runs
+- Read README for build/test instructions if the above are unclear
+- Common patterns: \`make build\`/\`make test\`, \`npm run build\`/\`npm test\`, \`cargo build\`/\`cargo test\`, \`go build ./...\`/\`go test ./...\`, \`python -m pytest\`
 # During Implementation
 - Always create a new branch before making changes to the codebase.
@@ -82683,12 +82690,22 @@ If the solution is clear, you can jump to implementation right away. If not, ask
 - When editing files, keep edits focused and minimal. For changes spanning more than a few lines, prefer line-targeted editing (start_line/end_line) over text replacement (old_string) \u2014 it constrains scope and prevents accidental removal of adjacent content. Never include unrelated sections in an edit operation.
 - After every significant change, verify the project still builds and passes linting. Do not wait until the end to discover breakage.
-# After Implementation
-- Verify the project builds successfully. If it doesn't, fix the build before moving on.
-- Run lint and typecheck commands if known for the project. Fix any new warnings or errors you introduced.
-- Add tests for any new or changed functionality. Tests must cover the main path and important edge cases.
-- Run the project's full test suite. If any tests fail (including pre-existing ones you may have broken), fix them before finishing.
-- When the task is done, respond to the user with a concise summary of what was implemented, what files were changed, and any relevant details. Include links (e.g. pull request URL) so the user has everything they need.
+# Writing Tests
+Every change must include tests. Before writing them:
+- Find existing test files for the module you changed \u2014 look in \`tests/\`, \`__tests__/\`, \`*_test.go\`, \`*.test.js\`, \`*.spec.ts\`, or co-located test modules (\`#[cfg(test)]\` in Rust).
+- Read those tests to understand the project's testing patterns: framework, assertion style, mocking approach, file naming, test organization.
+- Prefer extending an existing test file over creating a new one when your change is in the same module.
+- Write tests that cover the main path and important edge cases. Include a failing-input test when relevant.
+- When fixing a bug, write a failing test first that reproduces the bug, then fix the code to make it pass.
+# Verify Changes
+Before committing or creating a PR, run through this checklist:
+1. **Build** \u2014 run the project-appropriate build command (go build, npm run build, cargo build, make, etc.). Fix any compilation errors.
+2. **Lint & typecheck** \u2014 run linter/formatter if the project has one (eslint, clippy, golangci-lint, etc.). Fix any new warnings.
+3. **Test** \u2014 run the full test suite (go test ./..., npm test, cargo test, make test, pytest, etc.). Fix any failures, including pre-existing tests you may have broken.
+4. **Review** \u2014 re-read your diff. Ensure no debug code, no unrelated changes, no secrets, no missing files.
+Do NOT skip verification. Do NOT proceed to PR creation with a broken build or failing tests.
 # GitHub Integration
 - Use the \`gh\` CLI for all GitHub operations: issues, pull requests, checks, releases.
@@ -105948,8 +105965,23 @@ __export(ProbeAgent_exports, {
   ENGINE_ACTIVITY_TIMEOUT_DEFAULT: () => ENGINE_ACTIVITY_TIMEOUT_DEFAULT,
   ENGINE_ACTIVITY_TIMEOUT_MAX: () => ENGINE_ACTIVITY_TIMEOUT_MAX,
   ENGINE_ACTIVITY_TIMEOUT_MIN: () => ENGINE_ACTIVITY_TIMEOUT_MIN,
-  ProbeAgent: () => ProbeAgent
+  ProbeAgent: () => ProbeAgent,
+  debugLogToolResults: () => debugLogToolResults,
+  debugTruncate: () => debugTruncate
 });
+function debugTruncate(s5, limit = 200) {
+  if (s5.length <= limit) return s5;
+  const half = Math.floor(limit / 2);
+  return s5.substring(0, half) + ` ... [${s5.length} chars] ... ` + s5.substring(s5.length - half);
+}
+function debugLogToolResults(toolResults) {
+  if (!toolResults || toolResults.length === 0) return;
+  for (const tr of toolResults) {
+    const argsStr = JSON.stringify(tr.args || {});
+    const resultStr = typeof tr.result === "string" ? tr.result : JSON.stringify(tr.result || "");
+    console.log(`[DEBUG]   tool: ${tr.toolName} | args: ${debugTruncate(argsStr)} | result: ${debugTruncate(resultStr)}`);
+  }
+}
 var import_dotenv, import_anthropic2, import_openai2, import_google2, import_ai4, import_crypto8, import_events4, import_fs10, import_promises6, import_path15, ENGINE_ACTIVITY_TIMEOUT_DEFAULT, ENGINE_ACTIVITY_TIMEOUT_MIN, ENGINE_ACTIVITY_TIMEOUT_MAX, MAX_TOOL_ITERATIONS, MAX_HISTORY_MESSAGES, MAX_IMAGE_FILE_SIZE, ProbeAgent;
 var init_ProbeAgent = __esm({
   "src/agent/ProbeAgent.js"() {
@@ -106069,6 +106101,7 @@ var init_ProbeAgent = __esm({
         this.enableExecutePlan = !!options.enableExecutePlan;
         this.debug = options.debug || process.env.DEBUG === "1";
         this.cancelled = false;
+        this._abortController = new AbortController();
         this.tracer = options.tracer || null;
         this.outline = !!options.outline;
         this.searchDelegate = options.searchDelegate !== void 0 ? !!options.searchDelegate : true;
@@ -106514,6 +106547,8 @@ var init_ProbeAgent = __esm({
           searchDelegateModel: this.searchDelegateModel,
           delegationManager: this.delegationManager,
           // Per-instance delegation limits
+          parentAbortSignal: this._abortController.signal,
+          // Propagate cancellation to delegations
           outputBuffer: this._outputBuffer,
           concurrencyLimiter: this.concurrencyLimiter,
           // Global AI concurrency limiter
@@ -106961,6 +106996,15 @@ var init_ProbeAgent = __esm({
         }
         const controller = new AbortController();
         const timeoutState = { timeoutId: null };
+        if (this._abortController.signal.aborted) {
+          controller.abort();
+        } else {
+          const onAgentAbort = () => controller.abort();
+          this._abortController.signal.addEventListener("abort", onAgentAbort, { once: true });
+          controller.signal.addEventListener("abort", () => {
+            this._abortController.signal.removeEventListener("abort", onAgentAbort);
+          }, { once: true });
+        }
         if (this.maxOperationTimeout && this.maxOperationTimeout > 0) {
           timeoutState.timeoutId = setTimeout(() => {
             controller.abort();
@@ -107264,7 +107308,8 @@ var init_ProbeAgent = __esm({
                     allowEdit: this.allowEdit,
                     allowedTools: allowedToolsForDelegate,
                     debug: this.debug,
-                    tracer: this.tracer
+                    tracer: this.tracer,
+                    parentAbortSignal: this._abortController.signal
                   };
                   if (this.debug) {
                     console.log(`[DEBUG] Executing delegate tool`);
@@ -108426,12 +108471,6 @@ You are working with a workspace. Available paths: ${workspaceDesc}
           });
           const systemMessage = await this.getSystemMessage();
           let userMessage = { role: "user", content: message.trim() };
-          if (this.enableTasks) {
-            userMessage.content = userMessage.content + "\n\n" + taskGuidancePrompt;
-            if (this.debug) {
-              console.log("[DEBUG] Task guidance injected into user message");
-            }
-          }
           if (options.schema && !options._schemaFormatted) {
             const schemaInstructions = generateSchemaInstructions(options.schema, { debug: this.debug });
             userMessage.content = message.trim() + schemaInstructions;
@@ -108587,6 +108626,10 @@ You are working with a workspace. Available paths: ${workspaceDesc}
             completionResult = result;
             completionAttempted = true;
           }, toolContext);
+          if (this.debug) {
+            const toolNames = Object.keys(tools2);
+            console.log(`[DEBUG] Agent tools registered (${toolNames.length}): ${toolNames.join(", ")}`);
+          }
           let maxResponseTokens = this.maxResponseTokens;
           if (!maxResponseTokens) {
             maxResponseTokens = 4e3;
@@ -108626,6 +108669,7 @@ You are working with a workspace. Available paths: ${workspaceDesc}
                   }
                   if (this.debug) {
                     console.log(`[DEBUG] Step ${currentIteration}/${maxIterations} finished (reason: ${finishReason}, tools: ${toolResults?.length || 0})`);
+                    debugLogToolResults(toolResults);
                   }
                 }
               };
@@ -108782,6 +108826,7 @@ Double-check your response based on the criteria above. If everything looks good
                   }
                   if (this.debug) {
                     console.log(`[DEBUG] Completion prompt step finished (reason: ${finishReason}, tools: ${toolResults?.length || 0})`);
+                    debugLogToolResults(toolResults);
                   }
                 }
               };
@@ -109492,6 +109537,9 @@ Convert your previous response content into actual JSON data that follows this s
        * Clean up resources (including MCP connections)
        */
       async cleanup() {
+        if (!this._abortController.signal.aborted) {
+          this._abortController.abort();
+        }
         if (this.mcpBridge) {
           try {
             await this.mcpBridge.cleanup();
@@ -109515,14 +109563,25 @@ Convert your previous response content into actual JSON data that follows this s
         this.clearHistory();
       }
       /**
-       * Cancel the current request
+       * Cancel the current request and all in-flight delegations.
+       * Aborts the internal AbortController so streamText, subagents,
+       * and any code checking the signal will stop.
        */
       cancel() {
         this.cancelled = true;
+        this._abortController.abort();
         if (this.debug) {
           console.log(`[DEBUG] Agent cancelled for session ${this.sessionId}`);
         }
       }
+      /**
+       * Get the abort signal for this agent.
+       * Delegations and subagents should check this signal.
+       * @returns {AbortSignal}
+       */
+      get abortSignal() {
+        return this._abortController.signal;
+      }
     };
   }
 });
@@ -109555,12 +109614,17 @@ async function delegate({
   mcpConfigPath = null,
   delegationManager = null,
   // Optional per-instance manager, falls back to default singleton
-  concurrencyLimiter = null
+  concurrencyLimiter = null,
   // Optional global AI concurrency limiter
+  parentAbortSignal = null
+  // Optional AbortSignal from parent to cancel this delegation
 }) {
   if (!task || typeof task !== "string") {
     throw new Error("Task parameter is required and must be a string");
   }
+  if (parentAbortSignal?.aborted) {
+    throw new Error("Delegation cancelled: parent operation was aborted");
+  }
   const hasExplicitTimeout = Object.prototype.hasOwnProperty.call(arguments?.[0] ?? {}, "timeout");
   if (!hasExplicitTimeout) {
     const envTimeoutMs = parseInt(process.env.DELEGATION_TIMEOUT_MS || "", 10);
@@ -109645,12 +109709,37 @@ async function delegate({
     }
     const timeoutPromise = new Promise((_, reject2) => {
       timeoutId = setTimeout(() => {
+        subagent.cancel();
         reject2(new Error(`Delegation timed out after ${timeout} seconds`));
       }, timeout * 1e3);
     });
+    let parentAbortHandler;
+    const parentAbortPromise = new Promise((_, reject2) => {
+      if (parentAbortSignal) {
+        if (parentAbortSignal.aborted) {
+          subagent.cancel();
+          reject2(new Error("Delegation cancelled: parent operation was aborted"));
+          return;
+        }
+        parentAbortHandler = () => {
+          subagent.cancel();
+          reject2(new Error("Delegation cancelled: parent operation was aborted"));
+        };
+        parentAbortSignal.addEventListener("abort", parentAbortHandler, { once: true });
+      }
+    });
     const answerOptions = schema ? { schema } : void 0;
     const answerPromise = answerOptions ? subagent.answer(task, [], answerOptions) : subagent.answer(task);
-    const response = await Promise.race([answerPromise, timeoutPromise]);
+    const racers = [answerPromise, timeoutPromise];
+    if (parentAbortSignal) racers.push(parentAbortPromise);
+    let response;
+    try {
+      response = await Promise.race(racers);
+    } finally {
+      if (parentAbortHandler && parentAbortSignal) {
+        parentAbortSignal.removeEventListener("abort", parentAbortHandler);
+      }
+    }
     if (timeoutId !== null) {
       clearTimeout(timeoutId);
       timeoutId = null;
@@ -110063,8 +110152,9 @@ Instructions:
       promptType: "code-researcher",
       allowedTools: ["extract"],
       maxIterations: 5,
-      delegationManager: options.delegationManager
+      delegationManager: options.delegationManager,
       // Per-instance delegation limits
+      parentAbortSignal: options.parentAbortSignal || null
       // timeout removed - inherit default from delegate (300s)
     });
     return { chunk, result };
@@ -110163,8 +110253,9 @@ Organize all findings into clear categories with items listed under each.${compl
       promptType: "code-researcher",
       allowedTools: [],
       maxIterations: 5,
-      delegationManager: options.delegationManager
+      delegationManager: options.delegationManager,
       // Per-instance delegation limits
+      parentAbortSignal: options.parentAbortSignal || null
       // timeout removed - inherit default from delegate (300s)
     });
     return result;
@@ -110228,8 +110319,9 @@ CRITICAL: Do NOT guess keywords. Actually run searches and see what returns resu
       promptType: "code-researcher",
       // Full tool access for exploration and experimentation
       maxIterations: 15,
-      delegationManager: options.delegationManager
+      delegationManager: options.delegationManager,
       // Per-instance delegation limits
+      parentAbortSignal: options.parentAbortSignal || null
       // timeout removed - inherit default from delegate (300s)
     });
     const plan = parsePlanningResult(stripResultTags(result));
@@ -110286,8 +110378,9 @@ When done, use the attempt_completion tool with your answer as the result.`;
       promptType: "code-researcher",
       allowedTools: [],
       maxIterations: 5,
-      delegationManager: options.delegationManager
+      delegationManager: options.delegationManager,
       // Per-instance delegation limits
+      parentAbortSignal: options.parentAbortSignal || null
       // timeout removed - inherit default from delegate (300s)
     });
     return stripResultTags(result);
@@ -110735,7 +110828,8 @@ var init_vercel = __esm({
               promptType: "code-searcher",
               allowedTools: ["search", "extract", "listFiles", "attempt_completion"],
               searchDelegate: false,
-              schema: CODE_SEARCH_SCHEMA
+              schema: CODE_SEARCH_SCHEMA,
+              parentAbortSignal: options.parentAbortSignal || null
             });
             const delegateResult = options.tracer?.withSpan ? await options.tracer.withSpan("search.delegate", runDelegation, {
               "search.query": searchQuery,
@@ -110949,7 +111043,7 @@ var init_vercel = __esm({
         name: "delegate",
         description: delegateDescription,
         inputSchema: delegateSchema,
-        execute: async ({ task, currentIteration, maxIterations, parentSessionId, path: path9, provider, model, tracer, searchDelegate }) => {
+        execute: async ({ task, currentIteration, maxIterations, parentSessionId, path: path9, provider, model, tracer, searchDelegate, parentAbortSignal }) => {
           if (!task || typeof task !== "string") {
             throw new Error("Task parameter is required and must be a non-empty string");
           }
@@ -111007,8 +111101,9 @@ var init_vercel = __esm({
             enableMcp,
             mcpConfig,
             mcpConfigPath,
-            delegationManager
+            delegationManager,
             // Per-instance delegation limits
+            parentAbortSignal
           });
           return result;
         }
@@ -111046,8 +111141,9 @@ var init_vercel = __esm({
               provider: options.provider,
               model: options.model,
               tracer: options.tracer,
-              delegationManager
+              delegationManager,
               // Per-instance delegation limits
+              parentAbortSignal: options.parentAbortSignal || null
             });
             return result;
           } catch (error2) {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@probelabs/probe",
-  "version": "0.6.0-rc277",
+  "version": "0.6.0-rc279",
   "description": "Node.js wrapper for the probe code search tool",
   "main": "src/index.js",
   "module": "src/index.js",

package/src/agent/ProbeAgent.js CHANGED Viewed

@@ -104,7 +104,6 @@ import {
   TaskManager,
   createTaskTool,
   taskSystemPrompt,
-  taskGuidancePrompt,
   createTaskCompletionBlockedMessage
 } from './tasks/index.js';
 import { z } from 'zod';
@@ -126,6 +125,27 @@ const MAX_HISTORY_MESSAGES = 100;
 // Maximum image file size (20MB) to prevent OOM attacks
 const MAX_IMAGE_FILE_SIZE = 20 * 1024 * 1024;
+/**
+ * Truncate a string for debug logging, showing first and last portion.
+ */
+export function debugTruncate(s, limit = 200) {
+  if (s.length <= limit) return s;
+  const half = Math.floor(limit / 2);
+  return s.substring(0, half) + ` ... [${s.length} chars] ... ` + s.substring(s.length - half);
+}
+/**
+ * Log tool results details for debug output.
+ */
+export function debugLogToolResults(toolResults) {
+  if (!toolResults || toolResults.length === 0) return;
+  for (const tr of toolResults) {
+    const argsStr = JSON.stringify(tr.args || {});
+    const resultStr = typeof tr.result === 'string' ? tr.result : JSON.stringify(tr.result || '');
+    console.log(`[DEBUG]   tool: ${tr.toolName} | args: ${debugTruncate(argsStr)} | result: ${debugTruncate(resultStr)}`);
+  }
+}
 /**
  * ProbeAgent class to handle AI interactions with code search capabilities
  */
@@ -194,6 +214,7 @@ export class ProbeAgent {
     this.enableExecutePlan = !!options.enableExecutePlan;
     this.debug = options.debug || process.env.DEBUG === '1';
     this.cancelled = false;
+    this._abortController = new AbortController();
     this.tracer = options.tracer || null;
     this.outline = !!options.outline;
     this.searchDelegate = options.searchDelegate !== undefined ? !!options.searchDelegate : true;
@@ -793,6 +814,7 @@ export class ProbeAgent {
       searchDelegateProvider: this.searchDelegateProvider,
       searchDelegateModel: this.searchDelegateModel,
       delegationManager: this.delegationManager,  // Per-instance delegation limits
+      parentAbortSignal: this._abortController.signal,  // Propagate cancellation to delegations
       outputBuffer: this._outputBuffer,
       concurrencyLimiter: this.concurrencyLimiter,  // Global AI concurrency limiter
       isToolAllowed,
@@ -1363,6 +1385,19 @@ export class ProbeAgent {
     const controller = new AbortController();
     const timeoutState = { timeoutId: null };
+    // Link agent-level abort to this operation's controller
+    // so that cancel() / cleanup() stops the current streamText call
+    if (this._abortController.signal.aborted) {
+      controller.abort();
+    } else {
+      const onAgentAbort = () => controller.abort();
+      this._abortController.signal.addEventListener('abort', onAgentAbort, { once: true });
+      // Clean up listener when this controller aborts (from any source)
+      controller.signal.addEventListener('abort', () => {
+        this._abortController.signal.removeEventListener('abort', onAgentAbort);
+      }, { once: true });
+    }
     // Set up overall operation timeout (default 5 minutes)
     if (this.maxOperationTimeout && this.maxOperationTimeout > 0) {
       timeoutState.timeoutId = setTimeout(() => {
@@ -1730,7 +1765,8 @@ export class ProbeAgent {
                 allowEdit: this.allowEdit,
                 allowedTools: allowedToolsForDelegate,
                 debug: this.debug,
-                tracer: this.tracer
+                tracer: this.tracer,
+                parentAbortSignal: this._abortController.signal
               };
               if (this.debug) {
@@ -3153,14 +3189,6 @@ Follow these instructions carefully:
       // Create user message with optional image support
       let userMessage = { role: 'user', content: message.trim() };
-      // START CHECKPOINT: Inject task guidance if tasks are enabled
-      if (this.enableTasks) {
-        userMessage.content = userMessage.content + '\n\n' + taskGuidancePrompt;
-        if (this.debug) {
-          console.log('[DEBUG] Task guidance injected into user message');
-        }
-      }
       // If schema is provided, prepend JSON format requirement to user message
       if (options.schema && !options._schemaFormatted) {
         const schemaInstructions = generateSchemaInstructions(options.schema, { debug: this.debug });
@@ -3378,6 +3406,11 @@ Follow these instructions carefully:
         completionAttempted = true;
       }, toolContext);
+      if (this.debug) {
+        const toolNames = Object.keys(tools);
+        console.log(`[DEBUG] Agent tools registered (${toolNames.length}): ${toolNames.join(', ')}`);
+      }
       let maxResponseTokens = this.maxResponseTokens;
       if (!maxResponseTokens) {
         maxResponseTokens = 4000;
@@ -3427,6 +3460,7 @@ Follow these instructions carefully:
               if (this.debug) {
                 console.log(`[DEBUG] Step ${currentIteration}/${maxIterations} finished (reason: ${finishReason}, tools: ${toolResults?.length || 0})`);
+                debugLogToolResults(toolResults);
               }
             }
           };
@@ -3638,6 +3672,7 @@ Double-check your response based on the criteria above. If everything looks good
               }
               if (this.debug) {
                 console.log(`[DEBUG] Completion prompt step finished (reason: ${finishReason}, tools: ${toolResults?.length || 0})`);
+                debugLogToolResults(toolResults);
               }
             }
           };
@@ -4554,6 +4589,11 @@ Convert your previous response content into actual JSON data that follows this s
    * Clean up resources (including MCP connections)
    */
   async cleanup() {
+    // Abort any in-flight operations (delegations, streaming, etc.)
+    if (!this._abortController.signal.aborted) {
+      this._abortController.abort();
+    }
     // Clean up MCP bridge
     if (this.mcpBridge) {
       try {
@@ -4583,12 +4623,24 @@ Convert your previous response content into actual JSON data that follows this s
   }
   /**
-   * Cancel the current request
+   * Cancel the current request and all in-flight delegations.
+   * Aborts the internal AbortController so streamText, subagents,
+   * and any code checking the signal will stop.
    */
   cancel() {
     this.cancelled = true;
+    this._abortController.abort();
     if (this.debug) {
       console.log(`[DEBUG] Agent cancelled for session ${this.sessionId}`);
     }
   }
+  /**
+   * Get the abort signal for this agent.
+   * Delegations and subagents should check this signal.
+   * @returns {AbortSignal}
+   */
+  get abortSignal() {
+    return this._abortController.signal;
+  }
 }

package/src/agent/shared/prompts.js CHANGED Viewed

@@ -81,8 +81,20 @@ If the solution is clear, you can jump to implementation right away. If not, ask
 - Check imports and existing utilities before creating new helpers — the project may already have what you need.
 # Task Planning
-- If the task tool is available, use it to break complex work into milestones before starting implementation.
-- Stay flexible — if your understanding changes mid-task, add, remove, or reorganize tasks as needed. The plan should serve you, not constrain you.
+When the request has **multiple distinct goals** (e.g. "Fix bug A AND add feature B"), use the task tool to track them:
+- Call the task tool with action="create" and a tasks array. Each task must have an "id" field.
+- Update task status to "in_progress" when starting and "completed" when done.
+- All tasks must be completed or cancelled before calling attempt_completion.
+- Stay flexible — add, remove, or reorganize tasks as your understanding changes.
+Do NOT create tasks for single-goal requests, even complex ones. Multiple internal steps for one goal (search, read, analyze, implement) do not need tasks.
+# Discovering Project Commands
+Before building or testing, determine the project's toolchain:
+- Check for Makefile, package.json (scripts), Cargo.toml, go.mod, pyproject.toml, or similar
+- Look for CI config (.github/workflows/, .gitlab-ci.yml) to see what commands CI runs
+- Read README for build/test instructions if the above are unclear
+- Common patterns: \`make build\`/\`make test\`, \`npm run build\`/\`npm test\`, \`cargo build\`/\`cargo test\`, \`go build ./...\`/\`go test ./...\`, \`python -m pytest\`
 # During Implementation
 - Always create a new branch before making changes to the codebase.
@@ -93,12 +105,22 @@ If the solution is clear, you can jump to implementation right away. If not, ask
 - When editing files, keep edits focused and minimal. For changes spanning more than a few lines, prefer line-targeted editing (start_line/end_line) over text replacement (old_string) — it constrains scope and prevents accidental removal of adjacent content. Never include unrelated sections in an edit operation.
 - After every significant change, verify the project still builds and passes linting. Do not wait until the end to discover breakage.
-# After Implementation
-- Verify the project builds successfully. If it doesn't, fix the build before moving on.
-- Run lint and typecheck commands if known for the project. Fix any new warnings or errors you introduced.
-- Add tests for any new or changed functionality. Tests must cover the main path and important edge cases.
-- Run the project's full test suite. If any tests fail (including pre-existing ones you may have broken), fix them before finishing.
-- When the task is done, respond to the user with a concise summary of what was implemented, what files were changed, and any relevant details. Include links (e.g. pull request URL) so the user has everything they need.
+# Writing Tests
+Every change must include tests. Before writing them:
+- Find existing test files for the module you changed — look in \`tests/\`, \`__tests__/\`, \`*_test.go\`, \`*.test.js\`, \`*.spec.ts\`, or co-located test modules (\`#[cfg(test)]\` in Rust).
+- Read those tests to understand the project's testing patterns: framework, assertion style, mocking approach, file naming, test organization.
+- Prefer extending an existing test file over creating a new one when your change is in the same module.
+- Write tests that cover the main path and important edge cases. Include a failing-input test when relevant.
+- When fixing a bug, write a failing test first that reproduces the bug, then fix the code to make it pass.
+# Verify Changes
+Before committing or creating a PR, run through this checklist:
+1. **Build** — run the project-appropriate build command (go build, npm run build, cargo build, make, etc.). Fix any compilation errors.
+2. **Lint & typecheck** — run linter/formatter if the project has one (eslint, clippy, golangci-lint, etc.). Fix any new warnings.
+3. **Test** — run the full test suite (go test ./..., npm test, cargo test, make test, pytest, etc.). Fix any failures, including pre-existing tests you may have broken.
+4. **Review** — re-read your diff. Ensure no debug code, no unrelated changes, no secrets, no missing files.
+Do NOT skip verification. Do NOT proceed to PR creation with a broken build or failing tests.
 # GitHub Integration
 - Use the \`gh\` CLI for all GitHub operations: issues, pull requests, checks, releases.

package/src/delegate.js CHANGED Viewed

@@ -386,12 +386,18 @@ export async function delegate({
 	mcpConfig = null,
 	mcpConfigPath = null,
 	delegationManager = null,  // Optional per-instance manager, falls back to default singleton
-	concurrencyLimiter = null  // Optional global AI concurrency limiter
+	concurrencyLimiter = null,  // Optional global AI concurrency limiter
+	parentAbortSignal = null   // Optional AbortSignal from parent to cancel this delegation
 }) {
 	if (!task || typeof task !== 'string') {
 		throw new Error('Task parameter is required and must be a string');
 	}
+	// Check if parent has already been cancelled
+	if (parentAbortSignal?.aborted) {
+		throw new Error('Delegation cancelled: parent operation was aborted');
+	}
 	// Support runtime timeout override via environment variables when timeout not explicitly passed
 	// This allows operators to configure delegation timeouts without code changes
 	// Priority: DELEGATION_TIMEOUT_MS (milliseconds) > DELEGATION_TIMEOUT_SECONDS > DELEGATION_TIMEOUT (seconds)
@@ -481,24 +487,47 @@ export async function delegate({
 			console.error(`[DELEGATE] Subagent config: promptType=${promptType}, enableDelegate=false, maxIterations=${remainingIterations}`);
 		}
-		// Set up timeout with proper cleanup
-		// TODO: Implement AbortController support in ProbeAgent.answer() for proper cancellation
-		// Current limitation: When timeout occurs, subagent.answer() continues running in background
-		// This is acceptable since:
-		// 1. The promise will eventually resolve/reject and be garbage collected
-		// 2. The delegation slot is properly released on timeout
-		// 3. The parent receives timeout error and can handle it
-		// Future improvement: Add signal parameter to ProbeAgent.answer(task, [], { signal })
+		// Set up timeout and parent abort handling.
+		// When timeout fires or parent aborts, we cancel the subagent so it
+		// stops making API calls and releases resources promptly.
 		const timeoutPromise = new Promise((_, reject) => {
 			timeoutId = setTimeout(() => {
+				subagent.cancel();
 				reject(new Error(`Delegation timed out after ${timeout} seconds`));
 			}, timeout * 1000);
 		});
-		// Execute the task with timeout
+		// Listen for parent abort signal
+		let parentAbortHandler;
+		const parentAbortPromise = new Promise((_, reject) => {
+			if (parentAbortSignal) {
+				if (parentAbortSignal.aborted) {
+					subagent.cancel();
+					reject(new Error('Delegation cancelled: parent operation was aborted'));
+					return;
+				}
+				parentAbortHandler = () => {
+					subagent.cancel();
+					reject(new Error('Delegation cancelled: parent operation was aborted'));
+				};
+				parentAbortSignal.addEventListener('abort', parentAbortHandler, { once: true });
+			}
+		});
+		// Execute the task with timeout and parent abort
 		const answerOptions = schema ? { schema } : undefined;
 		const answerPromise = answerOptions ? subagent.answer(task, [], answerOptions) : subagent.answer(task);
-		const response = await Promise.race([answerPromise, timeoutPromise]);
+		const racers = [answerPromise, timeoutPromise];
+		if (parentAbortSignal) racers.push(parentAbortPromise);
+		let response;
+		try {
+			response = await Promise.race(racers);
+		} finally {
+			// Clean up parent abort listener to prevent memory leaks
+			if (parentAbortHandler && parentAbortSignal) {
+				parentAbortSignal.removeEventListener('abort', parentAbortHandler);
+			}
+		}
 		// Clear timeout immediately after race completes to prevent memory leak
 		// Note: timeoutId is always set by this point (synchronous in Promise constructor)