npm - attocode - Versions diffs - 0.2.1 → 0.2.2 - Mend

attocode 0.2.1 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (148)

package/CHANGELOG.md +91 -1
package/README.md +7 -0
package/dist/src/adapters.d.ts +6 -1
package/dist/src/adapters.d.ts.map +1 -1
package/dist/src/adapters.js +8 -1
package/dist/src/adapters.js.map +1 -1
package/dist/src/agent.d.ts +35 -4
package/dist/src/agent.d.ts.map +1 -1
package/dist/src/agent.js +361 -45
package/dist/src/agent.js.map +1 -1
package/dist/src/defaults.d.ts +1 -1
package/dist/src/defaults.d.ts.map +1 -1
package/dist/src/defaults.js +2 -0
package/dist/src/defaults.js.map +1 -1
package/dist/src/integrations/agent-registry.d.ts +2 -0
package/dist/src/integrations/agent-registry.d.ts.map +1 -1
package/dist/src/integrations/agent-registry.js.map +1 -1
package/dist/src/integrations/async-subagent.d.ts +135 -0
package/dist/src/integrations/async-subagent.d.ts.map +1 -0
package/dist/src/integrations/async-subagent.js +213 -0
package/dist/src/integrations/async-subagent.js.map +1 -0
package/dist/src/integrations/auto-checkpoint.d.ts +98 -0
package/dist/src/integrations/auto-checkpoint.d.ts.map +1 -0
package/dist/src/integrations/auto-checkpoint.js +252 -0
package/dist/src/integrations/auto-checkpoint.js.map +1 -0
package/dist/src/integrations/complexity-classifier.d.ts +86 -0
package/dist/src/integrations/complexity-classifier.d.ts.map +1 -0
package/dist/src/integrations/complexity-classifier.js +233 -0
package/dist/src/integrations/complexity-classifier.js.map +1 -0
package/dist/src/integrations/delegation-protocol.d.ts +86 -0
package/dist/src/integrations/delegation-protocol.d.ts.map +1 -0
package/dist/src/integrations/delegation-protocol.js +127 -0
package/dist/src/integrations/delegation-protocol.js.map +1 -0
package/dist/src/integrations/dynamic-budget.d.ts +81 -0
package/dist/src/integrations/dynamic-budget.d.ts.map +1 -0
package/dist/src/integrations/dynamic-budget.js +151 -0
package/dist/src/integrations/dynamic-budget.js.map +1 -0
package/dist/src/integrations/economics.d.ts +44 -1
package/dist/src/integrations/economics.d.ts.map +1 -1
package/dist/src/integrations/economics.js +182 -3
package/dist/src/integrations/economics.js.map +1 -1
package/dist/src/integrations/environment-facts.d.ts +52 -0
package/dist/src/integrations/environment-facts.d.ts.map +1 -0
package/dist/src/integrations/environment-facts.js +84 -0
package/dist/src/integrations/environment-facts.js.map +1 -0
package/dist/src/integrations/index.d.ts +16 -1
package/dist/src/integrations/index.d.ts.map +1 -1
package/dist/src/integrations/index.js +31 -1
package/dist/src/integrations/index.js.map +1 -1
package/dist/src/integrations/injection-budget.d.ts +71 -0
package/dist/src/integrations/injection-budget.d.ts.map +1 -0
package/dist/src/integrations/injection-budget.js +136 -0
package/dist/src/integrations/injection-budget.js.map +1 -0
package/dist/src/integrations/mcp-client.d.ts.map +1 -1
package/dist/src/integrations/mcp-client.js +14 -0
package/dist/src/integrations/mcp-client.js.map +1 -1
package/dist/src/integrations/mcp-custom-tools.d.ts +102 -0
package/dist/src/integrations/mcp-custom-tools.d.ts.map +1 -0
package/dist/src/integrations/mcp-custom-tools.js +232 -0
package/dist/src/integrations/mcp-custom-tools.js.map +1 -0
package/dist/src/integrations/mcp-tool-validator.d.ts +60 -0
package/dist/src/integrations/mcp-tool-validator.d.ts.map +1 -0
package/dist/src/integrations/mcp-tool-validator.js +141 -0
package/dist/src/integrations/mcp-tool-validator.js.map +1 -0
package/dist/src/integrations/self-improvement.d.ts +90 -0
package/dist/src/integrations/self-improvement.d.ts.map +1 -0
package/dist/src/integrations/self-improvement.js +217 -0
package/dist/src/integrations/self-improvement.js.map +1 -0
package/dist/src/integrations/smart-decomposer.d.ts +4 -0
package/dist/src/integrations/smart-decomposer.d.ts.map +1 -1
package/dist/src/integrations/smart-decomposer.js +55 -28
package/dist/src/integrations/smart-decomposer.js.map +1 -1
package/dist/src/integrations/subagent-output-store.d.ts +91 -0
package/dist/src/integrations/subagent-output-store.d.ts.map +1 -0
package/dist/src/integrations/subagent-output-store.js +257 -0
package/dist/src/integrations/subagent-output-store.js.map +1 -0
package/dist/src/integrations/swarm/index.d.ts +1 -1
package/dist/src/integrations/swarm/index.d.ts.map +1 -1
package/dist/src/integrations/swarm/index.js +1 -1
package/dist/src/integrations/swarm/index.js.map +1 -1
package/dist/src/integrations/swarm/model-selector.d.ts +1 -0
package/dist/src/integrations/swarm/model-selector.d.ts.map +1 -1
package/dist/src/integrations/swarm/model-selector.js +37 -3
package/dist/src/integrations/swarm/model-selector.js.map +1 -1
package/dist/src/integrations/swarm/swarm-config-loader.d.ts +10 -1
package/dist/src/integrations/swarm/swarm-config-loader.d.ts.map +1 -1
package/dist/src/integrations/swarm/swarm-config-loader.js +72 -6
package/dist/src/integrations/swarm/swarm-config-loader.js.map +1 -1
package/dist/src/integrations/swarm/swarm-event-bridge.d.ts.map +1 -1
package/dist/src/integrations/swarm/swarm-event-bridge.js +26 -4
package/dist/src/integrations/swarm/swarm-event-bridge.js.map +1 -1
package/dist/src/integrations/swarm/swarm-events.d.ts +11 -0
package/dist/src/integrations/swarm/swarm-events.d.ts.map +1 -1
package/dist/src/integrations/swarm/swarm-events.js +4 -0
package/dist/src/integrations/swarm/swarm-events.js.map +1 -1
package/dist/src/integrations/swarm/swarm-orchestrator.d.ts +11 -0
package/dist/src/integrations/swarm/swarm-orchestrator.d.ts.map +1 -1
package/dist/src/integrations/swarm/swarm-orchestrator.js +233 -10
package/dist/src/integrations/swarm/swarm-orchestrator.js.map +1 -1
package/dist/src/integrations/swarm/swarm-quality-gate.d.ts +9 -2
package/dist/src/integrations/swarm/swarm-quality-gate.d.ts.map +1 -1
package/dist/src/integrations/swarm/swarm-quality-gate.js +128 -11
package/dist/src/integrations/swarm/swarm-quality-gate.js.map +1 -1
package/dist/src/integrations/swarm/task-queue.d.ts +11 -1
package/dist/src/integrations/swarm/task-queue.d.ts.map +1 -1
package/dist/src/integrations/swarm/task-queue.js +125 -15
package/dist/src/integrations/swarm/task-queue.js.map +1 -1
package/dist/src/integrations/swarm/types.d.ts +40 -1
package/dist/src/integrations/swarm/types.d.ts.map +1 -1
package/dist/src/integrations/swarm/types.js +6 -1
package/dist/src/integrations/swarm/types.js.map +1 -1
package/dist/src/integrations/swarm/worker-pool.d.ts +9 -3
package/dist/src/integrations/swarm/worker-pool.d.ts.map +1 -1
package/dist/src/integrations/swarm/worker-pool.js +89 -17
package/dist/src/integrations/swarm/worker-pool.js.map +1 -1
package/dist/src/integrations/thinking-strategy.d.ts +52 -0
package/dist/src/integrations/thinking-strategy.d.ts.map +1 -0
package/dist/src/integrations/thinking-strategy.js +129 -0
package/dist/src/integrations/thinking-strategy.js.map +1 -0
package/dist/src/integrations/tool-recommendation.d.ts +58 -0
package/dist/src/integrations/tool-recommendation.d.ts.map +1 -0
package/dist/src/integrations/tool-recommendation.js +215 -0
package/dist/src/integrations/tool-recommendation.js.map +1 -0
package/dist/src/integrations/verification-gate.d.ts +80 -0
package/dist/src/integrations/verification-gate.d.ts.map +1 -0
package/dist/src/integrations/verification-gate.js +146 -0
package/dist/src/integrations/verification-gate.js.map +1 -0
package/dist/src/integrations/work-log.d.ts +87 -0
package/dist/src/integrations/work-log.d.ts.map +1 -0
package/dist/src/integrations/work-log.js +275 -0
package/dist/src/integrations/work-log.js.map +1 -0
package/dist/src/main.js +5 -4
package/dist/src/main.js.map +1 -1
package/dist/src/modes.d.ts +6 -0
package/dist/src/modes.d.ts.map +1 -1
package/dist/src/modes.js +73 -2
package/dist/src/modes.js.map +1 -1
package/dist/src/tools/bash.d.ts +6 -0
package/dist/src/tools/bash.d.ts.map +1 -1
package/dist/src/tools/bash.js +12 -0
package/dist/src/tools/bash.js.map +1 -1
package/dist/src/tools/standard.d.ts +17 -1
package/dist/src/tools/standard.d.ts.map +1 -1
package/dist/src/tools/standard.js +64 -11
package/dist/src/tools/standard.js.map +1 -1
package/dist/src/types.d.ts +18 -0
package/dist/src/types.d.ts.map +1 -1
package/package.json +6 -2

package/dist/src/agent.js CHANGED

@@ -21,7 +21,11 @@
 import { buildConfig, isFeatureEnabled, getEnabledFeatures, getSubagentTimeout, getSubagentMaxIterations, } from './defaults.js';
 import { createModeManager, formatModeList, parseMode, calculateTaskSimilarity, SUBAGENT_PLAN_MODE_ADDITION, } from './modes.js';
 import { createLSPFileTools, } from './agent-tools/index.js';
-import { HookManager, MemoryManager, PlanningManager, ObservabilityManager, SafetyManager, RoutingManager, MultiAgentManager, ReActManager, ExecutionPolicyManager, ThreadManager, RulesManager, DEFAULT_RULE_SOURCES, ExecutionEconomicsManager, STANDARD_BUDGET, SUBAGENT_BUDGET, TIMEOUT_WRAPUP_PROMPT, AgentRegistry, filterToolsForAgent, formatAgentList, createCancellationManager, isCancellationError, createLinkedToken, createGracefulTimeout, race, createResourceManager, createLSPManager, createSemanticCacheManager, createSkillManager, formatSkillList, createContextEngineering, stableStringify, createCodebaseContext, buildContextFromChunks, createSharedFileCache, createBudgetPool, createPendingPlanManager, createInteractivePlanner, createRecursiveContext, createLearningStore, createCompactor, createAutoCompactionManager, createFileChangeTracker, createCapabilitiesRegistry, createSharedBlackboard, createTaskManager, createSwarmOrchestrator, createThrottledProvider, FREE_TIER_THROTTLE, PAID_TIER_THROTTLE, } from './integrations/index.js';
+import { HookManager, MemoryManager, PlanningManager, ObservabilityManager, SafetyManager, RoutingManager, MultiAgentManager, ReActManager, ExecutionPolicyManager, ThreadManager, RulesManager, DEFAULT_RULE_SOURCES, ExecutionEconomicsManager, STANDARD_BUDGET, SUBAGENT_BUDGET, TIMEOUT_WRAPUP_PROMPT, AgentRegistry, filterToolsForAgent, formatAgentList, createCancellationManager, isCancellationError, createLinkedToken, createGracefulTimeout, race, createResourceManager, createLSPManager, createSemanticCacheManager, createSkillManager, formatSkillList, createContextEngineering, stableStringify, createCodebaseContext, buildContextFromChunks, createSharedFileCache, createBudgetPool, createDynamicBudgetPool, createPendingPlanManager, createInteractivePlanner, createRecursiveContext, createLearningStore, createCompactor, createAutoCompactionManager, createFileChangeTracker, createCapabilitiesRegistry, createSharedBlackboard, createTaskManager, createSwarmOrchestrator, createThrottledProvider, FREE_TIER_THROTTLE, PAID_TIER_THROTTLE, createWorkLog, createVerificationGate,
+// Phase 2: Orchestration
+classifyComplexity, getScalingGuidance, buildDelegationPrompt, createMinimalDelegationSpec, getSubagentQualityPrompt, ToolRecommendationEngine, createToolRecommendationEngine, createInjectionBudgetManager,
+// Phase 3: Advanced
+getThinkingSystemPrompt, createSelfImprovementProtocol, createSubagentOutputStore, createSerperSearchTool, getEnvironmentFacts, formatFactsBlock, createAutoCheckpointManager, createSubagentSupervisor, createSubagentHandle, } from './integrations/index.js';
 // Lesson 26: Tracing & Evaluation integration
 import { createTraceCollector } from './tracing/trace-collector.js';
 // Model registry for context window limits
@@ -43,31 +47,107 @@ export const PARALLELIZABLE_TOOLS = new Set([
     'search_code', 'get_file_info',
 ]);
 /**
- * Groups consecutive tool calls into batches for parallel/sequential execution.
- * Consecutive parallelizable tools form a single parallel batch.
- * Non-parallelizable tools break the sequence, starting a new batch.
+ * Tools that can run in parallel IF they target different files.
+ * write_file and edit_file on different paths are safe to parallelize.
  */
-export function groupToolCallsIntoBatches(toolCalls, isParallelizable = (tc) => PARALLELIZABLE_TOOLS.has(tc.name)) {
+export const CONDITIONALLY_PARALLEL_TOOLS = new Set([
+    'write_file', 'edit_file', // matched by tool name in groupToolCallsIntoBatches' default isConditionallyParallel predicate
+]);
+/**
+ * Extract the target file path from a tool call's arguments.
+ *
+ * Returns the first string-valued `path`, `file_path`, `filename` or `file`
+ * property found, looking on the tool call object itself first and then on
+ * its nested `args`, `input` and `arguments` objects (in that order).
+ *
+ * @param toolCall - Tool call object to inspect.
+ * @returns The file path string, or null if no file path can be determined
+ *   (including when `toolCall` itself is null/undefined).
+ */
+export function extractToolFilePath(toolCall) {
+    const pathKeys = ['path', 'file_path', 'filename', 'file'];
+    // The agent loop passes tool parameters as `toolCall.arguments`, so that
+    // container has to be searched as well. It is checked last so that any
+    // call resolved via the top level, `args` or `input` keeps its result.
+    const containers = [toolCall, toolCall?.args, toolCall?.input, toolCall?.arguments];
+    for (const container of containers) {
+        if (!container || typeof container !== 'object')
+            continue;
+        for (const key of pathKeys) {
+            if (typeof container[key] === 'string')
+                return container[key];
+        }
+    }
+    return null;
+}
+/**
+ * Decide whether a conditionally-parallel tool call must stay out of the
+ * current accumulator.
+ *
+ * @param toolCall - Candidate tool call.
+ * @param accumulator - Tool calls already collected for the pending batch.
+ * @returns true when the candidate's path cannot be determined or equals the
+ *   path of any accumulated call; false otherwise.
+ */
+function hasFileConflict(toolCall, accumulator) {
+    const candidatePath = extractToolFilePath(toolCall);
+    // An unknown target is treated as a conflict.
+    if (!candidatePath) {
+        return true;
+    }
+    // Any accumulated call resolving to the same path is a conflict.
+    return accumulator.some((queued) => extractToolFilePath(queued) === candidatePath);
+}
+/**
+ * Groups tool calls into batches for parallel/sequential execution.
+ * Uses accumulate-and-flush: tools accepted by `isParallelizable` accumulate
+ * until a tool that matches neither predicate arrives; that tool flushes the
+ * accumulator as one batch and is then emitted as a batch of its own.
+ *
+ * Conditional parallelism: a tool accepted by `isConditionallyParallel`
+ * (write_file/edit_file by default) joins the accumulator when
+ * hasFileConflict() reports no conflict. On a conflict (same path as a tool
+ * already accumulated, or no path could be extracted) the accumulator is
+ * flushed and the tool starts a new accumulator, which later tools may join.
+ *
+ * Example (reads/grep parallelizable, `other` matches neither predicate):
+ *   [read1, read2, other, read3, grep] → [[read1, read2], [other], [read3, grep]]
+ *
+ * Example (paths a and b are extractable and distinct):
+ *   [write_a, write_b, write_a] → [[write_a, write_b], [write_a]]
+ *
+ * NOTE(review): tools accepted by `isParallelizable` are appended without a
+ * path check, so a read of a file can share a batch with an earlier write to
+ * that same file — confirm this is intended.
+ *
+ * @param toolCalls - Tool calls in the order they were requested.
+ * @param isParallelizable - Predicate for tools that may always share a batch; defaults to PARALLELIZABLE_TOOLS membership by name.
+ * @param isConditionallyParallel - Predicate for tools that may share a batch only without a file conflict; defaults to CONDITIONALLY_PARALLEL_TOOLS membership by name.
+ * @returns Array of batches (arrays of tool calls); empty when `toolCalls` is empty.
+ */
+export function groupToolCallsIntoBatches(toolCalls, isParallelizable = (tc) => PARALLELIZABLE_TOOLS.has(tc.name), isConditionallyParallel = (tc) => CONDITIONALLY_PARALLEL_TOOLS.has(tc.name)) {
+    if (toolCalls.length === 0)
+        return [];
     const batches = [];
-    let currentBatch = [];
-    let currentIsParallel = false;
+    let parallelAccum = [];
     for (const toolCall of toolCalls) {
-        const isParallel = isParallelizable(toolCall);
-        if (batches.length === 0 && currentBatch.length === 0) {
-            currentBatch.push(toolCall);
-            currentIsParallel = isParallel;
+        if (isParallelizable(toolCall)) {
+            parallelAccum.push(toolCall);
         }
-        else if (isParallel && currentIsParallel) {
-            currentBatch.push(toolCall);
+        else if (isConditionallyParallel(toolCall)) {
+            // Joins the accumulator only when hasFileConflict() reports no conflict
+            if (!hasFileConflict(toolCall, parallelAccum)) {
+                parallelAccum.push(toolCall);
+            }
+            else {
+                // Conflict: flush current batch, start a new accumulator with this tool
+                if (parallelAccum.length > 0) {
+                    batches.push(parallelAccum);
+                    parallelAccum = [];
+                }
+                parallelAccum.push(toolCall);
+            }
         }
         else {
-            batches.push(currentBatch);
-            currentBatch = [toolCall];
-            currentIsParallel = isParallel;
+            // Flush any accumulated parallel tools as a single batch
+            if (parallelAccum.length > 0) {
+                batches.push(parallelAccum);
+                parallelAccum = [];
+            }
+            // Non-parallelizable tool gets its own batch
+            batches.push([toolCall]);
         }
     }
-    if (currentBatch.length > 0) {
-        batches.push(currentBatch);
+    // Flush remaining accumulated tools as the final batch
+    if (parallelAccum.length > 0) {
+        batches.push(parallelAccum);
     }
     return batches;
 }
@@ -117,6 +197,15 @@ export class ProductionAgent {
     taskManager = null;
     store = null;
     swarmOrchestrator = null;
+    workLog = null;
+    verificationGate = null;
+    // Phase 2-4 integration modules
+    injectionBudget = null;
+    selfImprovement = null;
+    subagentOutputStore = null;
+    autoCheckpointManager = null;
+    toolRecommendation = null;
+    lastComplexityAssessment = null;
     // Duplicate spawn prevention - tracks recently spawned tasks to prevent doom loops
     // Map<taskKey, { timestamp: number; result: string; queuedChanges: number }>
     spawnedTasks = new Map();
@@ -311,6 +400,19 @@ export class ProductionAgent {
             maxIterations: this.config.maxIterations,
             targetIterations: Math.min(baseBudget.targetIterations ?? 20, this.config.maxIterations),
         });
+        // Work Log - compaction-resilient summary of agent work
+        // Always enabled - minimal overhead and critical for long-running tasks
+        this.workLog = createWorkLog();
+        // Verification Gate - opt-in completion verification
+        if (this.config.verificationCriteria) {
+            this.verificationGate = createVerificationGate(this.config.verificationCriteria);
+        }
+        // Phase 2-4: Orchestration & Advanced modules (always enabled, lightweight)
+        this.injectionBudget = createInjectionBudgetManager();
+        this.selfImprovement = createSelfImprovementProtocol(undefined, this.learningStore ?? undefined);
+        this.subagentOutputStore = createSubagentOutputStore({ persistToFile: false });
+        this.autoCheckpointManager = createAutoCheckpointManager({ enabled: true });
+        this.toolRecommendation = createToolRecommendationEngine();
         // Agent Registry - always enabled for subagent support
         this.agentRegistry = new AgentRegistry();
         // Load user agents asynchronously - tracked for ensureReady()
@@ -341,6 +443,15 @@ export class ProductionAgent {
         for (const tool of taskTools) {
             this.tools.set(tool.name, tool);
         }
+        // Built-in web search (Serper API) — gracefully handles missing API key
+        const serperCustomTool = createSerperSearchTool();
+        this.tools.set('web_search', {
+            name: serperCustomTool.name,
+            description: serperCustomTool.description,
+            parameters: serperCustomTool.inputSchema,
+            execute: serperCustomTool.execute,
+            dangerLevel: 'safe',
+        });
         // Swarm Mode (experimental)
         if (this.config.swarm) {
             const swarmConfig = this.config.swarm;
@@ -837,6 +948,10 @@ export class ProductionAgent {
         try {
             // Check for cancellation before starting
             cancellationToken?.throwIfCancellationRequested();
+            // Classify task complexity for scaling guidance
+            this.lastComplexityAssessment = classifyComplexity(task, {
+                hasActivePlan: !!this.state.plan,
+            });
             // Check if swarm mode should handle this task
             if (this.swarmOrchestrator) {
                 const swarmResult = await this.runSwarm(task);
@@ -1119,6 +1234,14 @@ export class ProductionAgent {
                                     content: `[CONTEXT REDUCED: Earlier messages were removed to stay within budget. Conversation continues from recent context.]`,
                                 });
                                 messages.push(...recentMessages);
+                                // Inject work log after emergency truncation to prevent amnesia
+                                if (this.workLog?.hasContent()) {
+                                    const workLogMessage = {
+                                        role: 'user',
+                                        content: this.workLog.toCompactString(),
+                                    };
+                                    messages.push(workLogMessage);
+                                }
                                 // Update state messages too
                                 this.state.messages.length = 0;
                                 this.state.messages.push(...messages);
@@ -1299,6 +1422,35 @@ export class ProductionAgent {
                     }
                 }
                 // =====================================================================
+                // INJECTION BUDGET ANALYSIS (Phase 2 - monitoring mode)
+                // Collects stats on context injections without gating; logs when
+                // budget would have dropped items. Validates system before enabling gating.
+                // =====================================================================
+                if (this.injectionBudget) {
+                    const proposals = [];
+                    if (budgetInjectedPrompt) {
+                        proposals.push({ name: 'budget_warning', priority: 0, maxTokens: 500, content: budgetInjectedPrompt });
+                    }
+                    // Approximate recitation content (actual injection handled above)
+                    if (this.contextEngineering) {
+                        const failureCtx = this.contextEngineering.getFailureContext(5);
+                        if (failureCtx) {
+                            proposals.push({ name: 'failure_context', priority: 2, maxTokens: 300, content: failureCtx });
+                        }
+                    }
+                    if (proposals.length > 0) {
+                        const accepted = this.injectionBudget.allocate(proposals);
+                        const stats = this.injectionBudget.getLastStats();
+                        if (stats && stats.droppedNames.length > 0 && process.env.DEBUG) {
+                            console.log(`[injection-budget] Would drop: ${stats.droppedNames.join(', ')} (${stats.proposedTokens} proposed, ${stats.acceptedTokens} accepted)`);
+                        }
+                        // Log total injection overhead for observability
+                        if (stats && process.env.DEBUG_LLM) {
+                            console.log(`[injection-budget] Iteration ${this.state.iteration}: ${accepted.length}/${proposals.length} injections, ~${stats.acceptedTokens} tokens`);
+                        }
+                    }
+                }
+                // =====================================================================
                 // RESILIENT LLM CALL: Empty response retries + max_tokens continuation
                 // =====================================================================
                 // Get resilience config
@@ -1594,6 +1746,24 @@ export class ProductionAgent {
                         });
                         incompleteActionRetries = 0;
                     }
+                    // Verification gate: if criteria not met, nudge agent to verify before completing
+                    if (this.verificationGate && !forceTextOnly) {
+                        const vResult = this.verificationGate.check();
+                        if (!vResult.satisfied && !vResult.forceAllow && vResult.nudge) {
+                            // Inject nudge and continue the loop
+                            const nudgeMessage = {
+                                role: 'user',
+                                content: vResult.nudge,
+                            };
+                            messages.push(nudgeMessage);
+                            this.state.messages.push(nudgeMessage);
+                            this.observability?.logger?.info('Verification gate nudge', {
+                                missing: vResult.missing,
+                                nudgeCount: this.verificationGate.getState().nudgeCount,
+                            });
+                            continue;
+                        }
+                    }
                     // No tool calls (or forced to ignore), agent is done - compact tool outputs to save context
                     // The model has "consumed" the tool outputs and produced a response,
                     // so we can replace verbose outputs with compact summaries
@@ -1630,12 +1800,33 @@ export class ProductionAgent {
                 // Execute tool calls (we know toolCalls is defined here due to the check above)
                 const toolCalls = response.toolCalls;
                 const toolResults = await this.executeToolCalls(toolCalls);
-                // Record tool calls for economics/progress tracking
+                // Record tool calls for economics/progress tracking + work log
                 for (let i = 0; i < toolCalls.length; i++) {
                     const toolCall = toolCalls[i];
                     const result = toolResults[i];
                     executedToolNames.add(toolCall.name);
                     this.economics?.recordToolCall(toolCall.name, toolCall.arguments, result?.result);
+                    // Record in work log for compaction resilience
+                    const toolOutput = result?.result && typeof result.result === 'object' && 'output' in result.result
+                        ? String(result.result.output)
+                        : typeof result?.result === 'string' ? result.result : undefined;
+                    this.workLog?.recordToolExecution(toolCall.name, toolCall.arguments, toolOutput);
+                    // Record in verification gate
+                    if (this.verificationGate) {
+                        if (toolCall.name === 'bash') {
+                            const toolRes = result?.result;
+                            const output = toolRes && typeof toolRes === 'object' && 'output' in toolRes
+                                ? String(toolRes.output)
+                                : typeof toolRes === 'string' ? toolRes : '';
+                            const exitCode = toolRes && typeof toolRes === 'object' && toolRes.metadata
+                                ? toolRes.metadata.exitCode ?? null
+                                : null;
+                            this.verificationGate.recordBashExecution(String(toolCall.arguments.command || ''), output, exitCode);
+                        }
+                        if (['write_file', 'edit_file'].includes(toolCall.name)) {
+                            this.verificationGate.recordFileChange();
+                        }
+                    }
                 }
                 // Add tool results to messages (with truncation and proactive budget management)
                 const MAX_TOOL_OUTPUT_CHARS = 8000; // ~2000 tokens max per tool output
@@ -1657,6 +1848,15 @@ export class ProductionAgent {
                         messages.push(...compactionResult.compactedMessages);
                         this.state.messages.length = 0;
                         this.state.messages.push(...compactionResult.compactedMessages);
+                        // Inject work log after compaction to prevent amnesia
+                        if (this.workLog?.hasContent()) {
+                            const workLogMessage = {
+                                role: 'user',
+                                content: this.workLog.toCompactString(),
+                            };
+                            messages.push(workLogMessage);
+                            this.state.messages.push(workLogMessage);
+                        }
                     }
                     else if (compactionResult.status === 'hard_limit') {
                         // Hard limit reached - this is serious, emit error
@@ -1851,12 +2051,25 @@ export class ProductionAgent {
             }
         }
         // Build system prompt using cache-aware builder if available (Trick P)
-        // Combine memory, learnings, and codebase context
-        const combinedContext = [
+        // Combine memory, learnings, codebase context, and environment facts
+        const combinedContextParts = [
+            // Environment facts — temporal/platform grounding (prevents stale date hallucinations)
+            formatFactsBlock(getEnvironmentFacts()),
             ...(memoryContext.length > 0 ? memoryContext : []),
             ...(learningsContext ? [learningsContext] : []),
             ...(codebaseContextStr ? [`\n## Relevant Code\n${codebaseContextStr}`] : []),
-        ].join('\n');
+        ];
+        // Inject thinking directives and scaling guidance for non-simple tasks
+        if (this.lastComplexityAssessment) {
+            const thinkingPrompt = getThinkingSystemPrompt(this.lastComplexityAssessment.tier);
+            if (thinkingPrompt) {
+                combinedContextParts.push(thinkingPrompt);
+            }
+            if (this.lastComplexityAssessment.tier !== 'simple') {
+                combinedContextParts.push(getScalingGuidance(this.lastComplexityAssessment));
+            }
+        }
+        const combinedContext = combinedContextParts.join('\n');
         const promptOptions = {
             rules: rulesContent + (skillsPrompt ? '\n\n' + skillsPrompt : ''),
             tools: toolDescriptions,
@@ -1996,6 +2209,8 @@ export class ProductionAgent {
                 },
             },
         });
+        // Pause duration budget during LLM call - network time shouldn't count against agent
+        this.economics?.pauseDuration();
         try {
             let response;
             let actualModel = model;
@@ -2135,6 +2350,10 @@ export class ProductionAgent {
             this.observability?.tracer?.endSpan(spanId);
             throw error;
         }
+        finally {
+            // Resume duration budget after LLM call completes (success or failure)
+            this.economics?.resumeDuration();
+        }
     }
     /**
      * Execute an async callback while excluding wall-clock wait time from duration budgeting.
@@ -2467,6 +2686,8 @@ export class ProductionAgent {
                     this.blackboard.release(filePath, agentId);
                 }
             }
+            // Self-improvement: record success pattern
+            this.selfImprovement?.recordSuccess(toolCall.name, toolCall.arguments, typeof result === 'string' ? result.slice(0, 200) : JSON.stringify(result).slice(0, 200));
             this.observability?.tracer?.endSpan(spanId);
             return { callId: toolCall.id, result };
         }
@@ -2494,6 +2715,12 @@ export class ProductionAgent {
                 error,
                 intent: `Execute tool ${toolCall.name}`,
             });
+            // Self-improvement: enhance error message with diagnosis for better LLM recovery
+            if (this.selfImprovement) {
+                const enhanced = this.selfImprovement.enhanceErrorMessage(toolCall.name, error.message, toolCall.arguments);
+                this.emit({ type: 'tool.blocked', tool: toolCall.name, reason: enhanced });
+                return { callId: toolCall.id, result: `Error: ${enhanced}`, error: enhanced };
+            }
             this.emit({ type: 'tool.blocked', tool: toolCall.name, reason: error.message });
             return { callId: toolCall.id, result: `Error: ${error.message}`, error: error.message };
         }
@@ -3522,6 +3749,19 @@ export class ProductionAgent {
         }
         // Create the checkpoint
         const label = `auto-iter-${this.state.iteration}`;
+        // Supplementary: also save to AutoCheckpointManager (file-based)
+        if (this.autoCheckpointManager) {
+            try {
+                this.autoCheckpointManager.save({
+                    label,
+                    sessionId: this.agentId,
+                    iteration: this.state.iteration,
+                });
+            }
+            catch {
+                // Non-critical — don't fail the main checkpoint path
+            }
+        }
         return this.createCheckpoint(label);
     }
     // =========================================================================
@@ -3675,7 +3915,18 @@ export class ProductionAgent {
         let workerResultId;
         try {
             // Filter tools for this agent
-            const agentTools = filterToolsForAgent(agentDef, Array.from(this.tools.values()));
+            let agentTools = filterToolsForAgent(agentDef, Array.from(this.tools.values()));
+            // Apply tool recommendations to improve subagent focus (only for large tool sets)
+            if (this.toolRecommendation && agentTools.length > 15) {
+                const taskType = ToolRecommendationEngine.inferTaskType(agentName);
+                const recommendations = this.toolRecommendation.recommendTools(task, taskType, agentTools.map(t => t.name));
+                if (recommendations.length > 0) {
+                    const recommendedNames = new Set(recommendations.map(r => r.toolName));
+                    // Always keep spawn tools even if not recommended
+                    const alwaysKeep = new Set(['spawn_agent', 'spawn_agents_parallel']);
+                    agentTools = agentTools.filter(t => recommendedNames.has(t.name) || alwaysKeep.has(t.name));
+                }
+            }
             // Resolve model - abstract tiers (fast/balanced/quality) should use parent's model
             // Only use agentDef.model if it's an actual model ID (contains '/')
             const resolvedModel = (agentDef.model && agentDef.model.includes('/'))
@@ -3767,14 +4018,30 @@ export class ProductionAgent {
             // BUDGET AWARENESS: Always inject so subagent understands its limits
             const subagentBudgetTokens = constraints?.maxTokens ?? SUBAGENT_BUDGET.maxTokens ?? 100000;
             const subagentBudgetMinutes = Math.round((SUBAGENT_BUDGET.maxDuration ?? 240000) / 60000);
-            constraintParts.push(`**RESOURCE AWARENESS (CRITICAL):**\n` +
-                `- Token budget: ~${(subagentBudgetTokens / 1000).toFixed(0)}k tokens\n` +
-                `- Time limit: ~${subagentBudgetMinutes} minutes\n` +
-                `- You will receive warnings at 70% usage. When warned, WRAP UP immediately.\n` +
-                `- Do not explore indefinitely - be focused and efficient.\n` +
-                `- If approaching limits, summarize findings and return.\n` +
-                `- **STRUCTURED WRAPUP:** When told to wrap up, respond with ONLY this JSON (no tool calls):\n` +
-                `  {"findings":[...], "actionsTaken":[...], "failures":[...], "remainingWork":[...], "suggestedNextSteps":[...]}`);
+            if (isSwarmWorker) {
+                // V6: Calmer resource awareness for swarm workers — prevents weaker models
+                // from confabulating budget warnings and wrapping up without doing work
+                constraintParts.push(`**Resource Info:**\n` +
+                    `- Token budget: ~${(subagentBudgetTokens / 1000).toFixed(0)}k tokens (you have plenty)\n` +
+                    `- Time limit: ~${subagentBudgetMinutes} minutes\n` +
+                    `- Focus on completing your task. Do NOT wrap up prematurely.\n` +
+                    `- You will receive a system warning IF you approach budget limits. Until then, work normally.\n` +
+                    `- **IMPORTANT:** Budget warnings come from the SYSTEM, not from your own assessment. ` +
+                    `Do not preemptively claim budget issues.\n` +
+                    `- **STRUCTURED WRAPUP:** When told to wrap up, respond with ONLY this JSON (no tool calls):\n` +
+                    `  {"findings":[...], "actionsTaken":[...], "failures":[...], "remainingWork":[...], "suggestedNextSteps":[...]}`);
+            }
+            else {
+                // Original RESOURCE AWARENESS text for regular subagents
+                constraintParts.push(`**RESOURCE AWARENESS (CRITICAL):**\n` +
+                    `- Token budget: ~${(subagentBudgetTokens / 1000).toFixed(0)}k tokens\n` +
+                    `- Time limit: ~${subagentBudgetMinutes} minutes\n` +
+                    `- You will receive warnings at 70% usage. When warned, WRAP UP immediately.\n` +
+                    `- Do not explore indefinitely - be focused and efficient.\n` +
+                    `- If approaching limits, summarize findings and return.\n` +
+                    `- **STRUCTURED WRAPUP:** When told to wrap up, respond with ONLY this JSON (no tool calls):\n` +
+                    `  {"findings":[...], "actionsTaken":[...], "failures":[...], "remainingWork":[...], "suggestedNextSteps":[...]}`);
+            }
             if (constraints) {
                 if (constraints.focusAreas && constraints.focusAreas.length > 0) {
                     constraintParts.push(`**FOCUS AREAS (limit exploration to these paths):**\n${constraints.focusAreas.map(a => `  - ${a}`).join('\n')}`);
@@ -3790,11 +4057,19 @@ export class ProductionAgent {
                 }
             }
             const constraintContext = `\n\n**EXECUTION CONSTRAINTS:**\n${constraintParts.join('\n\n')}\n`;
+            // Build delegation-enhanced system prompt
+            let delegationContext = '';
+            if (this.lastComplexityAssessment && this.lastComplexityAssessment.tier !== 'simple') {
+                const spec = createMinimalDelegationSpec(task, agentName);
+                delegationContext = '\n\n' + buildDelegationPrompt(spec);
+            }
+            // Quality self-assessment prompt for subagent
+            const qualityPrompt = '\n\n' + getSubagentQualityPrompt();
             // Build subagent system prompt with subagent-specific plan mode addition
             const parentMode = this.getMode();
             const subagentSystemPrompt = parentMode === 'plan'
-                ? `${agentDef.systemPrompt}\n\n${SUBAGENT_PLAN_MODE_ADDITION}${blackboardContext}${constraintContext}`
-                : `${agentDef.systemPrompt}${blackboardContext}${constraintContext}`;
+                ? `${agentDef.systemPrompt}\n\n${SUBAGENT_PLAN_MODE_ADDITION}${blackboardContext}${constraintContext}${delegationContext}${qualityPrompt}`
+                : `${agentDef.systemPrompt}${blackboardContext}${constraintContext}${delegationContext}${qualityPrompt}`;
             // Allocate budget from pool (or use default) — track allocation ID for release later
             const pooledBudget = this.getSubagentBudget(agentName, constraints);
             const poolAllocationId = pooledBudget.allocationId;
@@ -4006,6 +4281,25 @@ export class ProductionAgent {
                     },
                     structured,
                 };
+                // Save the full output to the subagent output store (avoids the telephone problem)
+                if (this.subagentOutputStore) {
+                    const outputEntry = {
+                        id: agentId,
+                        agentId,
+                        agentName,
+                        task,
+                        fullOutput: finalOutput,
+                        structured,
+                        filesModified: [],
+                        filesCreated: [],
+                        timestamp: new Date(),
+                        tokensUsed: result.metrics.totalTokens,
+                        durationMs: duration,
+                    };
+                    const storeId = this.subagentOutputStore.save(outputEntry);
+                    // Attach reference so downstream consumers can retrieve full output
+                    spawnResultFinal.outputStoreId = storeId;
+                }
                 if (workerResultId && this.store?.hasWorkerResultsFeature()) {
                     try {
                         this.store.completeWorkerResult(workerResultId, {
@@ -4310,23 +4604,34 @@ export class ProductionAgent {
             count: tasks.length,
             agents: tasks.map(t => t.agent),
         });
-        // Pre-divide budget pool equally to prevent first-come starvation.
-        // Temporarily lower maxPerChild so each spawnAgent's normal reserve() call
-        // gets an equal share instead of racing for the full maxPerChild allocation.
+        // Use DynamicBudgetPool for parallel spawns (prevents child starvation,
+        // enables priority-based allocation). Falls back to regular pool for single tasks.
         let settled;
+        const originalPool = this.budgetPool;
+        // SubagentSupervisor for unified monitoring of concurrent subagents
+        const supervisor = tasks.length > 1 ? createSubagentSupervisor() : null;
         if (this.budgetPool && tasks.length > 1) {
+            // Swap to DynamicBudgetPool for this parallel batch
             const poolStats = this.budgetPool.getStats();
-            // equalShare is always ≤ remaining ≤ totalTokens ≤ originalMaxPerChild
-            // (guaranteed by createBudgetPool capping maxPerChild to poolTokens)
-            // so we don't need Math.min(equalShare, originalMaxPerChild) here.
-            const equalShare = Math.floor(poolStats.tokensRemaining / tasks.length);
-            this.budgetPool.setMaxPerChild(equalShare);
+            const dynamicPool = createDynamicBudgetPool(poolStats.tokensRemaining, 0.1);
+            dynamicPool.setExpectedChildren(tasks.length);
+            // Temporarily replace the budget pool so spawnAgent's reserve() uses the dynamic one
+            this.budgetPool = dynamicPool;
             try {
-                const promises = tasks.map(({ agent, task }) => this.spawnAgent(agent, task));
+                const promises = tasks.map(({ agent, task }) => {
+                    const spawnPromise = this.spawnAgent(agent, task);
+                    // Register with supervisor for monitoring
+                    if (supervisor) {
+                        const handle = createSubagentHandle(`parallel-${agent}-${Date.now()}`, agent, task, spawnPromise, {});
+                        supervisor.add(handle);
+                    }
+                    return spawnPromise;
+                });
                 settled = await Promise.allSettled(promises);
             }
             finally {
-                this.budgetPool.resetMaxPerChild();
+                this.budgetPool = originalPool;
+                supervisor?.stop();
             }
         }
         else {
@@ -5041,8 +5346,19 @@ If the task is a simple question or doesn't need specialized handling, set bestA
         this.unsubscribers = [];
         // Flush trace collector before cleanup
         await this.traceCollector?.flush();
-        // Clear blackboard (releases file claim locks)
-        this.blackboard?.clear();
+        // Per-agent blackboard cleanup: release only this agent's claims and subscriptions
+        // so parallel siblings don't lose their data. Only root agent clears everything.
+        if (this.blackboard) {
+            if (this.parentIterations > 0 && this.agentId) {
+                // Subagent: release only our claims and subscriptions
+                this.blackboard.releaseAll(this.agentId);
+                this.blackboard.unsubscribeAgent(this.agentId);
+            }
+            else {
+                // Root agent: full clear
+                this.blackboard.clear();
+            }
+        }
         // Wait for any pending init before cleanup
         if (this.initPromises.length > 0) {
             try {