npm - aiden-runtime - Versions diffs - 4.6.1 → 4.8.0 - Mend

aiden-runtime 4.6.1 → 4.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34)

package/README.md +499 -265
package/dist/cli/v4/aidenCLI.js +44 -5
package/dist/cli/v4/callbacks.js +52 -31
package/dist/cli/v4/chatSession.js +46 -1
package/dist/cli/v4/commands/help.js +22 -11
package/dist/cli/v4/commands/runs.js +42 -24
package/dist/cli/v4/commands/skills.js +15 -17
package/dist/cli/v4/commands/usage.js +17 -5
package/dist/cli/v4/daemonAgentBuilder.js +13 -4
package/dist/cli/v4/design/tokens.js +265 -0
package/dist/cli/v4/display/framedPanel.js +116 -0
package/dist/cli/v4/display/toolTrail.js +2 -2
package/dist/cli/v4/display.js +446 -164
package/dist/cli/v4/onboarding/disclaimer.js +42 -10
package/dist/cli/v4/onboarding/loading.js +24 -1
package/dist/cli/v4/onboarding/successScreen.js +17 -8
package/dist/cli/v4/replyRenderer.js +74 -58
package/dist/cli/v4/setupWizard.js +19 -2
package/dist/cli/v4/skinEngine.js +13 -0
package/dist/cli/v4/table.js +65 -8
package/dist/core/v4/aidenAgent.js +42 -14
package/dist/core/v4/auxiliaryClient.js +46 -13
package/dist/core/v4/daemon/dispatcher/realAgentRunner.js +13 -8
package/dist/core/v4/promptBuilder.js +45 -0
package/dist/core/v4/sandboxFs.js +1 -1
package/dist/core/v4/subagent/childBuilder.js +13 -4
package/dist/core/v4/subagent/spawnSubAgent.js +7 -1
package/dist/core/v4/ui/banner.js +16 -16
package/dist/core/version.js +1 -1
package/dist/moat/approvalEngine.js +14 -0
package/dist/moat/honestyEnforcement.js +143 -241
package/dist/tools/v4/index.js +54 -0
package/dist/tools/v4/subagent/spawnSubAgentTool.js +23 -0
package/package.json +10 -4

package/dist/core/v4/auxiliaryClient.js CHANGED Viewed

@@ -45,19 +45,35 @@ class AuxiliaryClient {
             return this.opts.adapter;
         if (!this.opts.resolver)
             return null;
-        this.resolveCallCount += 1;
-        try {
-            const adapter = await this.opts.resolver.resolve({
-                providerId: this.opts.defaultProvider,
-                modelId: this.opts.defaultModel,
-            });
-            return adapter;
-        }
-        catch (err) {
-            this.warn(`auxiliary client unavailable (${this.opts.defaultProvider}/${this.opts.defaultModel}): ${err.message}`);
-            this.adapterUnavailable = true;
-            return null;
+        // v4.8.0 Slice 11 — resolution chain: default first, then each
+        // fallback in order. The first attempt that resolves wins. This
+        // is the routing-fix entry point for the chatgpt-plus + gpt-5
+        // bug: aidenCLI hands us Groq as the default and the parent
+        // provider/model as the fallback, so auxiliary calls land on
+        // Groq when configured and the parent only sees traffic when
+        // Groq is absent.
+        const attempts = [
+            { providerId: this.opts.defaultProvider, modelId: this.opts.defaultModel },
+            ...(this.opts.fallbacks ?? []),
+        ];
+        const failures = [];
+        for (const att of attempts) {
+            this.resolveCallCount += 1;
+            try {
+                const adapter = await this.opts.resolver.resolve({
+                    providerId: att.providerId,
+                    modelId: att.modelId,
+                });
+                this.warn(`auxiliary resolved via ${att.providerId}/${att.modelId}`);
+                return adapter;
+            }
+            catch (err) {
+                failures.push(`${att.providerId}/${att.modelId}: ${err.message}`);
+            }
         }
+        this.warn(`auxiliary client unavailable (tried ${attempts.length}): ${failures.join('; ')}`);
+        this.adapterUnavailable = true;
+        return null;
     }
     /** Resolve count for tests (verifies single-resolution behaviour). */
     _resolveCallCount() {
@@ -122,7 +138,24 @@ class AuxiliaryClient {
         this.usage.set(purpose, cur);
     }
     warn(msg) {
-        (this.opts.warn ?? ((m) => console.warn(`[auxiliary] ${m}`)))(msg);
+        // v4.8.0 Slice 5 — gate console output behind AIDEN_VERBOSE.
+        // Auxiliary failures are recoverable (the main loop continues;
+        // result content is just empty), so the warning is pure noise
+        // for end users. Power users set AIDEN_VERBOSE=1 to surface them.
+        // Inline env-read preserves the core → cli no-import invariant;
+        // canonical isVerbose() lives at cli/v4/design/tokens.ts.
+        //
+        // v4.8.0 Slice 11 — if opts.warn is explicitly injected, always
+        // forward (tests + advanced callers register their own sink and
+        // expect every message). The AIDEN_VERBOSE gate now applies only
+        // to the default console.warn fallback that end-users see.
+        if (this.opts.warn) {
+            this.opts.warn(msg);
+            return;
+        }
+        if (process.env.AIDEN_VERBOSE !== '1')
+            return;
+        console.warn(`[auxiliary] ${msg}`);
     }
     async withTimeout(p, ms) {
         return new Promise((resolve, reject) => {

package/dist/core/v4/daemon/dispatcher/realAgentRunner.js CHANGED Viewed

@@ -177,14 +177,19 @@ function createRealAgentRunner(opts) {
             let invocationError = null;
             try {
                 result = await agent.runConversation(history, {
-                // The agent honours its own abort signal via per-tool aborts;
-                // tools that respect AbortSignal (shell_exec, fetch_*) will
-                // bail when perTurnWatcher trips.
-                //
-                // Note: runConversation doesn't currently take an abort
-                // signal in its options — the budget watcher is best-effort
-                // observability via tally(). Future enhancement: thread the
-                // signal into the loop body via options.
+                    // The agent honours its own abort signal via per-tool aborts;
+                    // tools that respect AbortSignal (shell_exec, fetch_*) will
+                    // bail when perTurnWatcher trips.
+                    //
+                    // Note: runConversation doesn't currently take an abort
+                    // signal in its options — the budget watcher is best-effort
+                    // observability via tally(). Future enhancement: thread the
+                    // signal into the loop body via options.
+                    //
+                    // v4.8.0 Phase 2.2 — uiOnly events on the daemon side are
+                    // dropped here. Phase 2.4 will serialize them into the
+                    // dispatcher's run_events stream.
+                    onUiEvent: () => { },
                 });
                 // Stamp the actual token usage onto the watcher for the
                 // post-turn snapshot below.

package/dist/core/v4/promptBuilder.js CHANGED Viewed

@@ -131,6 +131,42 @@ const EXECUTION_DISCIPLINE_PROSE = [
     'result. When the user requests an action, take it. When the user requests',
     'discussion, discuss.',
 ].join('\n');
+/**
+ * v4.8.0 Phase 2.6 — UI events nudge. Without this, the model only
+ * emits ui_* tools when explicitly told to (e.g. "call ui_task_update
+ * with ..."). With it, events fire during normal multi-step work —
+ * research, file creation, test runs, command execution. Always-on:
+ * every model that sees the ui_* tools benefits.
+ */
+const UI_EVENTS_GUIDANCE = [
+    '## UI events',
+    '',
+    'When doing multi-step work, emit structured progress signals INSTEAD OF',
+    'writing them as text. The user sees these as inline rows separate from',
+    'your prose reply.',
+    '',
+    'WRONG (do NOT do this):',
+    '  "✓ Done — found 3 results"',
+    '  "⟳ Searching the web..."',
+    '  "Created hello.py"',
+    '',
+    'RIGHT:',
+    '  ui_task_update {task_id, label, status: "running"}',
+    '  ui_task_done   {task_id, status: "success", summary}',
+    '  ui_artifact_created {path, kind: "file", preview}',
+    '',
+    'When to fire each:',
+    '- ui_task_update + ui_task_done for any multi-step task (pair them by task_id)',
+    '- ui_command_result after shell_exec when the output is interesting',
+    '- ui_test_result after running tests',
+    '- ui_toast for transient notices (e.g. "switched to dark mode")',
+    '- ui_artifact_created when you create or modify a file/skill',
+    '- ui_approval_request fires automatically for risky tools — NEVER emit it manually',
+    '',
+    'Markdown text in your reply is for explanation, not status. Status goes',
+    'through events. Skip events entirely on single-shot queries that aren\'t',
+    'multi-step work.',
+].join('\n');
 /**
  * Llama-3.3-specific tool-call format guard. Adapter-side recovery picks
  * up failures, but we'd rather avoid the 400 round-trip.
@@ -358,6 +394,15 @@ class PromptBuilder {
                 optional: true,
             });
         }
+        // ── 6.6. UI events nudge (v4.8.0 Phase 2.6) ───────────────────────
+        // Unconditional like execution discipline — every model that sees
+        // the ui_* tools benefits. Teaches structured-event emission for
+        // multi-step work instead of relying on text status formatting.
+        slots.push({
+            name: 'uiEvents',
+            content: UI_EVENTS_GUIDANCE,
+            optional: true,
+        });
         // ── 7. Iteration budget ───────────────────────────────────────────
         if (opts.initialBudget) {
             const { used, max } = opts.initialBudget;

package/dist/core/v4/sandboxFs.js CHANGED Viewed

@@ -94,7 +94,7 @@ function expandPathInline(input, cwd) {
 }
 /**
  * Boundary-aware containment check. `path.relative` avoids the
- * `/home/user-evil` vs `/home/user` false positive that a naive
+ * `<root>/user-evil` vs `<root>/user` false positive that a naive
  * `startsWith` would produce.
  */
 function isWithin(child, parent) {

package/dist/core/v4/subagent/childBuilder.js CHANGED Viewed

@@ -33,6 +33,7 @@ Object.defineProperty(exports, "__esModule", { value: true });
 exports.ProviderNotFoundError = exports.SUBAGENT_BLOCKED_TOOL_NAMES = void 0;
 exports.buildChildAgent = buildChildAgent;
 const approvalEngine_1 = require("../../../moat/approvalEngine");
+const honestyEnforcement_1 = require("../../../moat/honestyEnforcement");
 const aidenAgent_1 = require("../aidenAgent");
 const providerFallback_1 = require("../providerFallback");
 // ── Hard-coded blocklist (Q5 from design doc §2) ────────────────────────────
@@ -177,10 +178,16 @@ function buildChildAgent(deps, input) {
     // Pure no-op when runStore is absent (unit tests of buildChildAgent).
     const onToolCall = buildOnToolCall(deps);
     // ── 7. Build the child agent ─────────────────────────────────────────────
-    // Focused worker config: omit plannerGuard, honestyEnforcement,
-    // skillTeacher, skillMiner, contextCompressor, promptCaching,
-    // promptBuilder. Match the daemon agent's "act on the task, don't
-    // self-improve" shape.
+    // Focused worker config: omit plannerGuard, skillTeacher, skillMiner,
+    // contextCompressor, promptCaching, promptBuilder. Match the daemon
+    // agent's "act on the task, don't self-improve" shape.
+    //
+    // v4.7.0: HonestyEnforcement is now structural (reads tool trace only,
+    // no natural-language scanning) and cheap enough to run in subagents.
+    // Mode is 'detect' here — events are captured into the child's run
+    // record but never produce user-visible output (subagents have no
+    // chat surface; the parent assembles their summary).
+    const childHonestyEnforcement = new honestyEnforcement_1.HonestyEnforcement('detect');
     const agent = new aidenAgent_1.AidenAgent({
         provider: childProvider,
         tools: childTools,
@@ -192,6 +199,8 @@ function buildChildAgent(deps, input) {
         resolveVerifiedFlag: deps.resolveVerifiedFlag,
         resolveToolset: deps.resolveToolset,
         resolveMutates: deps.resolveMutates,
+        resolveUiOnly: deps.resolveUiOnly,
+        honestyEnforcement: childHonestyEnforcement,
         onToolCall,
         // iterationBudgetInjection inherits the default (true) — child
         // sees its own remaining-budget hint near the end of the run.

package/dist/core/v4/subagent/spawnSubAgent.js CHANGED Viewed

@@ -190,7 +190,13 @@ async function spawnSubAgent(spec, deps, ctx) {
     let tokensIn = 0;
     let tokensOut = 0;
     try {
-        const result = await agentBundle.agent.runConversation(agentBundle.history, { signal: childCtrl.signal });
+        const result = await agentBundle.agent.runConversation(agentBundle.history, {
+            signal: childCtrl.signal,
+            // v4.8.0 Phase 2.2 — uiOnly events from a subagent are
+            // dropped. Subagents have no chat surface; the parent
+            // assembles their summary. Stub stays a no-op forever.
+            onUiEvent: () => { },
+        });
         apiCalls = result.turnCount; // one provider call per turn
         tokensIn = result.totalUsage.inputTokens;
         tokensOut = result.totalUsage.outputTokens;

package/dist/core/v4/ui/banner.js CHANGED Viewed

@@ -90,29 +90,29 @@ function renderBanner(opts) {
         out.push('');
         return out.join('\n') + '\n';
     }
-    // Wide layout: framed panel with ASCII art inside, taglines below.
+    // v4.8.0 Slice 10b — wide layout flows the AIDEN art without the
+    // heavy `╔══╗` frame (legacy chrome). The art carries its own
+    // visual weight as the boot-card identity anchor; framing it
+    // inside a closed box collides with the asymmetric orange-bar
+    // language used by every other v4.8.0 surface.
+    //
+    // v4.8.0 Slice 10c — emit raw 24-bit truecolor for the AIDEN art
+    // instead of routing through `c.primary` (which depth-detects via
+    // theme.ts and degrades to 256-color or 16-color when COLORTERM is
+    // unset — common on Windows ConPTY). Result on those terminals was
+    // a washed-out / grey AIDEN that didn't match the boot card's
+    // skinEngine-painted brand orange. Forcing truecolor here brings
+    // disclaimer + setupWizard banner in line with the boot card.
+    const ORANGE_ON = '\x1b[38;2;255;107;53m';
+    const COLOR_OFF = '\x1b[39m';
     const inner = w - 2;
     const artPad = Math.max(0, Math.floor((inner - ART_WIDTH) / 2));
-    const framed = opts.framed !== false;
-    const horiz = '═'.repeat(inner);
-    const top = framed ? theme_1.c.rule(`╔${horiz}╗`) : '';
-    const bottom = framed ? theme_1.c.rule(`╚${horiz}╝`) : '';
-    const blank = framed
-        ? `${theme_1.c.rule('║')}${' '.repeat(inner)}${theme_1.c.rule('║')}`
-        : ' '.repeat(w);
     const lines = [];
     lines.push('');
-    if (framed)
-        lines.push(top);
-    lines.push(blank);
     for (const row of AIDEN_ART) {
         const padded = rpad(' '.repeat(artPad) + row, inner);
-        const coloured = theme_1.c.primary(padded);
-        lines.push(framed ? `${theme_1.c.rule('║')}${coloured}${theme_1.c.rule('║')}` : `  ${coloured}`);
+        lines.push(`  ${ORANGE_ON}${padded}${COLOR_OFF}`);
     }
-    lines.push(blank);
-    if (framed)
-        lines.push(bottom);
     lines.push('');
     lines.push('  ' + (0, theme_1.dim)(theme_1.c.muted(versionLine)));
     lines.push('');

package/dist/core/version.js CHANGED Viewed

@@ -2,4 +2,4 @@
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.VERSION = void 0;
 // AUTO-GENERATED by scripts/inject-version.js — do not edit by hand
-exports.VERSION = '4.6.1';
+exports.VERSION = '4.8.0';

package/dist/moat/approvalEngine.js CHANGED Viewed

@@ -237,6 +237,20 @@ class ApprovalEngine {
             this.callbacks.onDecision?.(req, 'deny');
             return false;
         }
+        // v4.8.0 Phase 2.5 — emit a structured ui_approval_request event
+        // BEFORE the y/n prompt fires. Additive: the display layer paints
+        // the gutter-integrated row, then the existing promptUser flow
+        // runs unchanged. Moat-tier (safe/caution/dangerous) maps to the
+        // ui schema's 4-tier scale; 'critical' is reserved for future
+        // wiring and unreachable from this path.
+        const uiTier = req.riskTier === 'safe' ? 'low' :
+            req.riskTier === 'dangerous' ? 'high' : 'medium';
+        const argsPreview = JSON.stringify(req.args).slice(0, 80);
+        this.callbacks.onUiEvent?.('ui_approval_request', {
+            prompt: `${req.toolName} ${argsPreview}`,
+            risk_tier: uiTier,
+            reason: req.reason,
+        });
         const decision = await this.callbacks.promptUser(req);
         this.callbacks.onDecision?.(req, decision);
         if (decision === 'deny')