npm - aiden-runtime - Versions diffs - 4.7.0 → 4.8.0 - Mend

aiden-runtime 4.7.0 → 4.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32)

package/README.md +12 -1
package/dist/cli/v4/aidenCLI.js +40 -5
package/dist/cli/v4/callbacks.js +52 -31
package/dist/cli/v4/chatSession.js +46 -1
package/dist/cli/v4/commands/help.js +22 -11
package/dist/cli/v4/commands/runs.js +42 -24
package/dist/cli/v4/commands/skills.js +15 -17
package/dist/cli/v4/commands/usage.js +17 -5
package/dist/cli/v4/daemonAgentBuilder.js +1 -0
package/dist/cli/v4/design/tokens.js +265 -0
package/dist/cli/v4/display/framedPanel.js +116 -0
package/dist/cli/v4/display/toolTrail.js +2 -2
package/dist/cli/v4/display.js +446 -164
package/dist/cli/v4/onboarding/disclaimer.js +42 -10
package/dist/cli/v4/onboarding/loading.js +24 -1
package/dist/cli/v4/onboarding/successScreen.js +17 -8
package/dist/cli/v4/replyRenderer.js +74 -58
package/dist/cli/v4/setupWizard.js +19 -2
package/dist/cli/v4/skinEngine.js +13 -0
package/dist/cli/v4/table.js +65 -8
package/dist/core/v4/aidenAgent.js +23 -0
package/dist/core/v4/auxiliaryClient.js +46 -13
package/dist/core/v4/daemon/dispatcher/realAgentRunner.js +13 -8
package/dist/core/v4/promptBuilder.js +45 -0
package/dist/core/v4/subagent/childBuilder.js +1 -0
package/dist/core/v4/subagent/spawnSubAgent.js +7 -1
package/dist/core/v4/ui/banner.js +16 -16
package/dist/core/version.js +1 -1
package/dist/moat/approvalEngine.js +14 -0
package/dist/tools/v4/index.js +54 -0
package/dist/tools/v4/subagent/spawnSubAgentTool.js +23 -0
package/package.json +1 -1

package/dist/core/v4/auxiliaryClient.js CHANGED Viewed

@@ -45,19 +45,35 @@ class AuxiliaryClient {
             return this.opts.adapter;
         if (!this.opts.resolver)
             return null;
-        this.resolveCallCount += 1;
-        try {
-            const adapter = await this.opts.resolver.resolve({
-                providerId: this.opts.defaultProvider,
-                modelId: this.opts.defaultModel,
-            });
-            return adapter;
-        }
-        catch (err) {
-            this.warn(`auxiliary client unavailable (${this.opts.defaultProvider}/${this.opts.defaultModel}): ${err.message}`);
-            this.adapterUnavailable = true;
-            return null;
+        // v4.8.0 Slice 11 — resolution chain: default first, then each
+        // fallback in order. The first attempt that resolves wins. This
+        // is the routing-fix entry point for the chatgpt-plus + gpt-5
+        // bug: aidenCLI hands us Groq as the default and the parent
+        // provider/model as the fallback, so auxiliary calls land on
+        // Groq when configured and the parent only sees traffic when
+        // Groq is absent.
+        const attempts = [
+            { providerId: this.opts.defaultProvider, modelId: this.opts.defaultModel },
+            ...(this.opts.fallbacks ?? []),
+        ];
+        const failures = [];
+        for (const att of attempts) {
+            this.resolveCallCount += 1;
+            try {
+                const adapter = await this.opts.resolver.resolve({
+                    providerId: att.providerId,
+                    modelId: att.modelId,
+                });
+                this.warn(`auxiliary resolved via ${att.providerId}/${att.modelId}`);
+                return adapter;
+            }
+            catch (err) {
+                failures.push(`${att.providerId}/${att.modelId}: ${err.message}`);
+            }
         }
+        this.warn(`auxiliary client unavailable (tried ${attempts.length}): ${failures.join('; ')}`);
+        this.adapterUnavailable = true;
+        return null;
     }
     /** Resolve count for tests (verifies single-resolution behaviour). */
     _resolveCallCount() {
@@ -122,7 +138,24 @@ class AuxiliaryClient {
         this.usage.set(purpose, cur);
     }
     warn(msg) {
-        (this.opts.warn ?? ((m) => console.warn(`[auxiliary] ${m}`)))(msg);
+        // v4.8.0 Slice 5 — gate console output behind AIDEN_VERBOSE.
+        // Auxiliary failures are recoverable (the main loop continues;
+        // result content is just empty), so the warning is pure noise
+        // for end users. Power users set AIDEN_VERBOSE=1 to surface them.
+        // Inline env-read preserves the core → cli no-import invariant;
+        // canonical isVerbose() lives at cli/v4/design/tokens.ts.
+        //
+        // v4.8.0 Slice 11 — if opts.warn is explicitly injected, always
+        // forward (tests + advanced callers register their own sink and
+        // expect every message). The AIDEN_VERBOSE gate now applies only
+        // to the default console.warn fallback that end-users see.
+        if (this.opts.warn) {
+            this.opts.warn(msg);
+            return;
+        }
+        if (process.env.AIDEN_VERBOSE !== '1')
+            return;
+        console.warn(`[auxiliary] ${msg}`);
     }
     async withTimeout(p, ms) {
         return new Promise((resolve, reject) => {

package/dist/core/v4/daemon/dispatcher/realAgentRunner.js CHANGED Viewed

@@ -177,14 +177,19 @@ function createRealAgentRunner(opts) {
             let invocationError = null;
             try {
                 result = await agent.runConversation(history, {
-                // The agent honours its own abort signal via per-tool aborts;
-                // tools that respect AbortSignal (shell_exec, fetch_*) will
-                // bail when perTurnWatcher trips.
-                //
-                // Note: runConversation doesn't currently take an abort
-                // signal in its options — the budget watcher is best-effort
-                // observability via tally(). Future enhancement: thread the
-                // signal into the loop body via options.
+                    // The agent honours its own abort signal via per-tool aborts;
+                    // tools that respect AbortSignal (shell_exec, fetch_*) will
+                    // bail when perTurnWatcher trips.
+                    //
+                    // Note: runConversation doesn't currently take an abort
+                    // signal in its options — the budget watcher is best-effort
+                    // observability via tally(). Future enhancement: thread the
+                    // signal into the loop body via options.
+                    //
+                    // v4.8.0 Phase 2.2 — uiOnly events on the daemon side are
+                    // dropped here. Phase 2.4 will serialize them into the
+                    // dispatcher's run_events stream.
+                    onUiEvent: () => { },
                 });
                 // Stamp the actual token usage onto the watcher for the
                 // post-turn snapshot below.

package/dist/core/v4/promptBuilder.js CHANGED Viewed

@@ -131,6 +131,42 @@ const EXECUTION_DISCIPLINE_PROSE = [
     'result. When the user requests an action, take it. When the user requests',
     'discussion, discuss.',
 ].join('\n');
+/**
+ * v4.8.0 Phase 2.6 — UI events nudge. Without this, the model only
+ * emits ui_* tools when explicitly told to (e.g. "call ui_task_update
+ * with ..."). With it, events fire during normal multi-step work —
+ * research, file creation, test runs, command execution. Always-on:
+ * every model that sees the ui_* tools benefits.
+ */
+const UI_EVENTS_GUIDANCE = [
+    '## UI events',
+    '',
+    'When doing multi-step work, emit structured progress signals INSTEAD OF',
+    'writing them as text. The user sees these as inline rows separate from',
+    'your prose reply.',
+    '',
+    'WRONG (do NOT do this):',
+    '  "✓ Done — found 3 results"',
+    '  "⟳ Searching the web..."',
+    '  "Created hello.py"',
+    '',
+    'RIGHT:',
+    '  ui_task_update {task_id, label, status: "running"}',
+    '  ui_task_done   {task_id, status: "success", summary}',
+    '  ui_artifact_created {path, kind: "file", preview}',
+    '',
+    'When to fire each:',
+    '- ui_task_update + ui_task_done for any multi-step task (pair them by task_id)',
+    '- ui_command_result after shell_exec when the output is interesting',
+    '- ui_test_result after running tests',
+    '- ui_toast for transient notices (e.g. "switched to dark mode")',
+    '- ui_artifact_created when you create or modify a file/skill',
+    '- ui_approval_request fires automatically for risky tools — NEVER emit it manually',
+    '',
+    'Markdown text in your reply is for explanation, not status. Status goes',
+    'through events. Skip events entirely on single-shot queries that aren\'t',
+    'multi-step work.',
+].join('\n');
 /**
  * Llama-3.3-specific tool-call format guard. Adapter-side recovery picks
  * up failures, but we'd rather avoid the 400 round-trip.
@@ -358,6 +394,15 @@ class PromptBuilder {
                 optional: true,
             });
         }
+        // ── 6.6. UI events nudge (v4.8.0 Phase 2.6) ───────────────────────
+        // Unconditional like execution discipline — every model that sees
+        // the ui_* tools benefits. Teaches structured-event emission for
+        // multi-step work instead of relying on text status formatting.
+        slots.push({
+            name: 'uiEvents',
+            content: UI_EVENTS_GUIDANCE,
+            optional: true,
+        });
         // ── 7. Iteration budget ───────────────────────────────────────────
         if (opts.initialBudget) {
             const { used, max } = opts.initialBudget;

package/dist/core/v4/subagent/childBuilder.js CHANGED Viewed

@@ -199,6 +199,7 @@ function buildChildAgent(deps, input) {
         resolveVerifiedFlag: deps.resolveVerifiedFlag,
         resolveToolset: deps.resolveToolset,
         resolveMutates: deps.resolveMutates,
+        resolveUiOnly: deps.resolveUiOnly,
         honestyEnforcement: childHonestyEnforcement,
         onToolCall,
         // iterationBudgetInjection inherits the default (true) — child

package/dist/core/v4/subagent/spawnSubAgent.js CHANGED Viewed

@@ -190,7 +190,13 @@ async function spawnSubAgent(spec, deps, ctx) {
     let tokensIn = 0;
     let tokensOut = 0;
     try {
-        const result = await agentBundle.agent.runConversation(agentBundle.history, { signal: childCtrl.signal });
+        const result = await agentBundle.agent.runConversation(agentBundle.history, {
+            signal: childCtrl.signal,
+            // v4.8.0 Phase 2.2 — uiOnly events from a subagent are
+            // dropped. Subagents have no chat surface; the parent
+            // assembles their summary. Stub stays a no-op forever.
+            onUiEvent: () => { },
+        });
         apiCalls = result.turnCount; // one provider call per turn
         tokensIn = result.totalUsage.inputTokens;
         tokensOut = result.totalUsage.outputTokens;

package/dist/core/v4/ui/banner.js CHANGED Viewed

@@ -90,29 +90,29 @@ function renderBanner(opts) {
         out.push('');
         return out.join('\n') + '\n';
     }
-    // Wide layout: framed panel with ASCII art inside, taglines below.
+    // v4.8.0 Slice 10b — wide layout flows the AIDEN art without the
+    // heavy `╔══╗` frame (legacy chrome). The art carries its own
+    // visual weight as the boot-card identity anchor; framing it
+    // inside a closed box collides with the asymmetric orange-bar
+    // language used by every other v4.8.0 surface.
+    //
+    // v4.8.0 Slice 10c — emit raw 24-bit truecolor for the AIDEN art
+    // instead of routing through `c.primary` (which depth-detects via
+    // theme.ts and degrades to 256-color or 16-color when COLORTERM is
+    // unset — common on Windows ConPTY). Result on those terminals was
+    // a washed-out / grey AIDEN that didn't match the boot card's
+    // skinEngine-painted brand orange. Forcing truecolor here brings
+    // disclaimer + setupWizard banner in line with the boot card.
+    const ORANGE_ON = '\x1b[38;2;255;107;53m';
+    const COLOR_OFF = '\x1b[39m';
     const inner = w - 2;
     const artPad = Math.max(0, Math.floor((inner - ART_WIDTH) / 2));
-    const framed = opts.framed !== false;
-    const horiz = '═'.repeat(inner);
-    const top = framed ? theme_1.c.rule(`╔${horiz}╗`) : '';
-    const bottom = framed ? theme_1.c.rule(`╚${horiz}╝`) : '';
-    const blank = framed
-        ? `${theme_1.c.rule('║')}${' '.repeat(inner)}${theme_1.c.rule('║')}`
-        : ' '.repeat(w);
     const lines = [];
     lines.push('');
-    if (framed)
-        lines.push(top);
-    lines.push(blank);
     for (const row of AIDEN_ART) {
         const padded = rpad(' '.repeat(artPad) + row, inner);
-        const coloured = theme_1.c.primary(padded);
-        lines.push(framed ? `${theme_1.c.rule('║')}${coloured}${theme_1.c.rule('║')}` : `  ${coloured}`);
+        lines.push(`  ${ORANGE_ON}${padded}${COLOR_OFF}`);
     }
-    lines.push(blank);
-    if (framed)
-        lines.push(bottom);
     lines.push('');
     lines.push('  ' + (0, theme_1.dim)(theme_1.c.muted(versionLine)));
     lines.push('');

package/dist/core/version.js CHANGED Viewed

@@ -2,4 +2,4 @@
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.VERSION = void 0;
 // AUTO-GENERATED by scripts/inject-version.js — do not edit by hand
-exports.VERSION = '4.7.0';
+exports.VERSION = '4.8.0';

package/dist/moat/approvalEngine.js CHANGED Viewed

@@ -237,6 +237,20 @@ class ApprovalEngine {
             this.callbacks.onDecision?.(req, 'deny');
             return false;
         }
+        // v4.8.0 Phase 2.5 — emit a structured ui_approval_request event
+        // BEFORE the y/n prompt fires. Additive: the display layer paints
+        // the gutter-integrated row, then the existing promptUser flow
+        // runs unchanged. Moat-tier (safe/caution/dangerous) maps to the
+        // ui schema's 4-tier scale; 'critical' is reserved for future
+        // wiring and unreachable from this path.
+        const uiTier = req.riskTier === 'safe' ? 'low' :
+            req.riskTier === 'dangerous' ? 'high' : 'medium';
+        const argsPreview = JSON.stringify(req.args).slice(0, 80);
+        this.callbacks.onUiEvent?.('ui_approval_request', {
+            prompt: `${req.toolName} ${argsPreview}`,
+            risk_tier: uiTier,
+            reason: req.reason,
+        });
         const decision = await this.callbacks.promptUser(req);
         this.callbacks.onDecision?.(req, decision);
         if (decision === 'deny')

package/dist/tools/v4/index.js CHANGED Viewed

@@ -246,6 +246,60 @@ function registerWriteTools(registry) {
 function registerAllTools(registry) {
     registerReadOnlyTools(registry);
     registerWriteTools(registry);
+    // v4.8.0 Phase 2.2 — register the 7 semantic ui_* event tools.
+    // All uiOnly: true → the dispatch loop in core/v4/aidenAgent.ts
+    // bypasses execute and fires onUiEvent on the caller. execute()
+    // throws as a safety guard: if the uiOnly branch ever misfires
+    // and an executor is reached, that's a wiring bug, not a render.
+    // Renderer is a no-op stub in this phase; Phase 2.3 lands chrome.
+    const ui = (name, description, properties, required) => ({
+        schema: { name, description, inputSchema: { type: 'object', properties, required } },
+        execute: async () => { throw new Error(`${name} is uiOnly — dispatch branch should bypass execute`); },
+        category: 'read', mutates: false, uiOnly: true,
+    });
+    const str = { type: 'string' };
+    const num = { type: 'number' };
+    registry.register(ui('ui_task_update', 'Signal current task state for the live task panel. Append-only stream.', { task_id: str, label: { type: 'string', description: '≤80 chars' },
+        status: { type: 'string', enum: ['running', 'blocked', 'paused'] },
+        kind: { type: 'string', enum: ['task', 'subagent'] }, depth: num, parent_id: str }, ['task_id', 'label', 'status']));
+    registry.register(ui('ui_task_done', 'Signal a task is complete. Pairs with a prior ui_task_update.', { task_id: str, status: { type: 'string', enum: ['success', 'failure', 'blocked'] },
+        summary: { type: 'string', description: 'Optional, ≤120 chars' } }, ['task_id', 'status']));
+    registry.register(ui('ui_command_result', 'Surface shell output as a formatted block.', { command: str, stdout: str, stderr: str, exit_code: num }, ['command']));
+    registry.register(ui('ui_test_result', 'Pass/fail count after a test run.', { framework: { type: 'string', description: 'e.g. "vitest", "pytest"' },
+        passed: num, failed: num, skipped: num, duration_ms: num }, ['framework', 'passed', 'failed']));
+    registry.register(ui('ui_approval_request', 'Structured approval prompt before a privileged action.', { prompt: { type: 'string', description: '≤160 chars' },
+        risk_tier: { type: 'string', enum: ['low', 'medium', 'high', 'critical'] },
+        reason: { type: 'string', description: 'Optional, ≤200 chars' } }, ['prompt', 'risk_tier']));
+    registry.register(ui('ui_toast', 'Transient notice to surface without interrupting flow.', { message: { type: 'string', description: '≤120 chars' },
+        kind: { type: 'string', enum: ['info', 'success', 'warning', 'error'] } }, ['message', 'kind']));
+    registry.register(ui('ui_artifact_created', 'Surface a file or skill created/modified this turn.', { path: str, kind: { type: 'string', enum: ['file', 'skill', 'directory'] },
+        preview: { type: 'string', description: 'Optional, ≤200 chars' } }, ['path', 'kind']));
+    // v4.8.0 Phase 2.1 — env-gated uiOnly smoke stub. Never registers
+    // in production. Set AIDEN_TEST_UI_STUB=1 to enable for the
+    // dispatch-branch smoke harness. The execute() throws on purpose:
+    // if the uiOnly branch is wired correctly the model can never
+    // reach the executor.
+    if (process.env.AIDEN_TEST_UI_STUB === '1') {
+        registry.register({
+            schema: {
+                name: '_test_ui_stub',
+                description: 'Test-only uiOnly stub for v4.8.0 Phase 2.1 smoke. Set AIDEN_TEST_UI_STUB=1 to enable.',
+                inputSchema: {
+                    type: 'object',
+                    properties: {
+                        message: { type: 'string', description: 'Arbitrary message to echo via onUiEvent' },
+                    },
+                    required: ['message'],
+                },
+            },
+            execute: async () => {
+                throw new Error('_test_ui_stub should never execute — uiOnly branch should bypass it');
+            },
+            category: 'read',
+            mutates: false,
+            uiOnly: true,
+        });
+    }
 }
 var subagentFanout_2 = require("./subagent/subagentFanout");
 Object.defineProperty(exports, "makeSubagentFanoutTool", { enumerable: true, get: function () { return subagentFanout_2.makeSubagentFanoutTool; } });

package/dist/tools/v4/subagent/spawnSubAgentTool.js CHANGED Viewed

@@ -289,6 +289,19 @@ function makeSpawnSubAgentTool(factory) {
             // ── 3. Resolve optional parent run / session identifiers ─────────────
             const parentRunId = factory.resolveParentRunId?.();
             const parentSessionId = factory.resolveParentSessionId?.();
+            // v4.8.0 Phase 2.5 — emit ui_task_update for the subagent start.
+            // Stable task_id correlates with the matching ui_task_done emit
+            // after the spawnSubAgent call returns. depth:1 hardcoded today
+            // — childBuilder caps recursion at 1 (see SUBAGENT_BLOCKED_TOOL_NAMES
+            // 'spawn_sub_agent'). TODO: thread real depth when nested spawns ship.
+            const subTaskId = `subagent-${Date.now()}-${Math.random().toString(36).slice(2, 8)}`;
+            factory.onUiEvent?.('ui_task_update', {
+                task_id: subTaskId,
+                label: goalPreview,
+                status: 'running',
+                kind: 'subagent',
+                depth: 1,
+            });
             // ── 4. Invoke the primitive. NEVER throws — always envelope. ─────────
             const result = await (0, spawnSubAgent_1.spawnSubAgent)(spec, {
                 // ChildBuilderDeps fields:
@@ -310,6 +323,16 @@ function makeSpawnSubAgentTool(factory) {
                 parentRunId,
                 parentSessionId,
             });
+            // v4.8.0 Phase 2.5 — emit ui_task_done with the same subTaskId
+            // so the display layer can finalize the in-flight row.
+            const doneStatus = result.ok ? 'success' :
+                result.status === 'interrupted' ? 'blocked' :
+                    result.status === 'timeout' ? 'blocked' : 'failure';
+            factory.onUiEvent?.('ui_task_done', {
+                task_id: subTaskId,
+                status: doneStatus,
+                summary: `${result.metrics.apiCalls} calls · ${result.exitReason}`,
+            });
             // Completion log — pairs with "spawn_sub_agent invoked" so a
             // grep on parentSessionId surfaces invoke → complete in order.
             logger.info('spawn_sub_agent completed', {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "aiden-runtime",
-  "version": "4.7.0",
+  "version": "4.8.0",
   "publishConfig": {
     "access": "public"
   },