npm - @aitne/daemon - Versions diffs - 0.1.10 → 0.1.11 - Mend

@aitne/daemon 0.1.10 → 0.1.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (305)

package/dist/adapters/adapter-watchdog.d.ts +70 -0
package/dist/adapters/adapter-watchdog.js +115 -0
package/dist/adapters/discord.d.ts +17 -1
package/dist/adapters/discord.js +33 -0
package/dist/adapters/notification-manager.d.ts +27 -1
package/dist/adapters/notification-manager.js +54 -39
package/dist/adapters/slack-adapter.d.ts +26 -1
package/dist/adapters/slack-adapter.js +41 -0
package/dist/adapters/telegram-adapter.d.ts +18 -1
package/dist/adapters/telegram-adapter.js +41 -2
package/dist/adapters/types.d.ts +20 -0
package/dist/adapters/whatsapp-adapter.d.ts +26 -7
package/dist/adapters/whatsapp-adapter.js +74 -21
package/dist/api/env-writer.js +8 -5
package/dist/api/helpers/agent-errors-registry.d.ts +5 -5
package/dist/api/helpers/agent-errors-registry.js +5 -5
package/dist/api/routes/agent.js +33 -12
package/dist/api/routes/agents/index.js +75 -16
package/dist/api/routes/agents/views.d.ts +37 -2
package/dist/api/routes/agents/views.js +64 -2
package/dist/api/routes/background-task.d.ts +22 -0
package/dist/api/routes/background-task.js +338 -0
package/dist/api/routes/browser-history.js +9 -1
package/dist/api/routes/context/permissions.js +3 -2
package/dist/api/routes/context/snapshots.js +0 -3
package/dist/api/routes/context/write.js +3 -17
package/dist/api/routes/dashboard/config.js +48 -12
package/dist/api/routes/dashboard/cost-approvals.js +66 -0
package/dist/api/routes/dashboard/notifications.js +9 -9
package/dist/api/routes/integrations/crud-patch.js +5 -1
package/dist/api/routes/integrations-reconcile.js +2 -2
package/dist/api/routes/notion.d.ts +1 -1
package/dist/api/routes/observations.js +7 -7
package/dist/api/routes/obsidian.d.ts +1 -1
package/dist/api/routes/receipts.js +5 -1
package/dist/api/routes/setup-migrate.js +1 -1
package/dist/api/routes/setup.js +1 -1
package/dist/api/routes/task-flows.d.ts +1 -1
package/dist/api/routes/task-flows.js +1 -1
package/dist/api/routes/tuning.d.ts +29 -0
package/dist/api/routes/tuning.js +304 -0
package/dist/api/server.d.ts +44 -16
package/dist/api/server.js +9 -0
package/dist/bootstrap/adapters.d.ts +19 -0
package/dist/bootstrap/adapters.js +61 -0
package/dist/bootstrap/api.d.ts +5 -3
package/dist/bootstrap/api.js +45 -13
package/dist/bootstrap/catchup.d.ts +1 -1
package/dist/bootstrap/catchup.js +11 -11
package/dist/bootstrap/event-pipeline.d.ts +11 -0
package/dist/bootstrap/event-pipeline.js +245 -7
package/dist/bootstrap/observers.js +9 -6
package/dist/bootstrap/schedule-helpers.d.ts +104 -6
package/dist/bootstrap/schedule-helpers.js +172 -19
package/dist/config.js +26 -12
package/dist/core/agent-core.d.ts +33 -1
package/dist/core/agent-core.js +36 -1
package/dist/core/agents/activity-scan-cadence.d.ts +103 -0
package/dist/core/agents/activity-scan-cadence.js +127 -0
package/dist/core/agents/agent-route-override.d.ts +53 -0
package/dist/core/agents/agent-route-override.js +69 -0
package/dist/core/agents/builtin-registry.d.ts +51 -14
package/dist/core/agents/builtin-registry.js +92 -15
package/dist/core/agents/config-gate-reconcile.d.ts +38 -0
package/dist/core/agents/config-gate-reconcile.js +51 -0
package/dist/core/agents/cron-substitute.d.ts +1 -1
package/dist/core/agents/cron-substitute.js +1 -1
package/dist/core/agents/custom-routine-migration.d.ts +60 -0
package/dist/core/agents/custom-routine-migration.js +149 -0
package/dist/core/agents/firing-blocked.d.ts +1 -1
package/dist/core/agents/hourly-cadence.d.ts +102 -0
package/dist/core/agents/hourly-cadence.js +126 -0
package/dist/core/agents/loader-boot.js +23 -0
package/dist/core/agents/loader.d.ts +19 -0
package/dist/core/agents/loader.js +34 -2
package/dist/core/agents/override-merge.d.ts +1 -1
package/dist/core/agents/override-merge.js +9 -1
package/dist/core/agents/recurrence-convert.d.ts +1 -1
package/dist/core/agents/recurrence-convert.js +1 -1
package/dist/core/agents/recurring-schedule-adapter.js +8 -0
package/dist/core/alerts.js +6 -6
package/dist/core/backends/auth-health-monitor.d.ts +2 -2
package/dist/core/backends/auth-health-monitor.js +1 -1
package/dist/core/backends/backend-router.d.ts +27 -1
package/dist/core/backends/backend-router.js +165 -1
package/dist/core/backends/claude-code-core.d.ts +71 -31
package/dist/core/backends/claude-code-core.js +282 -54
package/dist/core/backends/cli-quota-guards.d.ts +29 -1
package/dist/core/backends/cli-quota-guards.js +40 -5
package/dist/core/backends/codex-core.d.ts +6 -0
package/dist/core/backends/codex-core.js +22 -6
package/dist/core/backends/failure-spend.d.ts +58 -0
package/dist/core/backends/failure-spend.js +137 -0
package/dist/core/backends/gemini-cli-core.d.ts +6 -0
package/dist/core/backends/gemini-cli-core.js +25 -6
package/dist/core/backends/model-registry.d.ts +1 -1
package/dist/core/backends/model-registry.js +4 -4
package/dist/core/backends/opencode-core.d.ts +1 -1
package/dist/core/backends/opencode-core.js +5 -5
package/dist/core/backends/plan-presets.js +39 -15
package/dist/core/bang-commands/commands-cost.js +3 -1
package/dist/core/bang-commands/commands-report.js +4 -3
package/dist/core/bang-commands/commands-research.js +4 -1
package/dist/core/bang-commands/commands-revert-tuning.d.ts +18 -0
package/dist/core/bang-commands/commands-revert-tuning.js +63 -0
package/dist/core/bang-commands/commands-stop-start.js +3 -3
package/dist/core/bang-commands/commands-task-control.d.ts +19 -0
package/dist/core/bang-commands/commands-task-control.js +147 -0
package/dist/core/bang-commands/commands-wiki.js +5 -5
package/dist/core/bang-commands/index.d.ts +2 -0
package/dist/core/bang-commands/index.js +12 -0
package/dist/core/bang-commands/registry.d.ts +12 -0
package/dist/core/browser-history/research-cluster-fanout.d.ts +28 -14
package/dist/core/browser-history/research-cluster-fanout.js +39 -16
package/dist/core/channel-timeline.d.ts +5 -1
package/dist/core/channel-timeline.js +13 -0
package/dist/core/context/index-reconciler.js +5 -2
package/dist/core/context/policy-index-reconciler.d.ts +6 -4
package/dist/core/context/policy-index-runner.js +25 -6
package/dist/core/context-builder-calendar.js +10 -2
package/dist/core/context-builder-conversation.d.ts +8 -1
package/dist/core/context-builder-conversation.js +41 -7
package/dist/core/context-builder-yesterday.js +4 -3
package/dist/core/context-builder.d.ts +7 -2
package/dist/core/context-builder.js +62 -20
package/dist/core/context-file-serializer.d.ts +1 -1
package/dist/core/context-file-serializer.js +1 -1
package/dist/core/context-health.js +2 -2
package/dist/core/context-paths.d.ts +1 -1
package/dist/core/context-paths.js +1 -1
package/dist/core/context-validation/prepare-write.js +1 -1
package/dist/core/context-validation/routine-rulebook.d.ts +1 -1
package/dist/core/context-vault-aliases.d.ts +0 -13
package/dist/core/context-vault-aliases.js +37 -0
package/dist/core/custom-routines.d.ts +99 -0
package/dist/core/custom-routines.js +187 -0
package/dist/core/daemon-api-cli.js +49 -0
package/dist/core/day-boundary.d.ts +46 -0
package/dist/core/day-boundary.js +40 -0
package/dist/core/dispatcher-activity-scan.d.ts +221 -0
package/dist/core/dispatcher-activity-scan.js +775 -0
package/dist/core/dispatcher-error-handling.d.ts +6 -11
package/dist/core/dispatcher-error-handling.js +38 -62
package/dist/core/dispatcher-hourly-check.js +6 -1
package/dist/core/dispatcher-message-handler.d.ts +10 -0
package/dist/core/dispatcher-message-handler.js +17 -0
package/dist/core/dispatcher-morning-routine.d.ts +6 -6
package/dist/core/dispatcher-morning-routine.js +13 -13
package/dist/core/dispatcher-result-processor.d.ts +33 -0
package/dist/core/dispatcher-result-processor.js +167 -11
package/dist/core/dispatcher-scheduled-background-task.d.ts +42 -0
package/dist/core/dispatcher-scheduled-background-task.js +89 -0
package/dist/core/dispatcher-scheduled-tasks.d.ts +63 -1
package/dist/core/dispatcher-scheduled-tasks.js +213 -6
package/dist/core/dispatcher-task-delivery.d.ts +105 -0
package/dist/core/dispatcher-task-delivery.js +555 -0
package/dist/core/dispatcher-types.d.ts +48 -9
package/dist/core/dispatcher-types.js +3 -3
package/dist/core/dispatcher.d.ts +112 -31
package/dist/core/dispatcher.js +284 -59
package/dist/core/dm-freshness-metrics.d.ts +1 -1
package/dist/core/drift-effects.js +2 -2
package/dist/core/feedback/consolidation-prep.js +17 -5
package/dist/core/feedback/eviction-scorer.js +6 -2
package/dist/core/feedback/lesson-format.js +9 -4
package/dist/core/feedback/lesson-injection.d.ts +1 -1
package/dist/core/feedback/lesson-injection.js +17 -2
package/dist/core/feedback/lesson-store-overview.d.ts +8 -4
package/dist/core/feedback/lesson-store-overview.js +8 -4
package/dist/core/feedback/regeneralization-prep.js +29 -16
package/dist/core/feedback/self-performance-prep.d.ts +186 -0
package/dist/core/feedback/self-performance-prep.js +541 -0
package/dist/core/feedback/tuning-actuator.d.ts +198 -0
package/dist/core/feedback/tuning-actuator.js +432 -0
package/dist/core/feedback/tuning-recommender.d.ts +247 -0
package/dist/core/feedback/tuning-recommender.js +580 -0
package/dist/core/feedback/tuning-revert-monitor.d.ts +90 -0
package/dist/core/feedback/tuning-revert-monitor.js +213 -0
package/dist/core/health-monitor.d.ts +6 -0
package/dist/core/health-monitor.js +1 -1
package/dist/core/injection-policy.d.ts +4 -4
package/dist/core/injection-policy.js +4 -4
package/dist/core/integration-main-backend.js +4 -0
package/dist/core/management-md.d.ts +2 -2
package/dist/core/management-md.js +51 -13
package/dist/core/morning/orchestrator.d.ts +2 -2
package/dist/core/morning/orchestrator.js +2 -2
package/dist/core/notification-gate.d.ts +64 -0
package/dist/core/notification-gate.js +51 -0
package/dist/core/notification-rate-limit.d.ts +40 -0
package/dist/core/notification-rate-limit.js +50 -0
package/dist/core/policy-files.d.ts +1 -1
package/dist/core/policy-files.js +2 -2
package/dist/core/pre-pass-freshness.d.ts +4 -4
package/dist/core/retention.d.ts +5 -0
package/dist/core/retention.js +20 -4
package/dist/core/review-context.d.ts +1 -1
package/dist/core/review-context.js +10 -5
package/dist/core/roadmap-write-lock.d.ts +2 -1
package/dist/core/roadmap-write-lock.js +15 -10
package/dist/core/routine-acquisition-plan.d.ts +47 -1
package/dist/core/routine-acquisition-plan.js +78 -20
package/dist/core/routine-fetch-window-retry.js +7 -4
package/dist/core/routine-fetch-window-runner.d.ts +39 -3
package/dist/core/routine-fetch-window-runner.js +264 -13
package/dist/core/routine-windows.d.ts +2 -2
package/dist/core/routine-windows.js +8 -5
package/dist/core/scheduler.d.ts +175 -16
package/dist/core/scheduler.js +559 -102
package/dist/core/signal-detector.d.ts +12 -0
package/dist/core/signal-detector.js +53 -9
package/dist/core/skills-compiler-denied-tools.js +2 -2
package/dist/core/skills-compiler-skill-index.d.ts +2 -2
package/dist/core/skills-compiler-skill-index.js +2 -2
package/dist/core/skills-compiler-variants.d.ts +1 -1
package/dist/core/skills-compiler-variants.js +8 -0
package/dist/core/skills-compiler.d.ts +29 -26
package/dist/core/skills-compiler.js +117 -81
package/dist/core/skills-manifest.d.ts +37 -0
package/dist/core/skills-manifest.js +73 -2
package/dist/core/sleep-inhibitor.d.ts +79 -0
package/dist/core/sleep-inhibitor.js +132 -0
package/dist/core/slim-system-prompt-loader.d.ts +77 -0
package/dist/core/slim-system-prompt-loader.js +141 -0
package/dist/core/spawn-gates.d.ts +126 -0
package/dist/core/spawn-gates.js +180 -0
package/dist/core/today-direct-writer.d.ts +2 -2
package/dist/core/today-direct-writer.js +1 -1
package/dist/core/today-write-lock.d.ts +4 -2
package/dist/core/today-write-lock.js +30 -20
package/dist/core/wake-detector.d.ts +55 -0
package/dist/core/wake-detector.js +80 -0
package/dist/core/wiki/compile-lock.d.ts +1 -1
package/dist/core/wiki/compile-lock.js +1 -1
package/dist/core/workdir.js +15 -6
package/dist/db/activity-scan-signals.d.ts +77 -0
package/dist/db/activity-scan-signals.js +378 -0
package/dist/db/agents-store.d.ts +28 -0
package/dist/db/agents-store.js +62 -0
package/dist/db/background-task-clarifications-store.d.ts +81 -0
package/dist/db/background-task-clarifications-store.js +152 -0
package/dist/db/background-task-store.d.ts +207 -0
package/dist/db/background-task-store.js +380 -0
package/dist/db/browser-history-store.d.ts +39 -6
package/dist/db/browser-history-store.js +51 -7
package/dist/db/browser-task-clarifications-store.d.ts +12 -0
package/dist/db/browser-task-clarifications-store.js +35 -5
package/dist/db/browser-task-store.d.ts +3 -0
package/dist/db/browser-task-store.js +29 -4
package/dist/db/deferred-dm.d.ts +86 -0
package/dist/db/deferred-dm.js +199 -0
package/dist/db/migrations.js +330 -0
package/dist/db/observations.d.ts +2 -2
package/dist/db/observations.js +3 -3
package/dist/db/schema.js +217 -16
package/dist/db/voice-transcripts-store.d.ts +1 -1
package/dist/index.js +86 -29
package/dist/messaging/browser-task-mcp-notifier.d.ts +12 -70
package/dist/messaging/browser-task-mcp-notifier.js +30 -151
package/dist/messaging/browser-task-screenshot-attachment.d.ts +15 -0
package/dist/messaging/browser-task-screenshot-attachment.js +63 -0
package/dist/observers/delegated-sync-worker.d.ts +6 -6
package/dist/observers/delegated-sync-worker.js +10 -10
package/dist/observers/git-delegated-cron.d.ts +1 -1
package/dist/observers/git-delegated-cron.js +2 -2
package/dist/observers/github-poller-classifier.d.ts +3 -3
package/dist/observers/github-poller-classifier.js +3 -3
package/dist/observers/imminent-event-scheduler.d.ts +1 -1
package/dist/observers/imminent-event-scheduler.js +1 -1
package/dist/observers/mail-poller.d.ts +1 -0
package/dist/observers/mail-poller.js +42 -3
package/dist/observers/observation-summarizer/summarizer-client.d.ts +2 -2
package/dist/observers/observation-summarizer/summarizer-client.js +2 -2
package/dist/observers/observation-summarizer/worker.d.ts +2 -2
package/dist/observers/observation-summarizer/worker.js +4 -4
package/dist/observers/obsidian-watcher.d.ts +1 -1
package/dist/observers/obsidian-watcher.js +1 -1
package/dist/safety/agent-write-tracker.d.ts +4 -4
package/dist/safety/agent-write-tracker.js +4 -4
package/dist/safety/audit.d.ts +43 -5
package/dist/safety/audit.js +86 -18
package/dist/safety/risk-classifier.d.ts +6 -0
package/dist/safety/risk-classifier.js +75 -11
package/dist/scheduler/activity-scan-gate.d.ts +86 -0
package/dist/scheduler/activity-scan-gate.js +132 -0
package/dist/services/background-task/background-task-budget.d.ts +80 -0
package/dist/services/background-task/background-task-budget.js +91 -0
package/dist/services/background-task/background-task-driver.d.ts +105 -0
package/dist/services/background-task/background-task-driver.js +416 -0
package/dist/services/background-task/background-task-runner.d.ts +96 -0
package/dist/services/background-task/background-task-runner.js +673 -0
package/dist/services/background-task/background-task-tools.d.ts +84 -0
package/dist/services/background-task/background-task-tools.js +247 -0
package/dist/services/background-task/background-task-transition-events.d.ts +43 -0
package/dist/services/background-task/background-task-transition-events.js +54 -0
package/dist/services/browser-history/automation/egress-denylist.d.ts +1 -1
package/dist/services/browser-history/automation/egress-denylist.js +16 -6
package/dist/services/browser-history/managed-chromium/sandbox-launcher.js +0 -1
package/dist/services/browser-task/browser-task-runner.js +53 -8
package/dist/services/observations-batch.d.ts +1 -1
package/dist/services/observations-batch.js +2 -2
package/dist/settings/runtime-settings.d.ts +38 -11
package/dist/settings/runtime-settings.js +203 -40
package/dist/settings/settings-store.js +11 -3
package/package.json +4 -4

package/dist/core/backends/codex-core.js CHANGED

@@ -16,7 +16,7 @@ import { buildDaemonApiCliEnv } from "../daemon-api-cli.js";
 import { noteNativeSkillToolIfPresent, probeCliNativeSkillSubcommand, } from "./native-skill-discovery-probe.js";
 import { createOutputCapturePath, CliPathCache, parseJsonLine, readFileIfExists, removeFileIfExists, runLineCommand, } from "./cli-utils.js";
 import { probeApiKeyServerSide } from "./api-key-probe.js";
-import { assertCostWithinMaxBudget, assertPromptCostWithinMaxBudget, classifyCliFailure, } from "./cli-quota-guards.js";
+import { assertCostWithinMaxBudget, assertPromptCostWithinMaxBudget, classifyCliFailure, recoverCliFailureSpend, } from "./cli-quota-guards.js";
 import { auditStreamObservation, extractCodexShellCall, } from "../../safety/subprocess-block-scanner.js";
 import { extractSilentApiErrors, logSilentApiErrors, } from "./silent-api-error-detector.js";
 import { findRegisteredModel, getModelsForBackend, latestLiteFor, } from "./model-registry.js";
@@ -43,7 +43,7 @@ const EMPTY_USAGE = {
  * The delegated path already had this guard (see the `runDelegatedTool`
  * wiring lower in this file); the reactive path needs it explicitly
  * because a single hung subprocess can pin a session for the full
- * executeTimeoutMinutes wall-clock, blocking morning-routine / hourly-check
+ * executeTimeoutMinutes wall-clock, blocking morning-routine / activity-scan
  * dispatch downstream.
  */
 const REACTIVE_IDLE_TIMEOUT_MS = 5 * 60 * 1000;
@@ -669,12 +669,12 @@ export class CodexCore {
             // we still throw a `timeout` failure here because that matches
             // the dispatcher's retry semantics.
             if (idleTimedOut) {
-                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Codex reactive stream went idle for ${REACTIVE_IDLE_TIMEOUT_MS}ms (no events from CLI subprocess)`));
+                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Codex reactive stream went idle for ${REACTIVE_IDLE_TIMEOUT_MS}ms (no events from CLI subprocess)`), this.recoverFailureSpend(usage, actualModelId, numTurns, startMs));
                 logger.error({ err, eventType: params.eventType, model: params.modelId, durationMs: Date.now() - startMs }, "Codex execute idle-timed-out");
                 throw err;
             }
             if (runResult.timedOut) {
-                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Codex execution exceeded timeout of ${this.config.executeTimeoutMinutes} minutes`));
+                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Codex execution exceeded timeout of ${this.config.executeTimeoutMinutes} minutes`), this.recoverFailureSpend(usage, actualModelId, numTurns, startMs));
                 logger.error({ err, eventType: params.eventType, model: params.modelId, durationMs: Date.now() - startMs }, "Codex execute timed out");
                 throw err;
             }
@@ -723,7 +723,7 @@ export class CodexCore {
                 ?? firstFailureLine(runResult.stdoutLines);
             if (!sawCompletion || runResult.exitCode !== 0) {
                 const failureMsg = combinedFailure ?? "Codex execution did not complete successfully.";
-                const classified = this.classifyFailure(failureMsg);
+                const classified = this.classifyFailure(failureMsg, this.recoverFailureSpend(usage, actualModelId, numTurns, startMs));
                 logger.error({ err: classified, eventType: params.eventType, model: params.modelId, exitCode: runResult.exitCode, durationMs: Date.now() - startMs }, "Codex execute failed");
                 throw classified;
             }
@@ -943,13 +943,29 @@ export class CodexCore {
     // Gemini CLI core; the logic lives in `cli-quota-guards.ts` (single source
     // of truth) and each backend passes its own regexes / label. See that
     // module for the full ordering rationale.
-    classifyFailure(message) {
+    classifyFailure(message, spend) {
         return classifyCliFailure({
             backendId: this.backendId,
             message,
             // OpenAI surfaces quota exhaustion as "rate limit" / "usage limit" / "quota".
             rateLimitPattern: /rate limit|usage limit|quota/i,
             authPattern: /unauthorized|forbidden|api key|login/i,
+            ...(spend !== undefined ? { spend } : {}),
+        });
+    }
+    /**
+     * PREPASS_COST_REDUCTION_PLAN.md N1 — spend recovered from the failed
+     * run's JSONL usage so terminal errors carry what the provider already
+     * billed. Null when the stream never reported usage.
+     */
+    recoverFailureSpend(usage, modelId, numTurns, startMs) {
+        return recoverCliFailureSpend({
+            backendId: this.backendId,
+            priceFetcher: this.priceFetcher,
+            usage,
+            modelId,
+            numTurns,
+            durationMs: Date.now() - startMs,
         });
     }
     assertWithinMaxBudget(costUsd, maxBudgetUsd, modelId, spend) {

package/dist/core/backends/failure-spend.d.ts ADDED

@@ -0,0 +1,58 @@
+/**
+ * PREPASS_COST_REDUCTION_PLAN.md N1 — shared post-hoc failure-spend
+ * recording.
+ *
+ * A backend attempt that fails (or is budget-killed) after the provider
+ * has already billed must still land in `agent_actions`, or the cost
+ * dials under-report by the size of every failed turn. Two layers need
+ * the same write:
+ *
+ *  - `DispatcherErrorRouter.handleError` — the throw path, where a
+ *    `BackendRouterHandledError` is unwrapped into its per-backend
+ *    failures (main + fallback can both have billed);
+ *  - `BackendRouter.executeFallbackCore` — the fallback-SUCCESS path,
+ *    where the dispatcher's error path never runs and this module is
+ *    the only place the main attempt's spend can be recorded (and the
+ *    raw-fallback-error rethrow, which bypasses the dispatcher's
+ *    unwrap because the thrown error is not a router wrap).
+ *
+ * Tagging convention: quota errors keep the spend payload's own
+ * `costSource` (`sdk` for Codex/Gemini post-hoc asserts, `sdk_partial`
+ * for Claude budget aborts); non-quota decisive failures are tagged
+ * `cost_source='post_hoc_error'` so failure-spend rows are queryable
+ * as a class.
+ */
+import type Database from "better-sqlite3";
+import type { BackendId } from "@aitne/shared";
+import { type BackendQuotaSpend } from "../agent-core.js";
+/**
+ * One recordable failure-spend: which backend billed it, the recovered
+ * payload, and the `cost_source` tag the audit row should carry.
+ */
+export interface FailureSpendInfo {
+    backendId: BackendId;
+    spend: BackendQuotaSpend;
+    costSource: string | null;
+}
+/**
+ * Recover the recordable spend from one backend failure signal.
+ * Handles the nested `BackendDecisiveFailure(kind="quota",
+ * cause=BackendQuotaError)` wrap the router produces. Returns `null`
+ * when the failure carries no spend (nothing billed, or the
+ * SDK/CLI surfaced no usage before dying).
+ */
+export declare function extractFailureSpendInfo(failure: unknown): FailureSpendInfo | null;
+/**
+ * Write a `result='failed'` agent_actions row carrying the actual spend
+ * for a turn the backend completed (or partially ran) before failing.
+ * One row per distinct billed backend attempt — a fallback-success run
+ * gets a `failed` row for the main attempt next to the ResultProcessor's
+ * `success` row for the fallback.
+ *
+ * Best-effort: a logging failure must not mask the original control
+ * flow — we catch and warn instead of rethrowing.
+ */
+export declare function recordFailureSpendRow(db: Database.Database, event: {
+    correlationId: string;
+    type: string;
+}, spendInfo: FailureSpendInfo, errorMessage: string): void;

package/dist/core/backends/failure-spend.js ADDED

@@ -0,0 +1,137 @@
+/**
+ * PREPASS_COST_REDUCTION_PLAN.md N1 — shared post-hoc failure-spend
+ * recording.
+ *
+ * A backend attempt that fails (or is budget-killed) after the provider
+ * has already billed must still land in `agent_actions`, or the cost
+ * dials under-report by the size of every failed turn. Two layers need
+ * the same write:
+ *
+ *  - `DispatcherErrorRouter.handleError` — the throw path, where a
+ *    `BackendRouterHandledError` is unwrapped into its per-backend
+ *    failures (main + fallback can both have billed);
+ *  - `BackendRouter.executeFallbackCore` — the fallback-SUCCESS path,
+ *    where the dispatcher's error path never runs and this module is
+ *    the only place the main attempt's spend can be recorded (and the
+ *    raw-fallback-error rethrow, which bypasses the dispatcher's
+ *    unwrap because the thrown error is not a router wrap).
+ *
+ * Tagging convention: quota errors keep the spend payload's own
+ * `costSource` (`sdk` for Codex/Gemini post-hoc asserts, `sdk_partial`
+ * for Claude budget aborts); non-quota decisive failures are tagged
+ * `cost_source='post_hoc_error'` so failure-spend rows are queryable
+ * as a class.
+ */
+import { BackendDecisiveFailure, BackendQuotaError, } from "../agent-core.js";
+import { createLogger } from "../../logging.js";
+const logger = createLogger("failure-spend");
+/**
+ * Recover the recordable spend from one backend failure signal.
+ * Handles the nested `BackendDecisiveFailure(kind="quota",
+ * cause=BackendQuotaError)` wrap the router produces. Returns `null`
+ * when the failure carries no spend (nothing billed, or the
+ * SDK/CLI surfaced no usage before dying).
+ */
+export function extractFailureSpendInfo(failure) {
+    const quota = failure instanceof BackendQuotaError
+        ? failure
+        : failure instanceof BackendDecisiveFailure
+            && failure.kind === "quota"
+            && failure.cause instanceof BackendQuotaError
+            ? failure.cause
+            : null;
+    if (quota?.spend) {
+        return {
+            backendId: quota.backendId,
+            spend: quota.spend,
+            costSource: quota.spend.costSource ?? null,
+        };
+    }
+    if (failure instanceof BackendDecisiveFailure && failure.spend) {
+        return {
+            backendId: failure.backendId,
+            spend: failure.spend,
+            costSource: "post_hoc_error",
+        };
+    }
+    return null;
+}
+/**
+ * Per-DB memo of whether `agent_actions` carries the migration-added
+ * cache-token columns. Pre-migration databases (the `AuditLogger`
+ * guards the same way) must not make the whole best-effort INSERT
+ * fail just because the optional columns are absent.
+ */
+const cacheColumnSupport = new WeakMap();
+function hasCacheTokenColumns(db) {
+    const cached = cacheColumnSupport.get(db);
+    if (cached !== undefined)
+        return cached;
+    let supported = false;
+    try {
+        const columns = db
+            .prepare("PRAGMA table_info(agent_actions)")
+            .all();
+        const names = new Set(columns.map((c) => c.name));
+        supported = names.has("cache_creation_tokens") && names.has("cache_read_tokens");
+    }
+    catch {
+        supported = false;
+    }
+    cacheColumnSupport.set(db, supported);
+    return supported;
+}
+/**
+ * Write a `result='failed'` agent_actions row carrying the actual spend
+ * for a turn the backend completed (or partially ran) before failing.
+ * One row per distinct billed backend attempt — a fallback-success run
+ * gets a `failed` row for the main attempt next to the ResultProcessor's
+ * `success` row for the fallback.
+ *
+ * Best-effort: a logging failure must not mask the original control
+ * flow — we catch and warn instead of rethrowing.
+ */
+export function recordFailureSpendRow(db, event, spendInfo, errorMessage) {
+    const { spend } = spendInfo;
+    try {
+        const columns = [
+            "event_id",
+            "action_type",
+            "model_used",
+            "cost_usd",
+            "tokens_input",
+            "tokens_output",
+            "duration_ms",
+            "num_turns",
+            "result",
+            "backend",
+            "cost_source",
+            "error",
+            "completed_at",
+        ];
+        const values = [
+            event.correlationId,
+            event.type,
+            spend.modelId,
+            spend.costUsd,
+            spend.usage.inputTokens,
+            spend.usage.outputTokens,
+            spend.durationMs,
+            spend.numTurns,
+            "failed",
+            spendInfo.backendId,
+            spendInfo.costSource,
+            errorMessage.slice(0, 4096),
+            new Date().toISOString(),
+        ];
+        if (hasCacheTokenColumns(db)) {
+            columns.splice(6, 0, "cache_creation_tokens", "cache_read_tokens");
+            values.splice(6, 0, spend.usage.cacheCreationInputTokens, spend.usage.cacheReadInputTokens);
+        }
+        const placeholders = columns.map(() => "?").join(", ");
+        db.prepare(`INSERT INTO agent_actions (${columns.join(", ")}) VALUES (${placeholders})`).run(...values);
+    }
+    catch (err) {
+        logger.warn({ err, eventType: event.type, backendId: spendInfo.backendId }, "Failed to record post-hoc failure spend in agent_actions");
+    }
+}

package/dist/core/backends/gemini-cli-core.d.ts CHANGED

@@ -300,6 +300,12 @@ export declare class GeminiCliCore implements IAgentCore {
      */
     private incrementRequestsCount;
     private classifyFailure;
+    /**
+     * PREPASS_COST_REDUCTION_PLAN.md N1 — spend recovered from the failed
+     * run's JSONL stats so terminal errors carry what the provider already
+     * billed. Null when the stream never reported usage.
+     */
+    private recoverFailureSpend;
     private assertWithinMaxBudget;
     private assertPromptWithinMaxBudget;
     /**

package/dist/core/backends/gemini-cli-core.js CHANGED

@@ -19,7 +19,7 @@ import { ALWAYS_DISALLOWED_TOOLS } from "../../safety/always-disallowed.js";
 import { CliPathCache, parseJsonLine, runLineCommand, } from "./cli-utils.js";
 import { isPathInsideOrEqual, jsonStringPathForms, shellPathForms, } from "../path-compat.js";
 import { probeApiKeyServerSide } from "./api-key-probe.js";
-import { assertCostWithinMaxBudget, assertPromptCostWithinMaxBudget, classifyCliFailure, } from "./cli-quota-guards.js";
+import { assertCostWithinMaxBudget, assertPromptCostWithinMaxBudget, classifyCliFailure, recoverCliFailureSpend, } from "./cli-quota-guards.js";
 import { buildAgentDayBoundaryHint } from "./quota-reset-hints.js";
 import { auditStreamObservation, extractGeminiToolUseTarget, } from "../../safety/subprocess-block-scanner.js";
 import { extractSilentApiErrors, logSilentApiErrors, } from "./silent-api-error-detector.js";
@@ -783,7 +783,7 @@ export class GeminiCliCore {
             // the wall-clock case, but the audit trail and operator alert
             // call out the idle hang specifically.
             if (maxTurnsExceeded) {
-                const err = new BackendDecisiveFailure(this.backendId, "max_turns", new Error(`Gemini execution exceeded max-turns cap of ${maxTurns} (observed ${toolCallCount} tool calls).`));
+                const err = new BackendDecisiveFailure(this.backendId, "max_turns", new Error(`Gemini execution exceeded max-turns cap of ${maxTurns} (observed ${toolCallCount} tool calls).`), this.recoverFailureSpend(stats, params.modelId, toolCallCount, startMs));
                 logger.error({
                     err,
                     eventType: params.eventType,
@@ -795,12 +795,12 @@ export class GeminiCliCore {
                 throw err;
             }
             if (idleTimedOut) {
-                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Gemini reactive stream went idle for ${REACTIVE_IDLE_TIMEOUT_MS}ms (no events from CLI subprocess)`));
+                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Gemini reactive stream went idle for ${REACTIVE_IDLE_TIMEOUT_MS}ms (no events from CLI subprocess)`), this.recoverFailureSpend(stats, params.modelId, toolCallCount, startMs));
                 logger.error({ err, eventType: params.eventType, model: params.modelId, durationMs: Date.now() - startMs }, "Gemini execute idle-timed-out");
                 throw err;
             }
             if (runResult.timedOut) {
-                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Gemini execution exceeded timeout of ${this.config.executeTimeoutMinutes} minutes`));
+                const err = new BackendDecisiveFailure(this.backendId, "timeout", new Error(`Gemini execution exceeded timeout of ${this.config.executeTimeoutMinutes} minutes`), this.recoverFailureSpend(stats, params.modelId, toolCallCount, startMs));
                 logger.error({ err, eventType: params.eventType, model: params.modelId, durationMs: Date.now() - startMs }, "Gemini execute timed out");
                 throw err;
             }
@@ -813,7 +813,7 @@ export class GeminiCliCore {
                     ?? firstFailureLine(runResult.stdoutLines)
                     ?? firstFailureLine(runResult.stderrLines)
                     ?? "Gemini execution did not complete successfully.";
-                const classified = this.classifyFailure(failureText);
+                const classified = this.classifyFailure(failureText, this.recoverFailureSpend(stats, params.modelId, toolCallCount, startMs));
                 logger.error({ err: classified, eventType: params.eventType, model: params.modelId, exitCode: runResult.exitCode, durationMs: Date.now() - startMs }, "Gemini execute failed");
                 throw classified;
             }
@@ -1703,7 +1703,7 @@ ${fetchClause}`;
     // Codex core; the logic lives in `cli-quota-guards.ts` (single source of
     // truth) and each backend passes its own regexes / label. Gemini adds a
     // pre-auth policy-deny branch via `classifyGeminiPolicyDeny`.
-    classifyFailure(message) {
+    classifyFailure(message, spend) {
         return classifyCliFailure({
             backendId: this.backendId,
             message,
@@ -1711,6 +1711,25 @@ ${fetchClause}`;
             rateLimitPattern: /rate limit|quota|429/i,
             authPattern: /authentication page|oauth|api key|login|required/i,
             extraClassifier: classifyGeminiPolicyDeny,
+            ...(spend !== undefined ? { spend } : {}),
+        });
+    }
+    /**
+     * PREPASS_COST_REDUCTION_PLAN.md N1 — spend recovered from the failed
+     * run's JSONL stats so terminal errors carry what the provider already
+     * billed. Null when the stream never reported usage.
+     */
+    recoverFailureSpend(stats, modelId, toolCallCount, startMs) {
+        return recoverCliFailureSpend({
+            backendId: this.backendId,
+            priceFetcher: this.priceFetcher,
+            usage: normalizeGeminiUsage(stats),
+            modelId,
+            // Matches the success branch / budget-assert formula
+            // (`toolCallCount + 1`) so a failed and a successful run with the
+            // same tool fan-out report the same turn count.
+            numTurns: toolCallCount + 1,
+            durationMs: Date.now() - startMs,
         });
     }
     assertWithinMaxBudget(costUsd, maxBudgetUsd, modelId, spend) {

package/dist/core/backends/model-registry.d.ts CHANGED Viewed

@@ -6,7 +6,7 @@ import type { BackendId, BackendModel, BackendModelTier, BackendUsage } from "@a
  *
  * Tier semantics (see `BackendModelTier` in shared/backend.ts):
  *   - `LITE`   — delegated proxy + observer-fired short-shape tasks.
- *   - `MEDIUM` — main agent surfaces (DM, routines, hourly check, reviews).
+ *   - `MEDIUM` — main agent surfaces (DM, routines, activity scan, reviews).
  *   - `HIGH`   — heavy reasoning (advisor, knowledge import, generative one-shots).
  *
  * Sources of truth for the alias → API ID mapping:

package/dist/core/backends/model-registry.js CHANGED Viewed

@@ -5,7 +5,7 @@
  *
  * Tier semantics (see `BackendModelTier` in shared/backend.ts):
  *   - `LITE`   — delegated proxy + observer-fired short-shape tasks.
- *   - `MEDIUM` — main agent surfaces (DM, routines, hourly check, reviews).
+ *   - `MEDIUM` — main agent surfaces (DM, routines, activity scan, reviews).
  *   - `HIGH`   — heavy reasoning (advisor, knowledge import, generative one-shots).
  *
  * Sources of truth for the alias → API ID mapping:
@@ -18,7 +18,7 @@ export const DEFAULT_CLAUDE_LITE_MODEL = "claude-haiku-4-5-20251001";
 export const DEFAULT_CLAUDE_MEDIUM_MODEL = "claude-sonnet-4-6";
 export const DEFAULT_CLAUDE_HIGH_MODEL = "claude-opus-4-8";
 // Codex (gpt-5.4-mini is the lite-tier pick; gpt-5.4 is the medium-tier
-// default — morning_routine / hourly_check / evening_review run on this.
+// default — morning_routine / activity_scan / evening_review run on this.
 // gpt-5.5 and gpt-5.5-chat-latest are the flagship reasoning models and
 // stay registered at high tier as selectable opt-ins, but the seeded
 // default for Codex's high tier is also gpt-5.4: gpt-5.5 carries Opus-
@@ -34,7 +34,7 @@ export const DEFAULT_CODEX_HIGH_MODEL = "gpt-5.4";
 // medium-tier flash equivalent left. `gemini-3.1-pro-preview` is priced in
 // the Sonnet band — $0.002/$0.012 per 1k in/out under 200k context, ~2/3
 // the cost of Sonnet 4.6 — so it serves as the "main agent work" pick for
-// every medium-tier surface (morning_routine, message.dm, hourly_check,
+// every medium-tier surface (morning_routine, message.dm, activity_scan,
 // evening / weekly / monthly review). High tier collapses onto the same
 // model via `SEED_HIGH_TIER_OVERRIDE` below: there's no Opus-priced Google
 // flagship worth defaulting to, and operators who genuinely want
@@ -274,7 +274,7 @@ const MODEL_REGISTRY = [
         displayName: "GPT-5.4",
         // Promoted from `high` to `medium` after gpt-5.5 shipped: gpt-5.4 is
         // priced ~half of gpt-5.5 for the same context shapes, and the
-        // medium-tier routines (morning_routine / hourly_check /
+        // medium-tier routines (morning_routine / activity_scan /
         // evening_review / message.dm) do not benefit from gpt-5.5's
         // deeper reasoning enough to justify the cost. gpt-5.4 is ALSO the
         // seeded default for codex's high tier via `SEED_HIGH_TIER_OVERRIDE`

package/dist/core/backends/opencode-core.d.ts CHANGED Viewed

@@ -289,7 +289,7 @@ export declare function auditOpencodeTools(tools: ReturnType<typeof extractToolU
     sessionId: number | null;
 }): void;
 /**
- * docs/design/appendices/opencode-backend.md Phase 4 — Stage 2 hourly-check triage
+ * docs/design/appendices/opencode-backend.md Phase 4 — Stage 2 activity-scan triage
  * schema. Mirrors the `parseStage2Verdict` text contract
  * (`dispatcher-types.ts`): the agent must return exactly
  * `{ "action": "log_only" | "escalate", "reason": string }`. Opencode

package/dist/core/backends/opencode-core.js CHANGED Viewed

@@ -609,7 +609,7 @@ export class OpencodeCore {
             const renderedPrompt = isResume
                 ? params.prompt
                 : buildExecutionPrompt(params.prompt, params.context, params.event, params.conversationHistory);
-            // docs/design/appendices/opencode-backend.md §4 / Phase 4 — `routine.hourly_check.triage`
+            // docs/design/appendices/opencode-backend.md §4 / Phase 4 — `routine.activity_scan.triage`
             // returns a strict JSON envelope (`{ "action": "log_only" |
             // "escalate", … }`) parsed by `parseStage2Verdict`. opencode's
             // `format: { type: "json_schema", … }` honours the schema with
@@ -767,7 +767,7 @@ export class OpencodeCore {
                 const durationMs = Date.now() - startMs;
                 const stopReason = assistantMessage?.finish ?? null;
                 // Best-effort cleanup of the on-disk opencode session row when we
-                // own the workdir — keeps disk usage bounded under hourly_check.
+                // own the workdir — keeps disk usage bounded under activity_scan.
                 // On resume we must never delete: the dispatcher's next turn
                 // needs the same session id to resolve to a live server-side
                 // history. (`ownsSessionDir` is already false when sessionDir is
@@ -1466,7 +1466,7 @@ function classifyStreamError(payload, backendId) {
     return new BackendDecisiveFailure(backendId, "other_non_retryable", new Error(message));
 }
 /**
- * docs/design/appendices/opencode-backend.md Phase 4 — Stage 2 hourly-check triage
+ * docs/design/appendices/opencode-backend.md Phase 4 — Stage 2 activity-scan triage
  * schema. Mirrors the `parseStage2Verdict` text contract
  * (`dispatcher-types.ts`): the agent must return exactly
  * `{ "action": "log_only" | "escalate", "reason": string }`. Opencode
@@ -1493,11 +1493,11 @@ export const STAGE2_TRIAGE_JSON_SCHEMA = {
 /**
  * Returns the opencode `format` envelope to apply when a given process
  * key has a strict structured-output contract; null otherwise. v1
- * covers `routine.hourly_check.triage`; future strict-JSON process
+ * covers `routine.activity_scan.triage`; future strict-JSON process
  * keys (e.g. delegated classifiers) extend this map.
  */
 function formatForProcessKey(processKey) {
-    if (processKey === "routine.hourly_check.triage") {
+    if (processKey === "routine.activity_scan.triage") {
         return {
             type: "json_schema",
             schema: STAGE2_TRIAGE_JSON_SCHEMA,

package/dist/core/backends/plan-presets.js CHANGED Viewed

@@ -222,27 +222,44 @@ const ENVELOPE_OVERRIDES_BY_PROCESS_KEY = {
     // cost-reduction-structural §B — Stage 2 lite-tier triage. Strict
     // JSON-only output (~2K input / ~50 output) decides log_only vs
     // escalate. 1 turn / $0.05 mirrors observation.summarize.
-    "routine.hourly_check.triage": { maxTurns: 1, maxBudgetUsd: 0.05 },
+    "routine.activity_scan.triage": { maxTurns: 1, maxBudgetUsd: 0.05 },
     // docs/design/appendices/routine-data-acquisition.md §6.2 / §6.9 pre-pass fetcher.
     // The lite-tier nominal ($0.20) under-provisioned the morning fan-out
     // (2 mail providers × N accounts + calendar + notion) and tripped
     // BackendQuotaError(max_budget_usd) mid-fetch — widened to $0.50 so
     // the cap still binds well before runaway but accommodates the real
-    // worst-case fan-out. 20-turn turn count is unchanged. Keep in
-    // lock-step with the corresponding schema-seed row.
-    "routine.fetch_window": { maxTurns: 20, maxBudgetUsd: 0.5 },
+    // worst-case fan-out. Keep in lock-step with the corresponding
+    // schema-seed row.
+    //
+    // maxTurns 20 → 10 (PREPASS_COST_REDUCTION_PLAN.md N4, 2026-06-10):
+    // measured over 502 fetch_window runs on a live install, num_turns
+    // P50=3 / P95=6 / P99=8 / max=11 (avg 3.08). The per-integration
+    // fan-out means each session handles ONE partial, so the original
+    // "~6 partials × 3 tool calls" sizing no longer applies. 10 bounds
+    // budget-cap wander (a stuck session now stops at half the previous
+    // exploration depth) while clearing P99 with 2 turns of headroom.
+    "routine.fetch_window": { maxTurns: 10, maxBudgetUsd: 0.5 },
     // BROWSER_HISTORY_INTEGRATION_PLAN P3 — keep these in lock-step with
-    // the schema seed rows. cluster_update is a tiny dispatcher (1 PUT
-    // + a list call), so the absolute floor of 5/$0.05 is the right
-    // envelope. research_offer_dm is even tighter — a single DM
-    // composition (GET /research-clusters/<slug> + POST /api/notify),
-    // 5/$0.02 leaves no room for runaway. research_dispatch carries the
-    // WebFetch fan-out; mirrors evening_review (50/$1.00).
-    // research_wiki_summary is tighter (30/$0.50) — it reads the cluster
-    // journal the agent already wrote and composes from it, with
-    // bounded external work.
-    "routine.research_cluster_update": { maxTurns: 5, maxBudgetUsd: 0.05 },
-    "routine.research_offer_dm": { maxTurns: 5, maxBudgetUsd: 0.02 },
+    // the schema seed rows (research_offer_dm has NO seed row — this
+    // entry is its only default, materialized on main-backend switch or
+    // Reset).
+    //
+    // cluster_update / offer_dm budgets are STOP-LOSSES sized to cover
+    // one cold-prompt-cache run, not per-run cost targets
+    // (RESEARCH_CLUSTER_COST_FIX_PLAN.md RC2/F3): the SDK budget check
+    // only fires between turns, and a cold run writes the full session
+    // prefix to prompt cache (~$0.13-0.30 observed on Haiku) before the
+    // check can abort — the original floor values ($0.05/$0.02) killed
+    // every cold run AFTER the money was spent and the journal was never
+    // written. With the F1 per-agent-day enqueue stamp, cluster_update
+    // runs at most once per cluster per day, so $0.50 bounds daily spend
+    // per cluster. Bumped for upgrading installs by migration 0012.
+    // research_dispatch carries the WebFetch fan-out; mirrors
+    // evening_review (50/$1.00). research_wiki_summary is tighter
+    // (30/$0.50) — it reads the cluster journal the agent already wrote
+    // and composes from it, with bounded external work.
+    "routine.research_cluster_update": { maxTurns: 5, maxBudgetUsd: 0.5 },
+    "routine.research_offer_dm": { maxTurns: 5, maxBudgetUsd: 0.15 },
     "routine.research_dispatch": { maxTurns: 50, maxBudgetUsd: 1.0 },
     "routine.research_wiki_summary": { maxTurns: 30, maxBudgetUsd: 0.5 },
     // BROWSER_TASK_REDESIGN_PLAN.md §5 — open-ended browser sub-agent.
@@ -254,6 +271,13 @@ const ENVELOPE_OVERRIDES_BY_PROCESS_KEY = {
     // cost without tripping BackendQuotaError. Lock-step with the
     // schema-seed row.
     "browser_task": { maxTurns: 30, maxBudgetUsd: 1.0 },
+    // BACKGROUND_TASK_RUNNER_DESIGN.md §6 — generic detached worker. The
+    // medium-tier nominal (50 turns / $1.00) is too tight for long-running
+    // research / multi-repo audits, so the seed trades turns for budget:
+    // 40 turns / $2.00 (the
+    // with the schema-seed row so a force=true backend-switch reset
+    // preserves this envelope instead of clobbering it to the tier default.
+    "background_task": { maxTurns: 40, maxBudgetUsd: 2.0 },
 };
 /**
  * Resolve the seed `(model, envelope)` for a configurable process key on

package/dist/core/bang-commands/commands-cost.js CHANGED Viewed

@@ -88,7 +88,9 @@ function makeCostBackendCommand(backend) {
     return {
         name: `!cost ${backend}`,
         title: `Cost for ${backend}`,
-        describe: `Agent spend on ${backend} over the past 7 days.`,
+        // Short on purpose — one of these renders per registered backend in
+        // `!help`, and the whole list must fit MOBILE_REPLY_BUDGET.
+        describe: `Agent spend on ${backend} (7 days).`,
         details: [
             `Reports trailing 7-day spend for ${backend}.`,
             "Does not invoke an LLM.",

package/dist/core/bang-commands/commands-report.js CHANGED Viewed

@@ -18,7 +18,7 @@ const REPORT_SQL = `
       MIN(started_at) AS first_seen,
       MAX(started_at) AS last_seen
     FROM agent_actions
-    WHERE result = 'failed'
+    WHERE result IN ('failed', 'partial')
       AND started_at >= datetime('now', '-7 days')
       AND error IS NOT NULL
     GROUP BY backend, action_type
@@ -27,7 +27,7 @@ const REPORT_SQL = `
     ON latest.action_type = g.action_type
    AND COALESCE(latest.backend, 'claude') = COALESCE(g.backend, 'claude')
    AND latest.started_at = g.last_seen
-   AND latest.result = 'failed'
+   AND latest.result IN ('failed', 'partial')
    AND latest.error IS NOT NULL
   GROUP BY g.backend, g.action_type
   ORDER BY g.n DESC, g.last_seen DESC
@@ -42,7 +42,7 @@ function queryReport(db) {
          COUNT(DISTINCT COALESCE(backend, 'claude') || '|' || action_type) AS groups,
          COUNT(*) AS total
        FROM agent_actions
-       WHERE result = 'failed'
+       WHERE result IN ('failed', 'partial')
          AND started_at >= datetime('now', '-7 days')
          AND error IS NOT NULL`)
         .get();
@@ -94,6 +94,7 @@ export const reportCommand = {
     describe: "Agent errors over the past 7 days.",
     details: [
         "Summarizes recent failed agent actions by action type and backend.",
+        "Includes partial runs that failed a post-run outcome check.",
         "Samples are redacted before sending to messaging surfaces.",
         "Does not invoke an LLM.",
     ],

package/dist/core/bang-commands/commands-research.js CHANGED Viewed

@@ -242,7 +242,10 @@ async function handleRename(ctx, slug, newName) {
 export const researchCommand = {
     prefix: "!research",
     title: "Research clusters",
-    describe: "manage browser-history research clusters (list / show / accept / wiki / decline / mute / unmute / rename / conclude)",
+    // Keep this one-liner short: `!help` renders every registered describe
+    // inside the 1500-char MOBILE_REPLY_BUDGET, and the subcommand catalogue
+    // already lives in `details` below (and in the `!research` reply itself).
+    describe: "manage browser-history research clusters",
     details: [
         "Subcommands:",
         "- `!research` — list active clusters",

package/dist/core/bang-commands/commands-revert-tuning.d.ts ADDED Viewed

@@ -0,0 +1,18 @@
+/**
+ * `!revert tuning` — undo the most recent applied self-tuning config change
+ * (SELF_TUNING_REVIEW_CYCLE_DESIGN.md §3.4, Phase 3).
+ *
+ * The owner-side escape hatch for the Autonomous-plus-DM actuation posture
+ * (D1): every applied change DMs "Reply `!revert tuning` to undo", and this
+ * command is that reply. It restores the ledger's `prev` value through the
+ * same `applyConfigUpdates` chokepoint the actuator used, stamps
+ * `reverted_at` (which puts the key into the 28-day re-proposal cool-down),
+ * audits `self_tuning.reverted`, and records an explicit-correction
+ * feedback signal so the lesson loop learns from the owner's override.
+ *
+ * `runsWhilePaused: true` — a pure DB/config write with no LLM dispatch,
+ * and the owner may well have paused the agent *because* of a bad tuning
+ * change; the undo must not be locked behind `!start`.
+ */
+import { type BangPrefixCommand } from "./registry.js";
+export declare const revertTuningCommand: BangPrefixCommand;