npm - clementine-agent - Versions diffs - 1.18.19 → 1.18.20 - Mend

clementine-agent 1.18.19 → 1.18.20

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6)

package/dist/agent/assistant.d.ts CHANGED Viewed

@@ -31,6 +31,8 @@ export declare function looksLikeContextThrashText(value: unknown): boolean;
 export declare function contextThrashRecoveryNotice(): string;
 export declare function buildContextThrashRecoveryPrompt(userRequest: string, priorFailureText?: string): string;
 export declare function looksLikeOneMillionContextError(value: unknown): boolean;
+export declare function oneMillionContextRecoveryMessage(): string;
+export declare function looksLikeProviderApiErrorResponse(value: unknown): boolean;
 export declare function looksLikeNoResponseRequested(value: unknown): boolean;
 /** Autonomous jobs use this sentinel to mean "completed, but do not notify the owner." */
 export declare function isAutonomousNothingOutput(response: string): boolean;

package/dist/agent/assistant.js CHANGED Viewed

@@ -343,6 +343,15 @@ function resultInputTokens(result) {
 export function looksLikeOneMillionContextError(value) {
     return looksLikeClaudeOneMillionContextError(value);
 }
+export function oneMillionContextRecoveryMessage() {
+    return "Claude rejected 1M context for this account. I've switched Clementine to persistent 200K recovery mode and reset the session. Restart Clementine once so every background worker starts with the same safe setting.";
+}
+export function looksLikeProviderApiErrorResponse(value) {
+    const text = String(value ?? '').trim();
+    return /^api error:/i.test(text)
+        || /^error:\s*api error:/i.test(text)
+        || looksLikeOneMillionContextError(text);
+}
 export function looksLikeNoResponseRequested(value) {
     const text = String(value ?? '').trim();
     return /^no response requested\.?$/i.test(text);
@@ -2992,7 +3001,7 @@ You have a cost budget per message — not a hard turn limit. Work until the tas
         // Track exchange count, timestamp, and last exchange.
         // Never store API error responses — they poison session history and create
         // a self-reinforcing loop where every subsequent request replays the errors.
-        const isApiError = responseText.startsWith('Error:') && responseText.includes('API Error:');
+        const isApiError = looksLikeProviderApiErrorResponse(responseText);
         if (key && !isApiError) {
             this.exchangeCounts.set(key, (this.exchangeCounts.get(key) ?? 0) + 1);
             this.sessionTimestamps.set(key, new Date());
@@ -3432,7 +3441,7 @@ You have a cost budget per message — not a hard turn limit. Work until the tas
                                             this.exchangeCounts.set(sessionKey, 0);
                                             this._compactedSessions.delete(sessionKey);
                                         }
-                                        responseText = responseText || ("Claude rejected 1M context for this account. I've switched Clementine to persistent 200K recovery mode and reset the session. Restart Clementine once so every background worker starts with the same safe setting.");
+                                        responseText = responseText || (oneMillionContextRecoveryMessage());
                                     }
                                     else if (lower.includes('rate') && lower.includes('limit')) {
                                         hitRateLimit = true;
@@ -3485,7 +3494,19 @@ You have a cost budget per message — not a hard turn limit. Work until the tas
                             else if ('result' in result && result.result) {
                                 // Success: use SDK result text if streaming didn't capture a substantive response
                                 const sdkResult = result.result;
-                                if (looksLikeContextThrashText(sdkResult)) {
+                                if (looksLikeOneMillionContextError(sdkResult)) {
+                                    logger.warn({ sessionKey }, '1M context error surfaced as SDK result text — forcing recovery');
+                                    applyOneMillionContextRecovery();
+                                    if (sessionKey) {
+                                        this.sessions.delete(sessionKey);
+                                        this.exchangeCounts.set(sessionKey, 0);
+                                        this._compactedSessions.delete(sessionKey);
+                                    }
+                                    responseText = oneMillionContextRecoveryMessage();
+                                    if (onText)
+                                        await onText(responseText);
+                                }
+                                else if (looksLikeContextThrashText(sdkResult)) {
                                     logger.warn({ sessionKey }, 'Autocompact thrashing surfaced as SDK result text — rotating session');
                                     preRotationSnapshot = {
                                         toolCalls: stallGuard?.getToolCalls() ?? [],
@@ -3563,7 +3584,7 @@ You have a cost budget per message — not a hard turn limit. Work until the tas
                             this.exchangeCounts.set(sessionKey, 0);
                             this._compactedSessions.delete(sessionKey);
                         }
-                        responseText = responseText || ("Claude rejected 1M context for this account. I've switched Clementine to persistent 200K recovery mode and reset the session. Restart Clementine once so every background worker starts with the same safe setting.");
+                        responseText = responseText || (oneMillionContextRecoveryMessage());
                     }
                     else if (errStr.includes('rate') && (errStr.includes('limit') || errStr.includes('rate_limit'))) {
                         hitRateLimit = true;

package/dist/cli/dashboard.js CHANGED Viewed

@@ -39,6 +39,7 @@ const HEARTBEAT_WORK_QUEUE_FILE = path.join(BASE_DIR, 'heartbeat', 'work-queue.j
 const MEMORY_DB_PATH = path.join(VAULT_DIR, '.memory.db');
 const PROJECTS_META_FILE = path.join(BASE_DIR, 'projects.json');
 const DASHBOARD_PID_FILE = path.join(BASE_DIR, '.dashboard.pid');
+const INTERACTIVE_FAILURE_LOG = path.join(BASE_DIR, 'self-improve', 'interactive-failures.jsonl');
 /**
  * Kill all existing dashboard processes before starting a new one.
  * Uses both the PID file and a process sweep to catch orphans.
@@ -5679,6 +5680,43 @@ If the tool returns nothing or errors, return an empty array \`[]\`.`,
         process.env[key] = normalized;
         return { ok: true, value: normalized };
     }
+    function readRecentDashboardChatFailures(limit = 5) {
+        try {
+            if (!existsSync(INTERACTIVE_FAILURE_LOG))
+                return [];
+            const lines = readFileSync(INTERACTIVE_FAILURE_LOG, 'utf-8')
+                .trim()
+                .split('\n')
+                .filter(Boolean)
+                .slice(-80)
+                .reverse();
+            const out = [];
+            for (const line of lines) {
+                try {
+                    const item = JSON.parse(line);
+                    const error = String(item.error ?? '');
+                    const stage = String(item.stage ?? '');
+                    const haystack = `${stage} ${error}`;
+                    if (!/1m|context|budget|credit|api error|rate.?limit/i.test(haystack))
+                        continue;
+                    out.push({
+                        createdAt: String(item.createdAt ?? ''),
+                        stage,
+                        sessionKey: String(item.sessionKey ?? ''),
+                        textPreview: String(item.textPreview ?? '').slice(0, 220),
+                        error: error.slice(0, 500),
+                    });
+                    if (out.length >= limit)
+                        break;
+                }
+                catch { /* skip malformed lines */ }
+            }
+            return out;
+        }
+        catch {
+            return [];
+        }
+    }
     const ASSISTANT_PREF_OPTIONS = {
         proactivity: ['quiet', 'balanced', 'proactive', 'operator'],
         responseStyle: ['concise', 'balanced', 'detailed'],
@@ -5797,6 +5835,7 @@ If the tool returns nothing or errors, return an empty array \`[]\`.`,
                     legacyMode,
                 },
                 findings,
+                recentFailures: readRecentDashboardChatFailures(),
                 counts: doctor.counts,
             });
         }
@@ -20083,6 +20122,7 @@ async function refreshBudgetHealth() {
     var modeClass = mode === 'off' ? 'badge-green' : mode === 'on' ? 'badge-yellow' : 'badge-blue';
     var rows = d.budgets || [];
     var findings = d.findings || [];
+    var recentFailures = d.recentFailures || [];
     var html = '<div class="card">'
       + '<div class="card-header" style="display:flex;align-items:center;justify-content:space-between;gap:12px">'
       + '<div style="display:flex;align-items:center;gap:8px"><span>Spend Guards &amp; Context Health</span><span class="badge ' + modeClass + '" style="font-size:10px">1M ' + esc(mode) + '</span></div>'
@@ -20131,6 +20171,22 @@ async function refreshBudgetHealth() {
       + '<div style="font-size:12px;color:var(--text-secondary);margin-top:4px">Safe Recovery lowers autonomous spend and disables 1M context for accounts seeing credit or entitlement errors.</div>'
       + '<div style="font-size:11px;color:var(--text-muted);margin-top:6px">Restart the daemon after changing budgets or context mode.</div>'
       + '</div></div>';
+    if (recentFailures.length) {
+      html += '<div style="border-top:1px solid var(--border);padding-top:10px;margin-bottom:10px">'
+        + '<div style="font-weight:600;font-size:13px;margin-bottom:6px">Recent chat failures</div>';
+      for (var rf = 0; rf < recentFailures.length; rf++) {
+        var fail = recentFailures[rf] || {};
+        html += '<div style="padding:8px 0;border-bottom:1px solid rgba(127,127,127,0.12)">'
+          + '<div style="display:flex;gap:8px;align-items:center;flex-wrap:wrap">'
+          + '<span class="badge badge-yellow" style="font-size:10px">' + esc(fail.stage || 'failure') + '</span>'
+          + '<span style="font-size:11px;color:var(--text-muted)">' + esc(fail.createdAt || '') + '</span>'
+          + '</div>'
+          + '<div style="font-size:12px;color:var(--text-secondary);margin-top:4px">' + esc(fail.error || '') + '</div>'
+          + (fail.textPreview ? '<div style="font-size:11px;color:var(--text-muted);margin-top:3px">Prompt: ' + esc(fail.textPreview) + '</div>' : '')
+          + '</div>';
+      }
+      html += '</div>';
+    }
     if (findings.length) {
       html += '<div style="border-top:1px solid var(--border);padding-top:10px">'
         + '<div style="font-weight:600;font-size:13px;margin-bottom:6px">Potential causes</div>';

package/dist/gateway/router.d.ts CHANGED Viewed

@@ -11,7 +11,7 @@ import { TeamRouter } from '../agent/team-router.js';
 import { TeamBus } from '../agent/team-bus.js';
 import type { NotificationDispatcher } from './notifications.js';
 import { type ProactiveNotificationInput } from './notification-context.js';
-export type ChatErrorKind = 'rate_limit' | 'context_overflow' | 'auth' | 'billing' | 'transient' | 'unknown';
+export type ChatErrorKind = 'rate_limit' | 'one_million_context' | 'context_overflow' | 'auth' | 'billing' | 'transient' | 'unknown';
 export declare function classifyChatError(err: unknown): ChatErrorKind;
 /** Detect auth-like errors in response text that the SDK returned as "successful" results. */
 export declare function looksLikeAuthError(text: string): boolean;

package/dist/gateway/router.js CHANGED Viewed

@@ -7,10 +7,10 @@
 import path from 'node:path';
 import { appendFileSync, existsSync, mkdirSync, readdirSync, readFileSync, statSync, writeFileSync } from 'node:fs';
 import pino from 'pino';
-import { buildContextThrashRecoveryPrompt, contextThrashRecoveryNotice, isAutonomousNothingOutput, looksLikeContextThrashText, PersonalAssistant, } from '../agent/assistant.js';
+import { buildContextThrashRecoveryPrompt, contextThrashRecoveryNotice, isAutonomousNothingOutput, looksLikeContextThrashText, looksLikeProviderApiErrorResponse, oneMillionContextRecoveryMessage, PersonalAssistant, } from '../agent/assistant.js';
 import { runWithTrace, logAuditJsonl } from '../agent/hooks.js';
 import { SelfImproveLoop } from '../agent/self-improve.js';
-import { MODELS, AGENTS_DIR, TEAM_COMMS_LOG, BASE_DIR, SEEN_CHANNELS_FILE, AUTO_DELEGATE_ENABLED } from '../config.js';
+import { MODELS, AGENTS_DIR, TEAM_COMMS_LOG, BASE_DIR, SEEN_CHANNELS_FILE, AUTO_DELEGATE_ENABLED, applyOneMillionContextRecovery, looksLikeClaudeOneMillionContextError, } from '../config.js';
 import { scanner } from '../security/scanner.js';
 import { lanes } from './lanes.js';
 import { AgentManager } from '../agent/agent-manager.js';
@@ -42,7 +42,9 @@ export function classifyChatError(err) {
         return 'billing';
     if (/rate.?limit|\b429\b|too many requests|quota.?exceeded/i.test(msg))
         return 'rate_limit';
-    if (looksLikeContextThrashText(msg) || /extra usage.*1m context|1m context.*extra usage|context-1m|context.?length|token.?limit|maximum.?context|prompt.?too.?long/i.test(msg))
+    if (looksLikeClaudeOneMillionContextError(msg))
+        return 'one_million_context';
+    if (looksLikeContextThrashText(msg) || /context.?length|token.?limit|maximum.?context|prompt.?too.?long/i.test(msg))
         return 'context_overflow';
     if (/\b401\b|\b403\b|auth|forbidden|invalid.?api.?key|permission|does not have access|please run \/login/i.test(msg))
         return 'auth';
@@ -1500,6 +1502,19 @@ export class Gateway {
                     }, 'chat:latency');
                     // Re-baseline integrity checksums after chat (auto-memory may write to vault)
                     scanner.refreshIntegrity();
+                    if (response && looksLikeClaudeOneMillionContextError(response)) {
+                        logger.warn({ sessionKey, responsePreview: response.slice(0, 200) }, '1M context error returned as assistant text — forcing recovery');
+                        this.recordInteractiveFailure(sessionKey, text, response, 'one_million_context_result_text', { effectiveSessionKey });
+                        applyOneMillionContextRecovery();
+                        this.clearSession(effectiveSessionKey);
+                        return oneMillionContextRecoveryMessage();
+                    }
+                    if (response && looksLikeProviderApiErrorResponse(response)) {
+                        logger.warn({ sessionKey, responsePreview: response.slice(0, 200) }, 'Provider API error returned as assistant text — clearing session');
+                        this.recordInteractiveFailure(sessionKey, text, response, 'provider_api_result_text', { effectiveSessionKey });
+                        this.clearSession(effectiveSessionKey);
+                        return "Claude returned a provider API error instead of a normal answer. I've reset this session so the error does not get replayed into future context. Please try that question again.";
+                    }
                     if (response && looksLikeContextThrashText(response)) {
                         logger.warn({ sessionKey, responsePreview: response.slice(0, 200) }, 'Context-thrash text returned from assistant — starting recovery pass');
                         return this.startContextThrashRecovery(sessionKey, text, response, {
@@ -1668,6 +1683,11 @@ export class Gateway {
                     switch (errKind) {
                         case 'rate_limit':
                             return "I'm being rate-limited by the API right now. Please wait a minute and try again.";
+                        case 'one_million_context':
+                            this.recordInteractiveFailure(sessionKey, text, err, 'one_million_context_exception', { effectiveSessionKey });
+                            applyOneMillionContextRecovery();
+                            this.clearSession(effectiveSessionKey);
+                            return oneMillionContextRecoveryMessage();
                         case 'context_overflow':
                             logger.info({ sessionKey }, 'Context overflow — rotating session');
                             this.assistant.clearSession(effectiveSessionKey);

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "clementine-agent",
-  "version": "1.18.19",
+  "version": "1.18.20",
   "description": "Clementine — Personal AI Assistant (TypeScript)",
   "type": "module",
   "main": "dist/index.js",