npm - @bastani/atomic - Versions diffs - 0.8.31-alpha.2 → 0.8.31-alpha.4 - Mend

@bastani/atomic 0.8.31-alpha.2 → 0.8.31-alpha.4

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (67)

package/CHANGELOG.md +16 -3
package/dist/builtin/cursor/CHANGELOG.md +1 -1
package/dist/builtin/cursor/package.json +2 -2
package/dist/builtin/intercom/package.json +1 -1
package/dist/builtin/mcp/CHANGELOG.md +5 -0
package/dist/builtin/mcp/direct-tools.ts +4 -2
package/dist/builtin/mcp/package.json +1 -1
package/dist/builtin/mcp/proxy-modes.ts +4 -2
package/dist/builtin/mcp/utils.ts +25 -0
package/dist/builtin/subagents/package.json +1 -1
package/dist/builtin/web-access/package.json +1 -1
package/dist/builtin/workflows/CHANGELOG.md +5 -0
package/dist/builtin/workflows/builtin/ralph.ts +1 -0
package/dist/builtin/workflows/package.json +1 -1
package/dist/builtin/workflows/src/runs/foreground/stage-runner.ts +114 -4
package/dist/core/agent-session.d.ts +25 -0
package/dist/core/agent-session.d.ts.map +1 -1
package/dist/core/agent-session.js +135 -11
package/dist/core/agent-session.js.map +1 -1
package/dist/core/auth-guidance.d.ts +12 -0
package/dist/core/auth-guidance.d.ts.map +1 -1
package/dist/core/auth-guidance.js +24 -0
package/dist/core/auth-guidance.js.map +1 -1
package/dist/core/auth-storage.d.ts +42 -0
package/dist/core/auth-storage.d.ts.map +1 -1
package/dist/core/auth-storage.js +71 -10
package/dist/core/auth-storage.js.map +1 -1
package/dist/core/context-window.d.ts +15 -0
package/dist/core/context-window.d.ts.map +1 -1
package/dist/core/context-window.js +11 -0
package/dist/core/context-window.js.map +1 -1
package/dist/core/copilot-gemini-payload-sanitizer.d.ts +72 -0
package/dist/core/copilot-gemini-payload-sanitizer.d.ts.map +1 -0
package/dist/core/copilot-gemini-payload-sanitizer.js +296 -0
package/dist/core/copilot-gemini-payload-sanitizer.js.map +1 -0
package/dist/core/copilot-gemini-reasoning.d.ts +118 -0
package/dist/core/copilot-gemini-reasoning.d.ts.map +1 -0
package/dist/core/copilot-gemini-reasoning.js +260 -0
package/dist/core/copilot-gemini-reasoning.js.map +1 -0
package/dist/core/copilot-gemini-tool-arguments.d.ts +42 -0
package/dist/core/copilot-gemini-tool-arguments.d.ts.map +1 -0
package/dist/core/copilot-gemini-tool-arguments.js +179 -0
package/dist/core/copilot-gemini-tool-arguments.js.map +1 -0
package/dist/core/copilot-model-catalog.d.ts +26 -11
package/dist/core/copilot-model-catalog.d.ts.map +1 -1
package/dist/core/copilot-model-catalog.js +34 -9
package/dist/core/copilot-model-catalog.js.map +1 -1
package/dist/core/flattened-tool-arguments.d.ts +41 -0
package/dist/core/flattened-tool-arguments.d.ts.map +1 -0
package/dist/core/flattened-tool-arguments.js +136 -0
package/dist/core/flattened-tool-arguments.js.map +1 -0
package/dist/core/http-dispatcher.d.ts.map +1 -1
package/dist/core/http-dispatcher.js +5 -0
package/dist/core/http-dispatcher.js.map +1 -1
package/dist/core/model-registry.d.ts.map +1 -1
package/dist/core/model-registry.js +6 -4
package/dist/core/model-registry.js.map +1 -1
package/dist/core/sdk.d.ts.map +1 -1
package/dist/core/sdk.js +38 -8
package/dist/core/sdk.js.map +1 -1
package/dist/index.d.ts +2 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +2 -1
package/dist/index.js.map +1 -1
package/docs/providers.md +4 -3
package/docs/workflows.md +2 -0
package/package.json +2 -2

package/dist/core/agent-session.js CHANGED Viewed

@@ -20,10 +20,10 @@ import { stripFrontmatter } from "../utils/frontmatter.js";
 import { resolvePath } from "../utils/paths.js";
 import { sleep } from "../utils/sleep.js";
 import { ATOMIC_GUIDE_COMMAND_NAME, ATOMIC_GUIDE_HELP_CHOICES, atomicGuideModeForChoice, getAtomicGuideMessage, isAtomicGuideHelpChoice, normalizeAtomicGuideMode, } from "./atomic-guide-command.js";
-import { formatNoApiKeyFoundMessage, formatNoModelSelectedMessage, formatUnresolvedModelMessage, } from "./auth-guidance.js";
+import { formatAuthStorageLoadFailedMessage, formatNoApiKeyFoundMessage, formatNoModelSelectedMessage, formatUnresolvedModelMessage, } from "./auth-guidance.js";
 import { executeBashWithOperations } from "./bash-executor.js";
 import { calculateContextTokens, collectEntriesForBranchSummary, contextCompact as runContextCompact, estimateContextTokens, generateBranchSummary, prepareContextCompaction, shouldCompact, validateContextDeletionRequest, } from "./compaction/index.js";
-import { getModelDefaultContextWindow, getSupportedContextWindows, selectContextWindow } from "./context-window.js";
+import { getEffectiveInputBudget, getModelDefaultContextWindow, getSupportedContextWindows, selectContextWindow } from "./context-window.js";
 import { formatCopilotProviderError, parseCopilotPromptLimitError } from "./copilot-errors.js";
 import { DEFAULT_THINKING_LEVEL } from "./defaults.js";
 import { exportSessionToHtml } from "./export-html/index.js";
@@ -39,6 +39,8 @@ import { evaluateBashCommandPolicy, formatBashCommandPolicyRejection, } from "./
 import { createAllToolDefinitions, defaultToolNames } from "./tools/index.js";
 import { redirectOversizedToolResult } from "./tools/oversized-tool-result.js";
 import { createToolDefinitionFromAgentTool } from "./tools/tool-definition-wrapper.js";
+import { isCopilotGeminiModel } from "./copilot-gemini-payload-sanitizer.js";
+import { normalizeToolArgumentsForModel } from "./copilot-gemini-tool-arguments.js";
 function deepFreeze(value) {
     if (value && typeof value === "object") {
         Object.freeze(value);
@@ -388,6 +390,9 @@ export class AgentSession {
             else if (event.message.role === "user" ||
                 event.message.role === "assistant" ||
                 event.message.role === "toolResult") {
+                if (event.message.role === "assistant") {
+                    this._normalizePersistedGeminiToolArgs(event.message);
+                }
                 // Regular LLM message - persist as SessionMessageEntry
                 this.sessionManager.appendMessage(event.message);
             }
@@ -396,12 +401,17 @@ export class AgentSession {
             if (event.message.role === "assistant") {
                 this._lastAssistantMessage = event.message;
                 const assistantMsg = event.message;
-                if (assistantMsg.stopReason !== "error") {
+                // Treat degenerate empty completions (no content, zero output tokens) as
+                // failures alongside stopReason === "error". Otherwise an empty turn that
+                // stops with reason "stop" would reset the retry counter on every attempt,
+                // causing unbounded retries instead of honoring maxRetries.
+                const assistantFailed = assistantMsg.stopReason === "error" || this._isEmptyCompletion(assistantMsg);
+                if (!assistantFailed) {
                     this._overflowRecoveryAttempted = false;
                 }
                 // Reset retry counter immediately on successful assistant response
                 // This prevents accumulation across multiple LLM calls within a turn
-                if (assistantMsg.stopReason !== "error" && this._retryAttempt > 0) {
+                if (!assistantFailed && this._retryAttempt > 0) {
                     this._emit({
                         type: "auto_retry_end",
                         success: true,
@@ -415,8 +425,16 @@ export class AgentSession {
         if (event.type === "agent_end" && this._lastAssistantMessage) {
             const msg = this._lastAssistantMessage;
             this._lastAssistantMessage = undefined;
-            // Check for retryable errors first (overloaded, rate limit, server errors)
-            if (this._isRetryableError(msg)) {
+            // Check for retryable errors first (overloaded, rate limit, server errors,
+            // transient provider finish_reason errors, or degenerate empty completions)
+            const retryableError = this._isRetryableError(msg);
+            const emptyCompletion = !retryableError && this._isEmptyCompletion(msg);
+            if (retryableError || emptyCompletion) {
+                if (emptyCompletion && !msg.errorMessage) {
+                    // Surface a clear reason in the retry banner; empty completions carry no
+                    // provider error message of their own.
+                    msg.errorMessage = "Provider returned an empty completion";
+                }
                 const didRetry = await this._handleRetryableError(msg);
                 if (didRetry)
                     return; // Retry was initiated, don't proceed to compaction
@@ -879,6 +897,16 @@ export class AgentSession {
                 throw new Error(formatUnresolvedModelMessage(this.model));
             }
             if (!this._modelRegistry.hasConfiguredAuth(this.model)) {
+                // A failed credential-store load (for example auth.json briefly locked
+                // by a concurrent process, or invalid JSON) leaves an empty in-memory
+                // credential set. That would otherwise be misreported here as
+                // "No API key found" even though the credentials exist on disk. Surface
+                // the real load failure instead so configured providers are not falsely
+                // reported as unauthenticated (issue #1431).
+                const authLoadError = this._modelRegistry.authStorage.getLoadError();
+                if (authLoadError) {
+                    throw new Error(formatAuthStorageLoadFailedMessage(this.model.provider, authLoadError), { cause: authLoadError });
+                }
                 const isOAuth = this._modelRegistry.isUsingOAuth(this.model);
                 if (isOAuth) {
                     throw new Error(`Authentication failed for "${this.model.provider}". ` +
@@ -2009,7 +2037,11 @@ export class AgentSession {
         else {
             contextTokens = calculateContextTokens(assistantMessage.usage);
         }
-        if (shouldCompact(contextTokens, contextWindow, settings)) {
+        // Compact against the effective input budget (the hard prompt cap for providers like Copilot
+        // that advertise a larger total window) so we compact before overrunning the server-side limit
+        // rather than relying on reactive overflow recovery near the cap.
+        const compactionBudget = this.model ? getEffectiveInputBudget(this.model) : contextWindow;
+        if (shouldCompact(contextTokens, compactionBudget, settings)) {
             await this._runAutoCompaction("threshold", false);
         }
     }
@@ -2017,7 +2049,11 @@ export class AgentSession {
         if (!this.model || this.model.provider !== "github-copilot" || !assistantMessage.errorMessage)
             return false;
         const promptLimitError = parseCopilotPromptLimitError(assistantMessage.errorMessage);
-        return promptLimitError !== undefined && this.model.contextWindow > promptLimitError.limitTokens;
+        // Compare against the effective input budget (the model's real prompt cap), not the displayed
+        // total window. A rejection at the prompt cap is a normal overflow we should compact-and-retry;
+        // only a rejection *below* the cap (e.g. a missing long-context entitlement dropping the account
+        // to a lower server tier) keeps the friendly error visible instead of silently compacting down.
+        return promptLimitError !== undefined && getEffectiveInputBudget(this.model) > promptLimitError.limitTokens;
     }
     /**
      * Internal: remove the trailing overflow error from retry context if it is still present.
@@ -2386,7 +2422,23 @@ export class AgentSession {
         for (const tool of wrappedExtensionTools) {
             toolRegistry.set(tool.name, tool);
         }
-        this._toolRegistry = toolRegistry;
+        // GitHub Copilot Gemini serializes array/object tool-call arguments as
+        // flattened `name[index]` keys (confirmed on the raw CAPI wire). Reconstruct
+        // them into proper arrays/objects before per-tool preparation and schema
+        // validation, so tool calls (notably structured_output) don't fail and loop.
+        // Gated to Copilot Gemini at call time via this.model; a no-op otherwise.
+        // `prepareArguments` is a plain function field (no `this` binding), and the
+        // `{ ...tool }` spread assumes AgentTools are plain objects — matching the
+        // existing tool-definition-wrapper pattern; a class-instance tool would lose
+        // prototype members here.
+        this._toolRegistry = new Map(Array.from(toolRegistry, ([name, tool]) => {
+            const basePrepareArguments = tool.prepareArguments;
+            const prepareArguments = (args) => {
+                const normalized = normalizeToolArgumentsForModel(args, this.model, tool.parameters);
+                return basePrepareArguments ? basePrepareArguments(normalized) : normalized;
+            };
+            return [name, { ...tool, prepareArguments }];
+        }));
         const nextActiveToolNames = (options?.activeToolNames ? [...options.activeToolNames] : [...previousActiveToolNames]).filter((name) => isExposedTool(name));
         if (allowedToolNames) {
             for (const toolName of this._toolRegistry.keys()) {
@@ -2484,8 +2536,80 @@ export class AgentSession {
         if (isContextOverflow(message, contextWindow))
             return false;
         const err = message.errorMessage;
-        // Match: overloaded_error, provider returned error, rate limit, 429, 500, 502, 503, 504, service unavailable, network/connection errors (including connection lost), WebSocket transport closes/errors, fetch failed, premature stream endings, HTTP/2 closed before response, terminated, retry delay exceeded
-        return /overloaded|provider.?returned.?error|rate.?limit|too many requests|429|500|502|503|504|service.?unavailable|server.?error|internal.?error|network.?error|connection.?error|connection.?refused|connection.?lost|websocket.?closed|websocket.?error|other side closed|fetch failed|upstream.?connect|reset before headers|socket hang up|ended without|stream ended before message_stop|http2 request did not get a response|timed? out|timeout|terminated|retry delay/i.test(err);
+        // A genuine `content_filter` stop is a deliberate safety block: retrying it
+        // re-issues the same blocked request up to maxRetries times for no benefit.
+        // GitHub Copilot Gemini is the exception — CAPI maps spurious Gemini blocks
+        // (RECITATION/safety on MALFORMED_FUNCTION_CALL etc.) to `content_filter`, so
+        // only treat `content_filter` as retryable for those models.
+        if (isCopilotGeminiModel({ provider: message.provider, api: message.api, id: message.model }) &&
+            /finish.?reason:?\s*content.?filter/i.test(err)) {
+            return true;
+        }
+        // Match: overloaded_error, provider returned error, rate limit, 429, 500, 502, 503, 504, service unavailable, network/connection errors (including connection lost), WebSocket transport closes/errors, fetch failed, premature stream endings, HTTP/2 closed before response, terminated, retry delay exceeded, and a bare/transient provider finish_reason "error" (e.g. github-copilot Gemini's CAPI mapping of MALFORMED_FUNCTION_CALL/OTHER/UNEXPECTED_TOOL_CALL). These are provider-agnostic transient failures.
+        return /overloaded|provider.?returned.?error|rate.?limit|too many requests|429|500|502|503|504|service.?unavailable|server.?error|internal.?error|network.?error|connection.?error|connection.?refused|connection.?lost|websocket.?closed|websocket.?error|other side closed|fetch failed|upstream.?connect|reset before headers|socket hang up|ended without|stream ended before message_stop|http2 request did not get a response|timed? out|timeout|terminated|retry delay|finish.?reason:?\s*error/i.test(err);
+    }
+    /**
+     * For GitHub Copilot Gemini, reconstruct flattened tool-call arguments
+     * (for example `edits[0].newText`) into the nested arrays/objects Gemini
+     * produced before the assistant message is persisted, so saved transcripts
+     * never carry the flattened CAPI wire shape and replays loaded from disk match
+     * the structure Gemini signed. In-place, gated to Copilot Gemini, and a no-op
+     * for well-formed arguments or any other provider/model. The outbound replay
+     * normalizer still heals already-persisted (legacy) sessions on the wire.
+     */
+    _normalizePersistedGeminiToolArgs(message) {
+        const model = this.model;
+        if (!model || !isCopilotGeminiModel(model))
+            return;
+        for (const block of message.content) {
+            if (block.type !== "toolCall")
+                continue;
+            const tool = this._toolRegistry.get(block.name);
+            const normalized = normalizeToolArgumentsForModel(block.arguments, model, tool?.parameters);
+            if (normalized !== block.arguments && normalized !== null && typeof normalized === "object") {
+                block.arguments = normalized;
+            }
+        }
+    }
+    /**
+     * Detect a degenerate empty completion: the provider ended the stream with no
+     * usable content and zero output tokens. Seen with github-copilot Gemini models
+     * that emit finish_reason "stop" (or a tool-use stop) with an empty content array
+     * and 0 output tokens, leaving the turn dead instead of producing the next step.
+     *
+     * These are treated as retryable so the harness re-issues the request rather than
+     * silently stopping mid-task. Guarded tightly (no text, no tool call, no thinking,
+     * and output === 0) so legitimate non-empty turns are never matched.
+     *
+     * Intentionally provider-agnostic (not gated to Copilot Gemini): a degenerate
+     * empty turn is a transient failure for any provider. It is bounded by
+     * `maxRetries` and falls through to normal handling on exhaustion.
+     */
+    _isEmptyCompletion(message) {
+        // Only "completed" stop reasons can be deceptively empty. Real errors are handled
+        // by _isRetryableError; aborted/length turns are intentional outcomes.
+        if (message.stopReason !== "stop" && message.stopReason !== "toolUse")
+            return false;
+        const content = message.content;
+        if (Array.isArray(content)) {
+            const hasContent = content.some((part) => {
+                if (part.type === "text")
+                    return part.text.trim().length > 0;
+                if (part.type === "toolCall")
+                    return true;
+                if (part.type === "thinking")
+                    return part.redacted === true || part.thinking.trim().length > 0;
+                return true; // unknown part types count as content
+            });
+            if (hasContent)
+                return false;
+        }
+        // A turn that produced output tokens but no surfaced content is not "empty"
+        // (e.g. reasoning-only responses); leave those alone. Note: a provider that
+        // fails to report `usage` (output defaults to 0) would make every
+        // content-less turn match here; the dual requirement (empty content AND zero
+        // output) keeps that false-positive risk low in practice.
+        return (message.usage?.output ?? 0) === 0;
     }
     /**
      * Handle retryable errors with exponential backoff.