npm - @llumiverse/drivers - Versions diffs - 1.0.0-dev.20260202.145450Z → 1.0.0 - Mend

@llumiverse/drivers 1.0.0-dev.20260202.145450Z → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (240) hide show

package/lib/cjs/adobe/firefly.js +120 -0
package/lib/cjs/adobe/firefly.js.map +1 -0
package/lib/cjs/azure/azure_foundry.js +432 -0
package/lib/cjs/azure/azure_foundry.js.map +1 -0
package/lib/cjs/bedrock/converse.js +359 -0
package/lib/cjs/bedrock/converse.js.map +1 -0
package/lib/cjs/bedrock/index.js +1441 -0
package/lib/cjs/bedrock/index.js.map +1 -0
package/lib/cjs/bedrock/nova-image-payload.js +207 -0
package/lib/cjs/bedrock/nova-image-payload.js.map +1 -0
package/lib/cjs/bedrock/payloads.js +3 -0
package/lib/cjs/bedrock/payloads.js.map +1 -0
package/lib/cjs/bedrock/s3.js +107 -0
package/lib/cjs/bedrock/s3.js.map +1 -0
package/lib/cjs/bedrock/twelvelabs.js +87 -0
package/lib/cjs/bedrock/twelvelabs.js.map +1 -0
package/lib/cjs/groq/index.js +326 -0
package/lib/cjs/groq/index.js.map +1 -0
package/lib/cjs/huggingface_ie.js +201 -0
package/lib/cjs/huggingface_ie.js.map +1 -0
package/lib/cjs/index.js +31 -0
package/lib/cjs/index.js.map +1 -0
package/lib/cjs/mistral/index.js +176 -0
package/lib/cjs/mistral/index.js.map +1 -0
package/lib/cjs/mistral/types.js +83 -0
package/lib/cjs/mistral/types.js.map +1 -0
package/lib/cjs/openai/azure_openai.js +72 -0
package/lib/cjs/openai/azure_openai.js.map +1 -0
package/lib/cjs/openai/index.js +1100 -0
package/lib/cjs/openai/index.js.map +1 -0
package/lib/cjs/openai/openai.js +21 -0
package/lib/cjs/openai/openai.js.map +1 -0
package/lib/cjs/openai/openai_compatible.js +63 -0
package/lib/cjs/openai/openai_compatible.js.map +1 -0
package/lib/cjs/openai/openai_format.js +131 -0
package/lib/cjs/openai/openai_format.js.map +1 -0
package/lib/cjs/package.json +3 -0
package/lib/cjs/replicate.js +275 -0
package/lib/cjs/replicate.js.map +1 -0
package/lib/cjs/test-driver/TestErrorCompletionStream.js +20 -0
package/lib/cjs/test-driver/TestErrorCompletionStream.js.map +1 -0
package/lib/cjs/test-driver/TestValidationErrorCompletionStream.js +24 -0
package/lib/cjs/test-driver/TestValidationErrorCompletionStream.js.map +1 -0
package/lib/cjs/test-driver/index.js +109 -0
package/lib/cjs/test-driver/index.js.map +1 -0
package/lib/cjs/test-driver/utils.js +30 -0
package/lib/cjs/test-driver/utils.js.map +1 -0
package/lib/cjs/togetherai/index.js +126 -0
package/lib/cjs/togetherai/index.js.map +1 -0
package/lib/cjs/togetherai/interfaces.js +3 -0
package/lib/cjs/togetherai/interfaces.js.map +1 -0
package/lib/cjs/vertexai/debug.js +12 -0
package/lib/cjs/vertexai/debug.js.map +1 -0
package/lib/cjs/vertexai/embeddings/embeddings-image.js +27 -0
package/lib/cjs/vertexai/embeddings/embeddings-image.js.map +1 -0
package/lib/cjs/vertexai/embeddings/embeddings-text.js +23 -0
package/lib/cjs/vertexai/embeddings/embeddings-text.js.map +1 -0
package/lib/cjs/vertexai/index.js +635 -0
package/lib/cjs/vertexai/index.js.map +1 -0
package/lib/cjs/vertexai/models/claude.js +842 -0
package/lib/cjs/vertexai/models/claude.js.map +1 -0
package/lib/cjs/vertexai/models/gemini.js +1110 -0
package/lib/cjs/vertexai/models/gemini.js.map +1 -0
package/lib/cjs/vertexai/models/imagen.js +303 -0
package/lib/cjs/vertexai/models/imagen.js.map +1 -0
package/lib/cjs/vertexai/models/llama.js +183 -0
package/lib/cjs/vertexai/models/llama.js.map +1 -0
package/lib/cjs/vertexai/models.js +35 -0
package/lib/cjs/vertexai/models.js.map +1 -0
package/lib/cjs/watsonx/index.js +161 -0
package/lib/cjs/watsonx/index.js.map +1 -0
package/lib/cjs/watsonx/interfaces.js +3 -0
package/lib/cjs/watsonx/interfaces.js.map +1 -0
package/lib/cjs/xai/index.js +65 -0
package/lib/cjs/xai/index.js.map +1 -0
package/lib/esm/adobe/firefly.js +116 -0
package/lib/esm/adobe/firefly.js.map +1 -0
package/lib/esm/azure/azure_foundry.js +426 -0
package/lib/esm/azure/azure_foundry.js.map +1 -0
package/lib/esm/bedrock/converse.js +352 -0
package/lib/esm/bedrock/converse.js.map +1 -0
package/lib/esm/bedrock/index.js +1434 -0
package/lib/esm/bedrock/index.js.map +1 -0
package/lib/esm/bedrock/nova-image-payload.js +203 -0
package/lib/esm/bedrock/nova-image-payload.js.map +1 -0
package/lib/esm/bedrock/payloads.js +2 -0
package/lib/esm/bedrock/payloads.js.map +1 -0
package/lib/esm/bedrock/s3.js +99 -0
package/lib/esm/bedrock/s3.js.map +1 -0
package/lib/esm/bedrock/twelvelabs.js +84 -0
package/lib/esm/bedrock/twelvelabs.js.map +1 -0
package/lib/esm/groq/index.js +319 -0
package/lib/esm/groq/index.js.map +1 -0
package/lib/esm/huggingface_ie.js +197 -0
package/lib/esm/huggingface_ie.js.map +1 -0
package/lib/esm/index.js +15 -0
package/lib/esm/index.js.map +1 -0
package/lib/esm/mistral/index.js +172 -0
package/lib/esm/mistral/index.js.map +1 -0
package/lib/esm/mistral/types.js +80 -0
package/lib/esm/mistral/types.js.map +1 -0
package/lib/esm/openai/azure_openai.js +68 -0
package/lib/esm/openai/azure_openai.js.map +1 -0
package/lib/esm/openai/index.js +1093 -0
package/lib/esm/openai/index.js.map +1 -0
package/lib/esm/openai/openai.js +14 -0
package/lib/esm/openai/openai.js.map +1 -0
package/lib/esm/openai/openai_compatible.js +56 -0
package/lib/esm/openai/openai_compatible.js.map +1 -0
package/lib/esm/openai/openai_format.js +127 -0
package/lib/esm/openai/openai_format.js.map +1 -0
package/lib/esm/replicate.js +268 -0
package/lib/esm/replicate.js.map +1 -0
package/lib/esm/test-driver/TestErrorCompletionStream.js +16 -0
package/lib/esm/test-driver/TestErrorCompletionStream.js.map +1 -0
package/lib/esm/test-driver/TestValidationErrorCompletionStream.js +20 -0
package/lib/esm/test-driver/TestValidationErrorCompletionStream.js.map +1 -0
package/lib/esm/test-driver/index.js +91 -0
package/lib/esm/test-driver/index.js.map +1 -0
package/lib/esm/test-driver/utils.js +25 -0
package/lib/esm/test-driver/utils.js.map +1 -0
package/lib/esm/togetherai/index.js +122 -0
package/lib/esm/togetherai/index.js.map +1 -0
package/lib/esm/togetherai/interfaces.js +2 -0
package/lib/esm/togetherai/interfaces.js.map +1 -0
package/lib/esm/vertexai/debug.js +6 -0
package/lib/esm/vertexai/debug.js.map +1 -0
package/lib/esm/vertexai/embeddings/embeddings-image.js +24 -0
package/lib/esm/vertexai/embeddings/embeddings-image.js.map +1 -0
package/lib/esm/vertexai/embeddings/embeddings-text.js +20 -0
package/lib/esm/vertexai/embeddings/embeddings-text.js.map +1 -0
package/lib/esm/vertexai/index.js +630 -0
package/lib/esm/vertexai/index.js.map +1 -0
package/lib/esm/vertexai/models/claude.js +833 -0
package/lib/esm/vertexai/models/claude.js.map +1 -0
package/lib/esm/vertexai/models/gemini.js +1104 -0
package/lib/esm/vertexai/models/gemini.js.map +1 -0
package/lib/esm/vertexai/models/imagen.js +299 -0
package/lib/esm/vertexai/models/imagen.js.map +1 -0
package/lib/esm/vertexai/models/llama.js +179 -0
package/lib/esm/vertexai/models/llama.js.map +1 -0
package/lib/esm/vertexai/models.js +32 -0
package/lib/esm/vertexai/models.js.map +1 -0
package/lib/esm/watsonx/index.js +157 -0
package/lib/esm/watsonx/index.js.map +1 -0
package/lib/esm/watsonx/interfaces.js +2 -0
package/lib/esm/watsonx/interfaces.js.map +1 -0
package/lib/esm/xai/index.js +58 -0
package/lib/esm/xai/index.js.map +1 -0
package/lib/types/adobe/firefly.d.ts +30 -0
package/lib/types/adobe/firefly.d.ts.map +1 -0
package/lib/types/azure/azure_foundry.d.ts +52 -0
package/lib/types/azure/azure_foundry.d.ts.map +1 -0
package/lib/types/bedrock/converse.d.ts +8 -0
package/lib/types/bedrock/converse.d.ts.map +1 -0
package/lib/types/bedrock/index.d.ts +135 -0
package/lib/types/bedrock/index.d.ts.map +1 -0
package/lib/types/bedrock/nova-image-payload.d.ts +74 -0
package/lib/types/bedrock/nova-image-payload.d.ts.map +1 -0
package/lib/types/bedrock/payloads.d.ts +12 -0
package/lib/types/bedrock/payloads.d.ts.map +1 -0
package/lib/types/bedrock/s3.d.ts +23 -0
package/lib/types/bedrock/s3.d.ts.map +1 -0
package/lib/types/bedrock/twelvelabs.d.ts +50 -0
package/lib/types/bedrock/twelvelabs.d.ts.map +1 -0
package/lib/types/groq/index.d.ts +27 -0
package/lib/types/groq/index.d.ts.map +1 -0
package/lib/types/huggingface_ie.d.ts +35 -0
package/lib/types/huggingface_ie.d.ts.map +1 -0
package/lib/types/index.d.ts +15 -0
package/lib/types/index.d.ts.map +1 -0
package/lib/types/mistral/index.d.ts +25 -0
package/lib/types/mistral/index.d.ts.map +1 -0
package/lib/types/mistral/types.d.ts +127 -0
package/lib/types/mistral/types.d.ts.map +1 -0
package/lib/types/openai/azure_openai.d.ts +25 -0
package/lib/types/openai/azure_openai.d.ts.map +1 -0
package/lib/types/openai/index.d.ts +126 -0
package/lib/types/openai/index.d.ts.map +1 -0
package/lib/types/openai/openai.d.ts +15 -0
package/lib/types/openai/openai.d.ts.map +1 -0
package/lib/types/openai/openai_compatible.d.ts +31 -0
package/lib/types/openai/openai_compatible.d.ts.map +1 -0
package/lib/types/openai/openai_format.d.ts +21 -0
package/lib/types/openai/openai_format.d.ts.map +1 -0
package/lib/types/replicate.d.ts +48 -0
package/lib/types/replicate.d.ts.map +1 -0
package/lib/types/test-driver/TestErrorCompletionStream.d.ts +9 -0
package/lib/types/test-driver/TestErrorCompletionStream.d.ts.map +1 -0
package/lib/types/test-driver/TestValidationErrorCompletionStream.d.ts +9 -0
package/lib/types/test-driver/TestValidationErrorCompletionStream.d.ts.map +1 -0
package/lib/types/test-driver/index.d.ts +24 -0
package/lib/types/test-driver/index.d.ts.map +1 -0
package/lib/types/test-driver/utils.d.ts +5 -0
package/lib/types/test-driver/utils.d.ts.map +1 -0
package/lib/types/togetherai/index.d.ts +23 -0
package/lib/types/togetherai/index.d.ts.map +1 -0
package/lib/types/togetherai/interfaces.d.ts +96 -0
package/lib/types/togetherai/interfaces.d.ts.map +1 -0
package/lib/types/vertexai/debug.d.ts +2 -0
package/lib/types/vertexai/debug.d.ts.map +1 -0
package/lib/types/vertexai/embeddings/embeddings-image.d.ts +11 -0
package/lib/types/vertexai/embeddings/embeddings-image.d.ts.map +1 -0
package/lib/types/vertexai/embeddings/embeddings-text.d.ts +10 -0
package/lib/types/vertexai/embeddings/embeddings-text.d.ts.map +1 -0
package/lib/types/vertexai/index.d.ts +79 -0
package/lib/types/vertexai/index.d.ts.map +1 -0
package/lib/types/vertexai/models/claude.d.ts +103 -0
package/lib/types/vertexai/models/claude.d.ts.map +1 -0
package/lib/types/vertexai/models/gemini.d.ts +78 -0
package/lib/types/vertexai/models/gemini.d.ts.map +1 -0
package/lib/types/vertexai/models/imagen.d.ts +75 -0
package/lib/types/vertexai/models/imagen.d.ts.map +1 -0
package/lib/types/vertexai/models/llama.d.ts +20 -0
package/lib/types/vertexai/models/llama.d.ts.map +1 -0
package/lib/types/vertexai/models.d.ts +20 -0
package/lib/types/vertexai/models.d.ts.map +1 -0
package/lib/types/watsonx/index.d.ts +27 -0
package/lib/types/watsonx/index.d.ts.map +1 -0
package/lib/types/watsonx/interfaces.d.ts +65 -0
package/lib/types/watsonx/interfaces.d.ts.map +1 -0
package/lib/types/xai/index.d.ts +18 -0
package/lib/types/xai/index.d.ts.map +1 -0
package/package.json +18 -18
package/src/bedrock/converse.ts +85 -10
package/src/bedrock/error-handling.test.ts +352 -0
package/src/bedrock/index.ts +293 -16
package/src/groq/index.ts +9 -4
package/src/mistral/index.ts +25 -22
package/src/mistral/types.ts +0 -5
package/src/openai/error-handling.test.ts +567 -0
package/src/openai/index.ts +513 -33
package/src/openai/openai_compatible.ts +7 -0
package/src/openai/openai_format.ts +1 -1
package/src/vertexai/index.ts +61 -13
package/src/vertexai/models/claude-error-handling.test.ts +432 -0
package/src/vertexai/models/claude.ts +287 -10
package/src/vertexai/models/gemini-error-handling.test.ts +353 -0
package/src/vertexai/models/gemini.ts +329 -52
package/src/vertexai/models.ts +7 -2

package/src/vertexai/models/claude.ts CHANGED Viewed

@@ -1,13 +1,37 @@
+import {
+    APIConnectionError,
+    APIConnectionTimeoutError,
+    APIError,
+    AuthenticationError,
+    BadRequestError,
+    ConflictError,
+    InternalServerError,
+    NotFoundError,
+    PermissionDeniedError,
+    RateLimitError,
+    UnprocessableEntityError,
+} from '@anthropic-ai/sdk/error';
 import { ContentBlock, ContentBlockParam, DocumentBlockParam, ImageBlockParam, Message, MessageParam, TextBlockParam, ToolResultBlockParam } from "@anthropic-ai/sdk/resources/index.js";
+import { MessageStreamParams } from "@anthropic-ai/sdk/resources/index.mjs";
+import { MessageCreateParamsBase, MessageCreateParamsNonStreaming, RawMessageStreamEvent } from "@anthropic-ai/sdk/resources/messages.js";
 import {
-    AIModel, Completion, CompletionChunkObject, ExecutionOptions, getMaxTokensLimitVertexAi, JSONObject, ModelType,
-    PromptRole, PromptSegment, readStreamAsBase64, readStreamAsString, StatelessExecutionOptions, ToolUse, VertexAIClaudeOptions
+    AIModel, Completion, CompletionChunkObject, ExecutionOptions,
+    getConversationMeta,
+    getMaxTokensLimitVertexAi,
+    incrementConversationTurn,
+    JSONObject,
+    LlumiverseError, LlumiverseErrorContext,
+    ModelType,
+    PromptRole, PromptSegment, readStreamAsBase64, readStreamAsString, StatelessExecutionOptions,
+    stripBase64ImagesFromConversation,
+    stripHeartbeatsFromConversation,
+    ToolUse,
+    truncateLargeTextInConversation,
+    VertexAIClaudeOptions
 } from "@llumiverse/core";
 import { asyncMap } from "@llumiverse/core/async";
 import { VertexAIDriver } from "../index.js";
 import { ModelDefinition } from "../models.js";
-import { MessageCreateParamsBase, MessageCreateParamsNonStreaming, RawMessageStreamEvent } from "@anthropic-ai/sdk/resources/messages.js";
-import { MessageStreamParams } from "@anthropic-ai/sdk/resources/index.mjs";
 export const ANTHROPIC_REGIONS: Record<string, string> = {
     us: "us-east5",
@@ -83,13 +107,12 @@ function maxToken(option: StatelessExecutionOptions): number {
     if (modelOptions && typeof modelOptions.max_tokens === "number") {
         return modelOptions.max_tokens;
     } else {
-        const thinking_budget = modelOptions?.thinking_budget_tokens ?? 0;
         let maxSupportedTokens = getMaxTokensLimitVertexAi(option.model);
         // Fallback to the default max tokens limit for the model
         if (option.model.includes('claude-3-7-sonnet') && (modelOptions?.thinking_budget_tokens ?? 0) < 48000) {
             maxSupportedTokens = 64000; // Claude 3.7 can go up to 128k with a beta header, but when no max tokens is specified, we default to 64k.
         }
-        return Math.min(16000 + thinking_budget, maxSupportedTokens); // Cap to 16k, to avoid taking up too much context window and quota.
+        return maxSupportedTokens;
     }
 }
@@ -291,6 +314,21 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
         conversation = updateConversation(conversation, createPromptFromResponse(result));
+        // Increment turn counter and apply stripping (same pattern as other drivers)
+        conversation = incrementConversationTurn(conversation) as ClaudePrompt;
+        const currentTurn = getConversationMeta(conversation).turnNumber;
+        const stripOptions = {
+            keepForTurns: options.stripImagesAfterTurns ?? Infinity,
+            currentTurn,
+            textMaxTokens: options.stripTextMaxTokens,
+        };
+        let processedConversation = stripBase64ImagesFromConversation(conversation, stripOptions);
+        processedConversation = truncateLargeTextInConversation(processedConversation, stripOptions);
+        processedConversation = stripHeartbeatsFromConversation(processedConversation, {
+            keepForTurns: options.stripHeartbeatsAfterTurns ?? 1,
+            currentTurn,
+        });
         return {
             result: text ? [{ type: "text", value: text }] : [{ type: "text", value: '' }],
             tool_use,
@@ -301,7 +339,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
             },
             // make sure we set finish_reason to the correct value (claude is normally setting this by itself)
             finish_reason: tool_use ? "tool_use" : claudeFinishReason(result?.stop_reason ?? ''),
-            conversation
+            conversation: processedConversation
         } satisfies Completion;
     }
@@ -433,6 +471,170 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
         return stream;
     }
+    /**
+     * Format Anthropic API errors into LlumiverseError with proper status codes and retryability.
+     *
+     * Anthropic API errors have a specific structure:
+     * - APIError.status: HTTP status code (400, 401, 403, 404, 409, 422, 429, 500+)
+     * - APIError.error: Nested error object with type and message
+     * - APIError.requestID: Request ID for support (can be null)
+     *
+     * Common error types:
+     * - BadRequestError (400): Invalid request parameters
+     * - AuthenticationError (401): Authentication required
+     * - PermissionDeniedError (403): Insufficient permissions
+     * - NotFoundError (404): Resource not found
+     * - ConflictError (409): Resource conflict
+     * - UnprocessableEntityError (422): Validation error
+     * - RateLimitError (429): Rate limit exceeded
+     * - InternalServerError (500+): Server-side errors
+     * - APIConnectionError: Connection issues (no status code)
+     * - APIConnectionTimeoutError: Request timeout (no status code)
+     *
+     * The message of the returned error is assembled as
+     * `[<context.provider>] <errorType>: [<status>] <message> (Request ID: <id>)`.
+     * The `<errorType>: ` prefix is omitted when no nested type was found or when it is
+     * the literal 'error'; the `[<status>] ` part and the request ID suffix are omitted
+     * when the corresponding value is falsy.
+     *
+     * @param _driver - The Vertex AI driver; not used by this implementation.
+     * @param error - The value thrown by the request.
+     * @param context - Error context; `context.provider` prefixes the message and the
+     *   object itself is passed through to the LlumiverseError constructor.
+     * @returns A LlumiverseError wrapping the original error together with the
+     *   retryability verdict from `isClaudeErrorRetryable`, the HTTP status code, and the
+     *   error's constructor name (falling back to 'AnthropicError').
+     * @throws Rethrows `error` unchanged when it is not an `APIError` instance.
+     *
+     * @see https://docs.anthropic.com/en/api/errors
+     */
+    formatLlumiverseError(
+        _driver: VertexAIDriver,
+        error: unknown,
+        context: LlumiverseErrorContext
+    ): LlumiverseError {
+        // Check if it's an Anthropic API error
+        const isAnthropicError = this.isAnthropicApiError(error);
+        if (!isAnthropicError) {
+            // Not an Anthropic API error: rethrow it unchanged (presumably so the caller can fall back to its default handling — confirm against the caller)
+            throw error;
+        }
+        const apiError = error as APIError;
+        const httpStatusCode = apiError.status;
+        // Extract error message and nested error details
+        let message = apiError.message || String(error);
+        // Extract error type from nested error object if available
+        let errorType: string | undefined;
+        if (apiError.error && typeof apiError.error === 'object') {
+            const nestedError = apiError.error as any; // shape is not typed here, so it is probed defensively below
+            if (nestedError.error && typeof nestedError.error === 'object') { // expects a body like { error: { type, message } }
+                errorType = nestedError.error.type;
+                // Use the nested error message if it's more specific
+                if (nestedError.error.message) {
+                    message = nestedError.error.message;
+                }
+            }
+        }
+        // Build user-facing message with status code
+        let userMessage = message;
+        // Include status code in message (for end-user visibility)
+        if (httpStatusCode) {
+            userMessage = `[${httpStatusCode}] ${userMessage}`;
+        }
+        // Include error type if available (the generic type 'error' carries no information and is skipped)
+        if (errorType && errorType !== 'error') {
+            userMessage = `${errorType}: ${userMessage}`;
+        }
+        // Add request ID if available (useful for Anthropic support)
+        if (apiError.requestID) {
+            userMessage += ` (Request ID: ${apiError.requestID})`;
+        }
+        // Determine retryability based on Anthropic error types
+        const retryable = this.isClaudeErrorRetryable(error, httpStatusCode, errorType);
+        // Use the error constructor name as the error name
+        const errorName = error.constructor?.name || 'AnthropicError';
+        return new LlumiverseError(
+            `[${context.provider}] ${userMessage}`,
+            retryable,
+            context,
+            error,
+            httpStatusCode,
+            errorName
+        );
+    }
+    /**
+     * Type guard to check if error is an Anthropic API error.
+     *
+     * The null and `typeof` checks are redundant with `instanceof` (which is already
+     * false for null and primitives) but harmless.
+     *
+     * @param error - Any thrown value.
+     * @returns True when `error` is a non-null object that is an instance of the
+     *   Anthropic SDK `APIError` class (including its subclasses).
+     */
+    private isAnthropicApiError(error: unknown): error is APIError {
+        return (
+            error !== null &&
+            typeof error === 'object' &&
+            error instanceof APIError
+        );
+    }
+    /**
+     * Determine if an Anthropic API error is retryable.
+     *
+     * Checks run in this order, and the first one that matches decides the result:
+     * SDK error class, nested error type, HTTP status code, generic connection error.
+     *
+     * Retryable errors:
+     * - RateLimitError (429): Rate limit exceeded, retry with backoff
+     * - InternalServerError (500+): Server-side errors
+     * - APIConnectionTimeoutError: Request timeout
+     * - 408 (Request Timeout): Request timeout
+     * - 529 (Overloaded): Service overloaded
+     * - APIConnectionError other than a timeout, when no earlier check matched
+     *
+     * Non-retryable errors:
+     * - BadRequestError (400): Invalid request parameters
+     * - AuthenticationError (401): Authentication failure
+     * - PermissionDeniedError (403): Insufficient permissions
+     * - NotFoundError (404): Resource not found
+     * - ConflictError (409): Resource conflict
+     * - UnprocessableEntityError (422): Validation error
+     * - Other 4xx client errors
+     * - invalid_request_error: Invalid request structure
+     *
+     * @param error - The error object
+     * @param httpStatusCode - The HTTP status code if available
+     * @param errorType - The nested error type if available
+     * @returns True if retryable, false if not retryable, undefined if unknown
+     */
+    private isClaudeErrorRetryable(
+        error: unknown,
+        httpStatusCode: number | undefined,
+        errorType: string | undefined
+    ): boolean | undefined {
+        // Check specific Anthropic error types by class
+        if (error instanceof RateLimitError) return true;
+        if (error instanceof InternalServerError) return true;
+        if (error instanceof APIConnectionTimeoutError) return true;
+        // Non-retryable by error type
+        if (error instanceof BadRequestError) return false;
+        if (error instanceof AuthenticationError) return false;
+        if (error instanceof PermissionDeniedError) return false;
+        if (error instanceof NotFoundError) return false;
+        if (error instanceof ConflictError) return false;
+        if (error instanceof UnprocessableEntityError) return false;
+        // Check nested error type (takes precedence over the status-code rules below)
+        if (errorType === 'invalid_request_error') return false;
+        // Use HTTP status code (for errors that matched none of the classes above)
+        if (httpStatusCode !== undefined) {
+            if (httpStatusCode === 429) return true; // Rate limit
+            if (httpStatusCode === 408) return true; // Request timeout; must precede the generic 4xx rule below
+            if (httpStatusCode === 529) return true; // Overloaded; also covered by the 5xx range below
+            if (httpStatusCode >= 500 && httpStatusCode < 600) return true; // Server errors
+            if (httpStatusCode >= 400 && httpStatusCode < 500) return false; // Client errors
+        }
+        // Connection errors without status codes
+        if (error instanceof APIConnectionError && !(error instanceof APIConnectionTimeoutError)) {
+            // Generic connection errors might be retryable (network issues); timeouts already returned true above, so the second operand is always true here
+            return true;
+        }
+        // Unknown error type - let consumer decide retry strategy
+        return undefined;
+    }
 }
 function createPromptFromResponse(response: Message): ClaudePrompt {
@@ -668,7 +870,7 @@ function getClaudePayload(options: ExecutionOptions, prompt: ClaudePrompt): { pa
     // Fix orphaned tool_use blocks (can occur when agent is stopped mid-tool-execution)
     const fixedMessages = fixOrphanedToolUse(prompt.messages);
     // Sanitize messages to remove empty text blocks (can occur from interrupted streaming)
-    const sanitizedMessages = sanitizeMessages(fixedMessages);
+    let sanitizedMessages = sanitizeMessages(fixedMessages);
     // Validate tools have input_schema.type set to 'object' as required by the Anthropic SDK
     if (options.tools) {
@@ -679,14 +881,21 @@ function getClaudePayload(options: ExecutionOptions, prompt: ClaudePrompt): { pa
         }
     }
+    // When no tools are provided but conversation contains tool_use/tool_result blocks
+    // (e.g. checkpoint summary calls), convert tool blocks to text to avoid API errors
+    const hasTools = options.tools && options.tools.length > 0;
+    if (!hasTools && claudeMessagesContainToolBlocks(sanitizedMessages)) {
+        sanitizedMessages = convertClaudeToolBlocksToText(sanitizedMessages);
+    }
     const payload = {
         messages: sanitizedMessages,
         system: prompt.system,
-        tools: options.tools as MessageCreateParamsBase['tools'],
+        tools: hasTools ? options.tools as MessageCreateParamsBase['tools'] : undefined,
         temperature: model_options?.temperature,
         model: modelName,
         max_tokens: maxToken(options),
-        top_p: model_options?.top_p,
+        top_p: model_options?.temperature != null ? undefined : model_options?.top_p,
         top_k: model_options?.top_k,
         stop_sequences: model_options?.stop_sequence,
         thinking: model_options?.thinking_mode ?
@@ -700,3 +909,71 @@ function getClaudePayload(options: ExecutionOptions, prompt: ClaudePrompt): { pa
     return { payload, requestOptions };
 }
+/**
+ * Checks whether any Claude message contains tool_use or tool_result content blocks.
+ *
+ * Messages whose `content` is not an array (plain string content) are skipped, and
+ * the scan stops at the first matching block.
+ *
+ * @param messages - The conversation messages to inspect.
+ * @returns True if at least one content block has `type` equal to 'tool_use' or
+ *   'tool_result'; false otherwise, including for an empty list.
+ */
+export function claudeMessagesContainToolBlocks(messages: MessageParam[]): boolean {
+    for (const msg of messages) {
+        if (!Array.isArray(msg.content)) continue; // string content cannot hold tool blocks
+        for (const block of msg.content) {
+            if (typeof block === 'object' && block !== null && 'type' in block) {
+                if (block.type === 'tool_use' || block.type === 'tool_result') return true;
+            }
+        }
+    }
+    return false;
+}
+/**
+ * Converts tool_use and tool_result blocks to text in Claude messages.
+ * Preserves tool call information while removing structured blocks that
+ * require tools to be defined in the API request.
+ *
+ * Conversion rules:
+ * - A message with non-array content, or with no tool blocks, is returned as the
+ *   same object.
+ * - tool_use becomes a text block `[Tool call: <name>(<input as JSON>)]`; the JSON is
+ *   cut to 500 characters plus '...' when longer, and is empty when `input` is falsy.
+ * - tool_result becomes a text block `[Tool result: <text>]`. String content is cut
+ *   to 500 characters plus '...'. For array content only the text parts are kept,
+ *   each cut the same way and joined with newlines ('No text content' if that yields
+ *   an empty string). Any other content yields 'No content'.
+ * - All other blocks are passed through unchanged.
+ *
+ * The tool_use id, tool_result `tool_use_id`/`is_error`, and non-text parts of a
+ * tool_result are not carried into the generated text.
+ *
+ * NOTE(review): the 500-character limit counts UTF-16 code units (`length` /
+ * `substring`), so a cut could fall inside a surrogate pair — confirm whether
+ * that matters for the downstream API.
+ *
+ * @param messages - The conversation messages to convert; the array and its
+ *   messages are not mutated.
+ * @returns A new array in which messages containing tool blocks are replaced by
+ *   shallow copies with rewritten `content`.
+ */
+export function convertClaudeToolBlocksToText(messages: MessageParam[]): MessageParam[] {
+    return messages.map(msg => {
+        if (!Array.isArray(msg.content)) return msg;
+        let hasToolBlocks = false; // first pass: detect tool blocks so untouched messages keep their identity
+        for (const block of msg.content) {
+            if (typeof block === 'object' && block !== null && 'type' in block &&
+                (block.type === 'tool_use' || block.type === 'tool_result')) {
+                hasToolBlocks = true;
+                break;
+            }
+        }
+        if (!hasToolBlocks) return msg;
+        const newContent: MessageParam['content'] = []; // second pass: rebuild the content with tool blocks rendered as text
+        for (const block of msg.content) {
+            if (typeof block === 'string') { // defensive: keep any raw string entries as they are
+                newContent.push(block);
+                continue;
+            }
+            if (block.type === 'tool_use') {
+                const inputStr = block.input ? JSON.stringify(block.input) : '';
+                const truncated = inputStr.length > 500 ? inputStr.substring(0, 500) + '...' : inputStr;
+                (newContent as Array<{ type: 'text'; text: string }>).push({
+                    type: 'text',
+                    text: `[Tool call: ${block.name}(${truncated})]`,
+                });
+            } else if (block.type === 'tool_result') {
+                let resultStr = 'No content'; // used when content is neither a string nor an array
+                if (typeof block.content === 'string') {
+                    resultStr = block.content.length > 500 ? block.content.substring(0, 500) + '...' : block.content;
+                } else if (Array.isArray(block.content)) {
+                    const texts = block.content
+                        .filter((c): c is { type: 'text'; text: string } => c.type === 'text')
+                        .map(c => c.text.length > 500 ? c.text.substring(0, 500) + '...' : c.text);
+                    resultStr = texts.join('\n') || 'No text content';
+                }
+                (newContent as Array<{ type: 'text'; text: string }>).push({
+                    type: 'text',
+                    text: `[Tool result: ${resultStr}]`,
+                });
+            } else {
+                newContent.push(block as any); // any other block type passes through unchanged
+            }
+        }
+        return { ...msg, content: newContent };
+    });
+}