npm - @juspay/neurolink - Versions diffs - 9.15.0 → 9.16.0 - Mend

@juspay/neurolink 9.15.0 → 9.16.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (193) hide show

package/CHANGELOG.md +6 -0
package/dist/adapters/video/videoAnalyzer.d.ts +1 -1
package/dist/adapters/video/videoAnalyzer.js +10 -8
package/dist/cli/commands/setup-anthropic.js +1 -14
package/dist/cli/commands/setup-azure.js +1 -12
package/dist/cli/commands/setup-bedrock.js +1 -9
package/dist/cli/commands/setup-google-ai.js +1 -12
package/dist/cli/commands/setup-openai.js +1 -14
package/dist/cli/commands/workflow.d.ts +27 -0
package/dist/cli/commands/workflow.js +216 -0
package/dist/cli/factories/commandFactory.js +79 -20
package/dist/cli/index.js +0 -1
package/dist/cli/parser.js +4 -1
package/dist/cli/utils/maskCredential.d.ts +11 -0
package/dist/cli/utils/maskCredential.js +23 -0
package/dist/constants/contextWindows.js +107 -16
package/dist/constants/enums.d.ts +99 -15
package/dist/constants/enums.js +152 -22
package/dist/context/budgetChecker.js +1 -1
package/dist/context/contextCompactor.js +31 -4
package/dist/context/emergencyTruncation.d.ts +21 -0
package/dist/context/emergencyTruncation.js +88 -0
package/dist/context/errorDetection.d.ts +16 -0
package/dist/context/errorDetection.js +48 -1
package/dist/context/errors.d.ts +19 -0
package/dist/context/errors.js +21 -0
package/dist/context/stages/slidingWindowTruncator.d.ts +6 -0
package/dist/context/stages/slidingWindowTruncator.js +159 -24
package/dist/core/baseProvider.js +306 -200
package/dist/core/conversationMemoryManager.js +104 -61
package/dist/core/evaluationProviders.js +16 -33
package/dist/core/factory.js +237 -164
package/dist/core/modules/GenerationHandler.js +175 -116
package/dist/core/modules/MessageBuilder.js +222 -170
package/dist/core/modules/StreamHandler.d.ts +1 -0
package/dist/core/modules/StreamHandler.js +95 -27
package/dist/core/modules/TelemetryHandler.d.ts +10 -1
package/dist/core/modules/TelemetryHandler.js +25 -7
package/dist/core/modules/ToolsManager.js +115 -191
package/dist/core/redisConversationMemoryManager.js +418 -282
package/dist/factories/providerRegistry.d.ts +5 -0
package/dist/factories/providerRegistry.js +20 -2
package/dist/index.d.ts +2 -2
package/dist/index.js +4 -2
package/dist/lib/adapters/video/videoAnalyzer.d.ts +1 -1
package/dist/lib/adapters/video/videoAnalyzer.js +10 -8
package/dist/lib/constants/contextWindows.js +107 -16
package/dist/lib/constants/enums.d.ts +99 -15
package/dist/lib/constants/enums.js +152 -22
package/dist/lib/context/budgetChecker.js +1 -1
package/dist/lib/context/contextCompactor.js +31 -4
package/dist/lib/context/emergencyTruncation.d.ts +21 -0
package/dist/lib/context/emergencyTruncation.js +89 -0
package/dist/lib/context/errorDetection.d.ts +16 -0
package/dist/lib/context/errorDetection.js +48 -1
package/dist/lib/context/errors.d.ts +19 -0
package/dist/lib/context/errors.js +22 -0
package/dist/lib/context/stages/slidingWindowTruncator.d.ts +6 -0
package/dist/lib/context/stages/slidingWindowTruncator.js +159 -24
package/dist/lib/core/baseProvider.js +306 -200
package/dist/lib/core/conversationMemoryManager.js +104 -61
package/dist/lib/core/evaluationProviders.js +16 -33
package/dist/lib/core/factory.js +237 -164
package/dist/lib/core/modules/GenerationHandler.js +175 -116
package/dist/lib/core/modules/MessageBuilder.js +222 -170
package/dist/lib/core/modules/StreamHandler.d.ts +1 -0
package/dist/lib/core/modules/StreamHandler.js +95 -27
package/dist/lib/core/modules/TelemetryHandler.d.ts +10 -1
package/dist/lib/core/modules/TelemetryHandler.js +25 -7
package/dist/lib/core/modules/ToolsManager.js +115 -191
package/dist/lib/core/redisConversationMemoryManager.js +418 -282
package/dist/lib/factories/providerRegistry.d.ts +5 -0
package/dist/lib/factories/providerRegistry.js +20 -2
package/dist/lib/index.d.ts +2 -2
package/dist/lib/index.js +4 -2
package/dist/lib/mcp/externalServerManager.js +66 -0
package/dist/lib/mcp/mcpCircuitBreaker.js +24 -0
package/dist/lib/mcp/mcpClientFactory.js +16 -0
package/dist/lib/mcp/toolDiscoveryService.js +32 -6
package/dist/lib/mcp/toolRegistry.js +193 -123
package/dist/lib/neurolink.d.ts +6 -0
package/dist/lib/neurolink.js +1162 -646
package/dist/lib/providers/amazonBedrock.d.ts +1 -1
package/dist/lib/providers/amazonBedrock.js +521 -319
package/dist/lib/providers/anthropic.js +73 -17
package/dist/lib/providers/anthropicBaseProvider.js +77 -17
package/dist/lib/providers/googleAiStudio.d.ts +1 -1
package/dist/lib/providers/googleAiStudio.js +292 -227
package/dist/lib/providers/googleVertex.d.ts +36 -1
package/dist/lib/providers/googleVertex.js +553 -260
package/dist/lib/providers/ollama.js +329 -278
package/dist/lib/providers/openAI.js +77 -19
package/dist/lib/providers/sagemaker/parsers.js +3 -3
package/dist/lib/providers/sagemaker/streaming.js +3 -3
package/dist/lib/proxy/proxyFetch.js +81 -48
package/dist/lib/rag/ChunkerFactory.js +1 -1
package/dist/lib/rag/chunkers/MarkdownChunker.d.ts +22 -0
package/dist/lib/rag/chunkers/MarkdownChunker.js +213 -9
package/dist/lib/rag/chunking/markdownChunker.d.ts +16 -0
package/dist/lib/rag/chunking/markdownChunker.js +174 -2
package/dist/lib/rag/pipeline/contextAssembly.js +2 -1
package/dist/lib/rag/ragIntegration.d.ts +18 -1
package/dist/lib/rag/ragIntegration.js +94 -14
package/dist/lib/rag/retrieval/vectorQueryTool.js +21 -4
package/dist/lib/server/abstract/baseServerAdapter.js +4 -1
package/dist/lib/server/adapters/fastifyAdapter.js +35 -30
package/dist/lib/services/server/ai/observability/instrumentation.d.ts +32 -0
package/dist/lib/services/server/ai/observability/instrumentation.js +39 -0
package/dist/lib/telemetry/attributes.d.ts +52 -0
package/dist/lib/telemetry/attributes.js +61 -0
package/dist/lib/telemetry/index.d.ts +3 -0
package/dist/lib/telemetry/index.js +3 -0
package/dist/lib/telemetry/telemetryService.d.ts +6 -0
package/dist/lib/telemetry/telemetryService.js +6 -0
package/dist/lib/telemetry/tracers.d.ts +15 -0
package/dist/lib/telemetry/tracers.js +17 -0
package/dist/lib/telemetry/withSpan.d.ts +9 -0
package/dist/lib/telemetry/withSpan.js +35 -0
package/dist/lib/types/contextTypes.d.ts +10 -0
package/dist/lib/types/streamTypes.d.ts +14 -0
package/dist/lib/utils/conversationMemory.js +121 -82
package/dist/lib/utils/logger.d.ts +5 -0
package/dist/lib/utils/logger.js +50 -2
package/dist/lib/utils/messageBuilder.js +22 -42
package/dist/lib/utils/modelDetection.js +3 -3
package/dist/lib/utils/providerRetry.d.ts +41 -0
package/dist/lib/utils/providerRetry.js +114 -0
package/dist/lib/utils/retryability.d.ts +14 -0
package/dist/lib/utils/retryability.js +23 -0
package/dist/lib/utils/sanitizers/svg.js +4 -5
package/dist/lib/utils/tokenEstimation.d.ts +11 -1
package/dist/lib/utils/tokenEstimation.js +19 -4
package/dist/lib/utils/videoAnalysisProcessor.js +7 -3
package/dist/mcp/externalServerManager.js +66 -0
package/dist/mcp/mcpCircuitBreaker.js +24 -0
package/dist/mcp/mcpClientFactory.js +16 -0
package/dist/mcp/toolDiscoveryService.js +32 -6
package/dist/mcp/toolRegistry.js +193 -123
package/dist/neurolink.d.ts +6 -0
package/dist/neurolink.js +1162 -646
package/dist/providers/amazonBedrock.d.ts +1 -1
package/dist/providers/amazonBedrock.js +521 -319
package/dist/providers/anthropic.js +73 -17
package/dist/providers/anthropicBaseProvider.js +77 -17
package/dist/providers/googleAiStudio.d.ts +1 -1
package/dist/providers/googleAiStudio.js +292 -227
package/dist/providers/googleVertex.d.ts +36 -1
package/dist/providers/googleVertex.js +553 -260
package/dist/providers/ollama.js +329 -278
package/dist/providers/openAI.js +77 -19
package/dist/providers/sagemaker/parsers.js +3 -3
package/dist/providers/sagemaker/streaming.js +3 -3
package/dist/proxy/proxyFetch.js +81 -48
package/dist/rag/ChunkerFactory.js +1 -1
package/dist/rag/chunkers/MarkdownChunker.d.ts +22 -0
package/dist/rag/chunkers/MarkdownChunker.js +213 -9
package/dist/rag/chunking/markdownChunker.d.ts +16 -0
package/dist/rag/chunking/markdownChunker.js +174 -2
package/dist/rag/pipeline/contextAssembly.js +2 -1
package/dist/rag/ragIntegration.d.ts +18 -1
package/dist/rag/ragIntegration.js +94 -14
package/dist/rag/retrieval/vectorQueryTool.js +21 -4
package/dist/server/abstract/baseServerAdapter.js +4 -1
package/dist/server/adapters/fastifyAdapter.js +35 -30
package/dist/services/server/ai/observability/instrumentation.d.ts +32 -0
package/dist/services/server/ai/observability/instrumentation.js +39 -0
package/dist/telemetry/attributes.d.ts +52 -0
package/dist/telemetry/attributes.js +60 -0
package/dist/telemetry/index.d.ts +3 -0
package/dist/telemetry/index.js +3 -0
package/dist/telemetry/telemetryService.d.ts +6 -0
package/dist/telemetry/telemetryService.js +6 -0
package/dist/telemetry/tracers.d.ts +15 -0
package/dist/telemetry/tracers.js +16 -0
package/dist/telemetry/withSpan.d.ts +9 -0
package/dist/telemetry/withSpan.js +34 -0
package/dist/types/contextTypes.d.ts +10 -0
package/dist/types/streamTypes.d.ts +14 -0
package/dist/utils/conversationMemory.js +121 -82
package/dist/utils/logger.d.ts +5 -0
package/dist/utils/logger.js +50 -2
package/dist/utils/messageBuilder.js +22 -42
package/dist/utils/modelDetection.js +3 -3
package/dist/utils/providerRetry.d.ts +41 -0
package/dist/utils/providerRetry.js +113 -0
package/dist/utils/retryability.d.ts +14 -0
package/dist/utils/retryability.js +22 -0
package/dist/utils/sanitizers/svg.js +4 -5
package/dist/utils/tokenEstimation.d.ts +11 -1
package/dist/utils/tokenEstimation.js +19 -4
package/dist/utils/videoAnalysisProcessor.js +7 -3
package/dist/workflow/config.d.ts +26 -26
package/package.json +1 -1

package/dist/providers/googleVertex.js CHANGED Viewed

@@ -1,7 +1,8 @@
 import { createVertex, } from "@ai-sdk/google-vertex";
 import { createVertexAnthropic, } from "@ai-sdk/google-vertex/anthropic";
 import { Output, streamText, } from "ai";
-import dns from "dns";
+import { trace, SpanKind, SpanStatusCode } from "@opentelemetry/api";
+import dns from "node:dns";
 import fs from "fs";
 import os from "os";
 import path from "path";
@@ -14,7 +15,10 @@ import { AuthenticationError, NetworkError, ProviderError, RateLimitError, Inval
 import { ERROR_CODES, NeuroLinkError } from "../utils/errorHandling.js";
 import { FileDetector } from "../utils/fileDetector.js";
 import { logger } from "../utils/logger.js";
+import { estimateTokens } from "../utils/tokenEstimation.js";
 import { isGemini3Model } from "../utils/modelDetection.js";
+import { calculateCost } from "../utils/pricing.js";
+import { tracers, ATTR, withClientSpan } from "../telemetry/index.js";
 import { createGoogleAuthConfig, createVertexProjectConfig, validateApiKey, } from "../utils/providerConfig.js";
 import { convertZodToJsonSchema, inlineJsonSchema, } from "../utils/schemaConversion.js";
 import { composeAbortSignals, createTimeoutController, TimeoutError, } from "../utils/timeout.js";
@@ -30,6 +34,30 @@ import { buildNativeToolDeclarations, buildNativeConfig, computeMaxSteps as comp
 // custom fetch, so it is inherently isolated from user cancellation signals.
 // The image generation path (getImageGenerationAccessToken) has an additional
 // explicit 15s timeout per attempt for direct REST API calls.
+/**
+ * Check whether an IP address literal is loopback, unspecified, private, or link-local.
+ * IPv4-mapped IPv6 in dotted form (::ffff:a.b.c.d) is classified by its embedded IPv4 address.
+ * @param {string} address - IP address literal (not a hostname).
+ * @returns {boolean} true for 0.0.0.0, 127/8, 10/8, 172.16/12, 192.168/16, 169.254/16,
+ *   ::, ::1, fe80::/10 and fc00::/7; false otherwise.
+ */
+function isPrivateOrLoopbackAddress(address) {
+    const lower = address.toLowerCase();
+    // Unwrap "::ffff:a.b.c.d" so a mapped private IPv4 cannot slip past the IPv4 checks.
+    const ipv4 = lower.startsWith("::ffff:") && lower.includes(".") ? lower.slice(7) : lower;
+    // IPv4 unspecified, loopback, private (RFC 1918) and link-local (169.254/16) ranges
+    if (ipv4 === "0.0.0.0" ||
+        /^(127|10)\./.test(ipv4) ||
+        /^(192\.168|169\.254)\./.test(ipv4) ||
+        /^172\.(1[6-9]|2\d|3[01])\./.test(ipv4)) {
+        return true;
+    }
+    // IPv6 unspecified/loopback, link-local fe80::/10 (fe80-febf), unique-local fc00::/7 (fc00-fdff)
+    return lower === "::" || lower === "::1" ||
+        /^fe[89ab][0-9a-f]:/.test(lower) || /^f[cd][0-9a-f]{2}:/.test(lower);
+}
+const MAX_IMAGE_DOWNLOAD_BYTES = 10 * 1024 * 1024; // 10 MB
+const streamTracer = trace.getTracer("neurolink.provider.vertex");
 // Enhanced Anthropic support with direct imports
 // Using the dual provider architecture from Vercel AI SDK
 const hasAnthropicSupport = () => {
@@ -63,6 +91,8 @@ const hasGoogleCredentials = () => {
         (process.env.GOOGLE_AUTH_CLIENT_EMAIL &&
             process.env.GOOGLE_AUTH_PRIVATE_KEY));
 };
+// Module-level cache for runtime-created credentials file to avoid per-request writes
+let cachedCredentialsPath = null;
 // Enhanced Vertex settings creation with authentication fallback and proxy support
 const createVertexSettings = async (region) => {
     const location = region || getVertexLocation();
@@ -99,9 +129,14 @@ const createVertexSettings = async (region) => {
         client_x509_cert_url: process.env.GOOGLE_AUTH_CLIENT_CERT_URL,
         universe_domain: process.env.GOOGLE_AUTH_UNIVERSE_DOMAIN,
     };
-    // If we have the essential fields, create a runtime credentials file
+    // If we have the essential fields, create a runtime credentials file (cached)
     if (requiredEnvVarsForFile.client_email &&
         requiredEnvVarsForFile.private_key) {
+        // Return cached path if already written and still exists on disk
+        if (cachedCredentialsPath && fs.existsSync(cachedCredentialsPath)) {
+            process.env.GOOGLE_APPLICATION_CREDENTIALS = cachedCredentialsPath;
+            return baseSettings;
+        }
         try {
             // Build complete service account credentials object
             const serviceAccountCredentials = {
@@ -119,18 +154,26 @@ const createVertexSettings = async (region) => {
                 client_x509_cert_url: requiredEnvVarsForFile.client_x509_cert_url || "",
                 universe_domain: requiredEnvVarsForFile.universe_domain || "googleapis.com",
             };
-            // Create temporary credentials file
+            // Create temporary credentials file with restricted permissions
             const tmpDir = os.tmpdir();
             const credentialsFileName = `google-credentials-${Date.now()}-${Math.random().toString(36).substring(2, 11)}.json`;
             const credentialsFilePath = path.join(tmpDir, credentialsFileName);
-            fs.writeFileSync(credentialsFilePath, JSON.stringify(serviceAccountCredentials, null, 2));
+            fs.writeFileSync(credentialsFilePath, JSON.stringify(serviceAccountCredentials, null, 2), { mode: 0o600 });
+            cachedCredentialsPath = credentialsFilePath;
+            // Register cleanup on process exit to remove the credentials file
+            process.once("exit", () => {
+                try {
+                    if (cachedCredentialsPath && fs.existsSync(cachedCredentialsPath)) {
+                        fs.unlinkSync(cachedCredentialsPath);
+                    }
+                }
+                catch {
+                    /* ignore cleanup errors */
+                }
+            });
             // Set the environment variable to point to our runtime-created file
             process.env.GOOGLE_APPLICATION_CREDENTIALS = credentialsFilePath;
-            // Now continue with the normal flow - check if the file exists
-            const fileExists = fs.existsSync(credentialsFilePath);
-            if (fileExists) {
-                return baseSettings;
-            }
+            return baseSettings;
         }
         catch {
             // Silent error handling for runtime credentials file creation
@@ -246,7 +289,13 @@ const createVertexSettings = async (region) => {
 };
 // Create Anthropic-specific Vertex settings with the same authentication and proxy support
 const createVertexAnthropicSettings = async (region) => {
-    const baseVertexSettings = await createVertexSettings(region);
+    // The @ai-sdk/google-vertex SDK constructs Anthropic URLs as:
+    //   https://{location}-aiplatform.googleapis.com/...
+    // When location is "global", this creates "https://global-aiplatform.googleapis.com"
+    // which is invalid. The correct global endpoint omits the region prefix entirely.
+    // Since the SDK doesn't handle this, redirect "global" to "us-east5" for Anthropic.
+    const anthropicRegion = !region || region === "global" ? "us-east5" : region;
+    const baseVertexSettings = await createVertexSettings(anthropicRegion);
     // GoogleVertexAnthropicProviderSettings extends GoogleVertexProviderSettings
     // so we can use the same settings with proper typing
     return {
@@ -262,6 +311,39 @@ const createVertexAnthropicSettings = async (region) => {
 const isAnthropicModel = (modelName) => {
     return modelName.toLowerCase().includes("claude");
 };
+/**
+ * Vertex Model Aliases
+ *
+ * Maps shorthand model names to the full versioned IDs required by the
+ * Vertex AI API. This allows users to pass convenient names like
+ * "claude-sonnet-4-5" instead of "claude-sonnet-4-5@20250929".
+ *
+ * Alias resolution runs at the very start of getModel() so that all
+ * downstream code (isAnthropicModel, validateAnthropicModelName, etc.)
+ * sees the canonical versioned name.
+ *
+ * To add a new model: simply add an entry mapping the shorthand to the
+ * full versioned string. No other changes are needed.
+ */
+export const VERTEX_MODEL_ALIASES = {
+    // Claude 4.x shorthand aliases → versioned names
+    "claude-sonnet-4-5": "claude-sonnet-4-5@20250929",
+    // Suffix is the published snapshot ID, not the 2025-11-24 launch date.
+    "claude-opus-4-5": "claude-opus-4-5@20251101",
+    "claude-haiku-4-5": "claude-haiku-4-5@20251001",
+    "claude-sonnet-4": "claude-sonnet-4@20250514",
+    "claude-opus-4": "claude-opus-4@20250514",
+    "claude-opus-4-1": "claude-opus-4-1@20250805",
+    // Claude 3.x shorthand aliases → versioned names
+    "claude-3-7-sonnet": "claude-3-7-sonnet@20250219",
+    // NOTE(review): the targets below use a "-YYYYMMDD" suffix while every other Claude
+    // target uses "@YYYYMMDD"; confirm downstream code accepts or normalizes this form.
+    "claude-3-5-sonnet": "claude-3-5-sonnet-20241022",
+    "claude-3-5-haiku": "claude-3-5-haiku-20241022",
+    "claude-3-opus": "claude-3-opus-20240229",
+    "claude-3-sonnet": "claude-3-sonnet-20240229",
+    "claude-3-haiku": "claude-3-haiku-20240307",
+    // Gemini shorthand aliases
+    "gemini-3-pro": "gemini-3-pro-latest",
+    "gemini-3-flash": "gemini-3-flash-latest",
+};
 /**
  * Google Vertex AI Provider v2 - BaseProvider Implementation
  *
@@ -366,6 +448,13 @@ export class GoogleVertexProvider extends BaseProvider {
         const model = await this.getModel();
         return model;
     }
+    /**
+     * Resolve a raw model name through the alias map.
+     * Only own entries of VERTEX_MODEL_ALIASES count, so names such as "constructor"
+     * or "toString" are returned unchanged rather than resolving to inherited members.
+     * @param {string} modelName - Raw model name as supplied by the caller.
+     * @returns {string} The aliased versioned name, or modelName when no alias exists.
+     */
+    resolveAlias(modelName) {
+        return Object.prototype.hasOwnProperty.call(VERTEX_MODEL_ALIASES, modelName)
+            ? VERTEX_MODEL_ALIASES[modelName]
+            : modelName;
+    }
     /**
      * Initialize model creation tracking
      */
@@ -373,7 +462,10 @@ export class GoogleVertexProvider extends BaseProvider {
         const modelCreationId = `vertex-model-${Date.now()}-${Math.random().toString(36).substring(2, 11)}`;
         const modelCreationStartTime = Date.now();
         const modelCreationHrTimeStart = process.hrtime.bigint();
-        const modelName = this.modelName || getDefaultVertexModel();
+        // Resolve shorthand model aliases (e.g. "claude-sonnet-4-5" → "claude-sonnet-4-5@20250929")
+        // before any downstream logic that depends on the versioned name.
+        const rawModelName = this.modelName || getDefaultVertexModel();
+        const modelName = VERTEX_MODEL_ALIASES[rawModelName] ?? rawModelName;
         return {
             modelCreationId,
             modelCreationStartTime,
@@ -665,7 +757,7 @@ export class GoogleVertexProvider extends BaseProvider {
      * Creates fresh instances for each request to ensure proper authentication
      */
     async getModel() {
-        // Initialize logging and setup
+        // Initialize logging and setup (alias resolution happens inside)
         const { modelCreationId, modelCreationStartTime, modelCreationHrTimeStart, modelName, } = this.initializeModelCreationLogging();
         // Check if this is an Anthropic model and attempt creation
         const anthropicModel = await this.attemptAnthropicModelCreation(modelName, modelCreationId, modelCreationStartTime, modelCreationHrTimeStart);
@@ -684,7 +776,7 @@ export class GoogleVertexProvider extends BaseProvider {
     }
     async executeStream(options, analysisSchema) {
         // Check if this is a Gemini 3 model with tools - use native SDK for thought_signature
-        const gemini3CheckModelName = options.model || this.modelName || getDefaultVertexModel();
+        const gemini3CheckModelName = this.resolveAlias(options.model || this.modelName || getDefaultVertexModel());
         // Check for tools from options AND from SDK (MCP tools)
         // Need to check early if we should route to native SDK
         const gemini3CheckShouldUseTools = !options.disableTools && this.supportsTools();
@@ -735,7 +827,7 @@ export class GoogleVertexProvider extends BaseProvider {
                 toolNames: Object.keys(tools),
             });
             // Model-specific maxTokens handling
-            const modelName = this.modelName || getDefaultVertexModel();
+            const modelName = this.resolveAlias(options.model || this.modelName || getDefaultVertexModel());
             // Use cached model configuration to determine maxTokens handling for streaming performance
             // This avoids hardcoded model-specific logic and repeated config lookups
             const shouldSetMaxTokens = this.shouldSetMaxTokensCached(modelName);
@@ -748,6 +840,7 @@ export class GoogleVertexProvider extends BaseProvider {
                 messages: messages,
                 temperature: options.temperature,
                 ...(maxTokens && { maxTokens }),
+                maxRetries: 0, // NL11: Disable AI SDK's invisible internal retries; we handle retries with OTel instrumentation
                 ...(shouldUseTools &&
                     Object.keys(tools).length > 0 && {
                     tools,
@@ -819,7 +912,67 @@ export class GoogleVertexProvider extends BaseProvider {
                     });
                 }
             }
-            const result = streamText(streamOptions);
+            // Wrap streamText in an OTel span to capture provider-level latency and token usage
+            const streamSpan = streamTracer.startSpan("neurolink.provider.streamText", {
+                kind: SpanKind.CLIENT,
+                attributes: {
+                    "gen_ai.system": "vertex",
+                    "gen_ai.request.model": model.modelId || this.modelName || "unknown",
+                },
+            });
+            let result;
+            try {
+                result = streamText(streamOptions);
+            }
+            catch (err) {
+                streamSpan.recordException(err instanceof Error ? err : new Error(String(err)));
+                streamSpan.setStatus({
+                    code: SpanStatusCode.ERROR,
+                    message: err instanceof Error ? err.message : String(err),
+                });
+                streamSpan.end();
+                throw err;
+            }
+            // Collect token usage and finish reason asynchronously when the stream completes,
+            // then end the span. This avoids blocking the stream consumer.
+            result.usage
+                .then((usage) => {
+                streamSpan.setAttribute("gen_ai.usage.input_tokens", usage.promptTokens || 0);
+                streamSpan.setAttribute("gen_ai.usage.output_tokens", usage.completionTokens || 0);
+                const effectiveModel = options.model ||
+                    model.modelId ||
+                    this.modelName ||
+                    getDefaultVertexModel();
+                const cost = calculateCost(this.providerName, effectiveModel, {
+                    input: usage.promptTokens || 0,
+                    output: usage.completionTokens || 0,
+                    total: (usage.promptTokens || 0) + (usage.completionTokens || 0),
+                });
+                if (cost && cost > 0) {
+                    streamSpan.setAttribute("neurolink.cost", cost);
+                }
+            })
+                .catch(() => {
+                // Usage may not be available if the stream is aborted
+            });
+            result.finishReason
+                .then((reason) => {
+                streamSpan.setAttribute("gen_ai.response.finish_reason", reason || "unknown");
+            })
+                .catch(() => {
+                // Finish reason may not be available if the stream is aborted
+            });
+            result.text
+                .then(() => {
+                streamSpan.end();
+            })
+                .catch((err) => {
+                streamSpan.setStatus({
+                    code: SpanStatusCode.ERROR,
+                    message: err instanceof Error ? err.message : String(err),
+                });
+                streamSpan.end();
+            });
             // Defer timeout cleanup until the stream completes or errors
             result.text.finally(() => timeoutController?.cleanup());
             // Transform string stream to content object stream using BaseProvider method
@@ -965,262 +1118,306 @@ export class GoogleVertexProvider extends BaseProvider {
      * This bypasses @ai-sdk/google-vertex to properly handle thought_signature
      */
     async executeNativeGemini3Stream(options) {
-        const client = await this.createVertexGenAIClient(options.region);
-        const modelName = options.model || this.modelName || getDefaultVertexModel();
-        const effectiveLocation = options.region || this.location || getVertexLocation();
-        logger.debug("[GoogleVertex] Using native @google/genai for Gemini 3", {
-            model: modelName,
-            hasTools: !!options.tools && Object.keys(options.tools).length > 0,
-            project: this.projectId,
-            location: effectiveLocation,
-        });
-        // Build contents from input with multimodal support
-        const multimodalInput = options.input;
-        const contents = this.buildNativeContentParts(options.input.text, multimodalInput, "native stream");
-        // Convert tools to native format
-        let hasToolsInput = options.tools &&
-            Object.keys(options.tools).length > 0 &&
-            !options.disableTools;
-        // Guard: Gemini cannot use tools + JSON schema simultaneously
-        const streamOptions = options;
-        const wantsJsonOutput = streamOptions.output?.format === "json" || streamOptions.schema;
-        if (wantsJsonOutput && hasToolsInput) {
-            logger.warn("[GoogleVertex] Gemini does not support tools and JSON schema output simultaneously. Disabling tools for this request.");
-            hasToolsInput = false;
-        }
-        let toolsConfig;
-        let executeMap = new Map();
-        if (hasToolsInput) {
-            const result = buildNativeToolDeclarations(options.tools);
-            toolsConfig = result.toolsConfig;
-            executeMap = result.executeMap;
-            logger.debug("[GoogleVertex] Converted tools for native SDK", {
-                toolCount: toolsConfig[0].functionDeclarations.length,
-                toolNames: toolsConfig[0].functionDeclarations.map((t) => t.name),
+        const modelName = this.resolveAlias(options.model || this.modelName || getDefaultVertexModel());
+        return withClientSpan({
+            name: "neurolink.provider.stream",
+            tracer: tracers.provider,
+            attributes: {
+                [ATTR.GEN_AI_SYSTEM]: "vertex",
+                [ATTR.GEN_AI_MODEL]: modelName,
+                [ATTR.GEN_AI_OPERATION]: "stream",
+                [ATTR.NL_PROVIDER]: this.providerName,
+            },
+        }, async (span) => {
+            const client = await this.createVertexGenAIClient(options.region);
+            const effectiveLocation = options.region || this.location || getVertexLocation();
+            logger.debug("[GoogleVertex] Using native @google/genai for Gemini 3", {
+                model: modelName,
+                hasTools: !!options.tools && Object.keys(options.tools).length > 0,
+                project: this.projectId,
+                location: effectiveLocation,
             });
-        }
-        // Build config
-        const config = buildNativeConfig(options, toolsConfig);
-        // Add JSON output format support for native SDK stream
-        if (streamOptions.output?.format === "json" || streamOptions.schema) {
-            config.responseMimeType = "application/json";
-            if (streamOptions.schema) {
-                const rawSchema = convertZodToJsonSchema(streamOptions.schema);
-                const inlinedSchema = inlineJsonSchema(rawSchema);
-                if (inlinedSchema.$schema) {
-                    delete inlinedSchema.$schema;
-                }
-                config.responseSchema = inlinedSchema;
-                logger.debug("[GoogleVertex] Added responseSchema for JSON output (stream)", {
-                    schemaKeys: Object.keys(inlinedSchema),
+            // Build contents from input with multimodal support
+            const multimodalInput = options.input;
+            const contents = this.buildNativeContentParts(options.input.text, multimodalInput, "native stream");
+            // Convert tools to native format
+            let hasToolsInput = options.tools &&
+                Object.keys(options.tools).length > 0 &&
+                !options.disableTools;
+            // Guard: Gemini cannot use tools + JSON schema simultaneously
+            const streamOptions = options;
+            const wantsJsonOutput = streamOptions.output?.format === "json" || streamOptions.schema;
+            if (wantsJsonOutput && hasToolsInput) {
+                logger.warn("[GoogleVertex] Gemini does not support tools and JSON schema output simultaneously. Disabling tools for this request.");
+                hasToolsInput = false;
+            }
+            let toolsConfig;
+            let executeMap = new Map();
+            if (hasToolsInput) {
+                const result = buildNativeToolDeclarations(options.tools);
+                toolsConfig = result.toolsConfig;
+                executeMap = result.executeMap;
+                logger.debug("[GoogleVertex] Converted tools for native SDK", {
+                    toolCount: toolsConfig[0].functionDeclarations.length,
+                    toolNames: toolsConfig[0].functionDeclarations.map((t) => t.name),
                 });
             }
-        }
-        const startTime = Date.now();
-        const timeout = this.getTimeout(options);
-        const timeoutController = createTimeoutController(timeout, this.providerName, "stream");
-        const composedSignal = composeAbortSignals(options.abortSignal, timeoutController?.controller.signal);
-        const maxSteps = computeMaxStepsShared(options.maxSteps);
-        const currentContents = [...contents];
-        let finalText = "";
-        let lastStepText = "";
-        let totalInputTokens = 0;
-        let totalOutputTokens = 0;
-        const allToolCalls = [];
-        let step = 0;
-        const failedTools = new Map();
-        // Agentic loop for tool calling
-        try {
-            while (step < maxSteps) {
-                if (timeoutController?.controller.signal.aborted) {
-                    break;
-                }
-                step++;
-                logger.debug(`[GoogleVertex] Native SDK step ${step}/${maxSteps}`);
-                try {
-                    const stream = await client.models.generateContentStream({
-                        model: modelName,
-                        contents: currentContents,
-                        config,
-                        ...(composedSignal
-                            ? { httpOptions: { signal: composedSignal } }
-                            : {}),
-                    });
-                    const chunkResult = await collectStreamChunks(stream);
-                    totalInputTokens += chunkResult.inputTokens;
-                    totalOutputTokens += chunkResult.outputTokens;
-                    const stepText = extractTextFromParts(chunkResult.rawResponseParts);
-                    if (chunkResult.stepFunctionCalls.length === 0) {
-                        finalText = stepText;
-                        break;
+            // Build config
+            const config = buildNativeConfig(options, toolsConfig);
+            // Add JSON output format support for native SDK stream
+            if (streamOptions.output?.format === "json" || streamOptions.schema) {
+                config.responseMimeType = "application/json";
+                if (streamOptions.schema) {
+                    const rawSchema = convertZodToJsonSchema(streamOptions.schema);
+                    const inlinedSchema = inlineJsonSchema(rawSchema);
+                    if (inlinedSchema.$schema) {
+                        delete inlinedSchema.$schema;
                     }
-                    lastStepText = stepText;
-                    logger.debug(`[GoogleVertex] Executing ${chunkResult.stepFunctionCalls.length} function calls`);
-                    pushModelResponseToHistory(currentContents, chunkResult.rawResponseParts, chunkResult.stepFunctionCalls);
-                    const functionResponses = await executeNativeToolCalls("[GoogleVertex]", chunkResult.stepFunctionCalls, executeMap, failedTools, allToolCalls, { abortSignal: composedSignal });
-                    // Add function responses to history
-                    currentContents.push({
-                        role: "function",
-                        parts: functionResponses,
+                    config.responseSchema = inlinedSchema;
+                    logger.debug("[GoogleVertex] Added responseSchema for JSON output (stream)", {
+                        schemaKeys: Object.keys(inlinedSchema),
                     });
                 }
-                catch (error) {
-                    logger.error("[GoogleVertex] Native SDK error", error);
-                    throw this.handleProviderError(error);
+            }
+            const startTime = Date.now();
+            const timeout = this.getTimeout(options);
+            const timeoutController = createTimeoutController(timeout, this.providerName, "stream");
+            const composedSignal = composeAbortSignals(options.abortSignal, timeoutController?.controller.signal);
+            const maxSteps = computeMaxStepsShared(options.maxSteps);
+            const currentContents = [...contents];
+            let finalText = "";
+            let lastStepText = "";
+            let totalInputTokens = 0;
+            let totalOutputTokens = 0;
+            const allToolCalls = [];
+            let step = 0;
+            const failedTools = new Map();
+            // Agentic loop for tool calling
+            try {
+                while (step < maxSteps) {
+                    if (timeoutController?.controller.signal.aborted) {
+                        break;
+                    }
+                    step++;
+                    logger.debug(`[GoogleVertex] Native SDK step ${step}/${maxSteps}`);
+                    try {
+                        const stream = await client.models.generateContentStream({
+                            model: modelName,
+                            contents: currentContents,
+                            config,
+                            ...(composedSignal
+                                ? { httpOptions: { signal: composedSignal } }
+                                : {}),
+                        });
+                        const chunkResult = await collectStreamChunks(stream);
+                        totalInputTokens += chunkResult.inputTokens;
+                        totalOutputTokens += chunkResult.outputTokens;
+                        const stepText = extractTextFromParts(chunkResult.rawResponseParts);
+                        if (chunkResult.stepFunctionCalls.length === 0) {
+                            finalText = stepText;
+                            break;
+                        }
+                        lastStepText = stepText;
+                        // Record tool call events on the span
+                        for (const fc of chunkResult.stepFunctionCalls) {
+                            span.addEvent("gen_ai.tool_call", {
+                                "tool.name": fc.name,
+                                "tool.step": step,
+                            });
+                        }
+                        logger.debug(`[GoogleVertex] Executing ${chunkResult.stepFunctionCalls.length} function calls`);
+                        pushModelResponseToHistory(currentContents, chunkResult.rawResponseParts, chunkResult.stepFunctionCalls);
+                        const functionResponses = await executeNativeToolCalls("[GoogleVertex]", chunkResult.stepFunctionCalls, executeMap, failedTools, allToolCalls, { abortSignal: composedSignal });
+                        // Add function responses to history
+                        currentContents.push({
+                            role: "function",
+                            parts: functionResponses,
+                        });
+                    }
+                    catch (error) {
+                        logger.error("[GoogleVertex] Native SDK error", error);
+                        throw this.handleProviderError(error);
+                    }
                 }
             }
-        }
-        finally {
-            timeoutController?.cleanup();
-        }
-        finalText = handleMaxStepsTermination("[GoogleVertex]", step, maxSteps, finalText, lastStepText);
-        const responseTime = Date.now() - startTime;
-        // Create async iterable for streaming result
-        async function* createTextStream() {
-            yield { content: finalText };
-        }
-        return {
-            stream: createTextStream(),
-            provider: this.providerName,
-            model: modelName,
-            usage: {
-                input: totalInputTokens,
-                output: totalOutputTokens,
-                total: totalInputTokens + totalOutputTokens,
-            },
-            toolCalls: allToolCalls.map((tc) => ({
-                toolName: tc.toolName,
-                args: tc.args,
-            })),
-            metadata: {
-                streamId: `native-vertex-${Date.now()}`,
-                startTime,
-                responseTime,
-                totalToolExecutions: allToolCalls.length,
-            },
-        };
+            finally {
+                timeoutController?.cleanup();
+            }
+            finalText = handleMaxStepsTermination("[GoogleVertex]", step, maxSteps, finalText, lastStepText);
+            const responseTime = Date.now() - startTime;
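+            // Set token usage and finish reason on the span. NOTE(review): step >= maxSteps is also true when the last permitted step ended without tool calls, so "max_steps" may be recorded for a normal stop, and a timeout break before that is recorded as "stop" — confirm intended.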
+            span.setAttribute(ATTR.GEN_AI_INPUT_TOKENS, totalInputTokens);
+            span.setAttribute(ATTR.GEN_AI_OUTPUT_TOKENS, totalOutputTokens);
+            span.setAttribute(ATTR.GEN_AI_FINISH_REASON, step >= maxSteps ? "max_steps" : "stop");
+            // Create async iterable for streaming result
+            async function* createTextStream() {
+                yield { content: finalText };
+            }
+            return {
+                stream: createTextStream(),
+                provider: this.providerName,
+                model: modelName,
+                usage: {
+                    input: totalInputTokens,
+                    output: totalOutputTokens,
+                    total: totalInputTokens + totalOutputTokens,
+                },
+                toolCalls: allToolCalls.map((tc) => ({
+                    toolName: tc.toolName,
+                    args: tc.args,
+                })),
+                metadata: {
+                    streamId: `native-vertex-${Date.now()}`,
+                    startTime,
+                    responseTime,
+                    totalToolExecutions: allToolCalls.length,
+                },
+            };
+        });
     }
     /**
      * Execute generate using native @google/genai SDK for Gemini 3 models on Vertex AI
      * This bypasses @ai-sdk/google-vertex to properly handle thought_signature
      */
     async executeNativeGemini3Generate(options) {
-        const client = await this.createVertexGenAIClient(options.region);
-        const modelName = options.model || this.modelName || getDefaultVertexModel();
-        const effectiveLocation = options.region || this.location || getVertexLocation();
-        logger.debug("[GoogleVertex] Using native @google/genai for Gemini 3 generate", {
-            model: modelName,
-            project: this.projectId,
-            location: effectiveLocation,
-        });
-        // Build contents from input with multimodal support
-        const inputText = options.prompt || options.input?.text || "Please respond.";
-        const multimodalInput = options.input;
-        const contents = this.buildNativeContentParts(inputText, multimodalInput, "native generate");
-        // Get tools from SDK and options
-        let shouldUseTools = !options.disableTools && this.supportsTools();
-        // Guard: Gemini cannot use tools + JSON schema simultaneously
-        const wantsJsonOutputGen = options.output?.format === "json" || options.schema;
-        if (wantsJsonOutputGen && shouldUseTools) {
-            logger.warn("[GoogleVertex] Gemini does not support tools and JSON schema output simultaneously. Disabling tools for this request.");
-            shouldUseTools = false;
-        }
-        const sdkTools = shouldUseTools ? await this.getAllTools() : {};
-        const combinedTools = shouldUseTools
-            ? { ...sdkTools, ...(options.tools || {}) }
-            : {};
-        let toolsConfig;
-        let executeMap = new Map();
-        if (Object.keys(combinedTools).length > 0) {
-            const result = buildNativeToolDeclarations(combinedTools);
-            toolsConfig = result.toolsConfig;
-            executeMap = result.executeMap;
-            logger.debug("[GoogleVertex] Converted tools for native SDK generate", {
-                toolCount: toolsConfig[0].functionDeclarations.length,
-                toolNames: toolsConfig[0].functionDeclarations.map((t) => t.name),
+        const modelName = this.resolveAlias(options.model || this.modelName || getDefaultVertexModel());
+        return withClientSpan({
+            name: "neurolink.provider.generate",
+            tracer: tracers.provider,
+            attributes: {
+                [ATTR.GEN_AI_SYSTEM]: "vertex",
+                [ATTR.GEN_AI_MODEL]: modelName,
+                [ATTR.GEN_AI_OPERATION]: "generate",
+                [ATTR.NL_PROVIDER]: this.providerName,
+            },
+        }, async (span) => {
+            const client = await this.createVertexGenAIClient(options.region);
+            const effectiveLocation = options.region || this.location || getVertexLocation();
+            logger.debug("[GoogleVertex] Using native @google/genai for Gemini 3 generate", {
+                model: modelName,
+                project: this.projectId,
+                location: effectiveLocation,
             });
-        }
-        // Build config
-        const config = buildNativeConfig(options, toolsConfig);
-        // Note: Schema/JSON output for Gemini 3 native SDK is complex due to $ref resolution issues
-        // For now, schemas are handled via the AI SDK fallback path, not native SDK
-        // TODO: Implement proper $ref resolution for complex nested schemas
-        const startTime = Date.now();
-        const timeout = this.getTimeout(options);
-        const timeoutController = createTimeoutController(timeout, this.providerName, "generate");
-        const composedSignal = composeAbortSignals(options.abortSignal, timeoutController?.controller.signal);
-        const maxSteps = computeMaxStepsShared(options.maxSteps);
-        const currentContents = [...contents];
-        let finalText = "";
-        let lastStepText = "";
-        let totalInputTokens = 0;
-        let totalOutputTokens = 0;
-        const allToolCalls = [];
-        const toolExecutions = [];
-        let step = 0;
-        const failedTools = new Map();
-        try {
-            // Agentic loop for tool calling
-            while (step < maxSteps) {
-                if (timeoutController?.controller.signal.aborted) {
-                    break;
-                }
-                step++;
-                logger.debug(`[GoogleVertex] Native SDK generate step ${step}/${maxSteps}`);
-                try {
-                    // Use generateContentStream and collect all chunks (same as GoogleAIStudio)
-                    const stream = await client.models.generateContentStream({
-                        model: modelName,
-                        contents: currentContents,
-                        config,
-                        ...(composedSignal
-                            ? { httpOptions: { signal: composedSignal } }
-                            : {}),
-                    });
-                    const chunkResult = await collectStreamChunks(stream);
-                    totalInputTokens += chunkResult.inputTokens;
-                    totalOutputTokens += chunkResult.outputTokens;
-                    const stepText = extractTextFromParts(chunkResult.rawResponseParts);
-                    if (chunkResult.stepFunctionCalls.length === 0) {
-                        finalText = stepText;
+            // Build contents from input with multimodal support
+            const inputText = options.prompt || options.input?.text || "Please respond.";
+            const multimodalInput = options.input;
+            const contents = this.buildNativeContentParts(inputText, multimodalInput, "native generate");
+            // Get tools from SDK and options
+            let shouldUseTools = !options.disableTools && this.supportsTools();
+            // Guard: Gemini cannot use tools + JSON schema simultaneously
+            const wantsJsonOutputGen = options.output?.format === "json" || options.schema;
+            if (wantsJsonOutputGen && shouldUseTools) {
+                logger.warn("[GoogleVertex] Gemini does not support tools and JSON schema output simultaneously. Disabling tools for this request.");
+                shouldUseTools = false;
+            }
+            const sdkTools = shouldUseTools ? await this.getAllTools() : {};
+            const combinedTools = shouldUseTools
+                ? { ...sdkTools, ...(options.tools || {}) }
+                : {};
+            let toolsConfig;
+            let executeMap = new Map();
+            if (Object.keys(combinedTools).length > 0) {
+                const result = buildNativeToolDeclarations(combinedTools);
+                toolsConfig = result.toolsConfig;
+                executeMap = result.executeMap;
+                logger.debug("[GoogleVertex] Converted tools for native SDK generate", {
+                    toolCount: toolsConfig[0].functionDeclarations.length,
+                    toolNames: toolsConfig[0].functionDeclarations.map((t) => t.name),
+                });
+            }
+            // Build config
+            const config = buildNativeConfig(options, toolsConfig);
+            // Note: Schema/JSON output for Gemini 3 native SDK is complex due to $ref resolution issues
+            // For now, schemas are handled via the AI SDK fallback path, not native SDK
+            // TODO: Implement proper $ref resolution for complex nested schemas
+            const startTime = Date.now();
+            const timeout = this.getTimeout(options);
+            const timeoutController = createTimeoutController(timeout, this.providerName, "generate");
+            const composedSignal = composeAbortSignals(options.abortSignal, timeoutController?.controller.signal);
+            const maxSteps = computeMaxStepsShared(options.maxSteps);
+            const currentContents = [...contents];
+            let finalText = "";
+            let lastStepText = "";
+            let totalInputTokens = 0;
+            let totalOutputTokens = 0;
+            const allToolCalls = [];
+            const toolExecutions = [];
+            let step = 0;
+            const failedTools = new Map();
+            try {
+                // Agentic loop for tool calling
+                while (step < maxSteps) {
+                    if (timeoutController?.controller.signal.aborted) {
                         break;
                     }
-                    lastStepText = stepText;
-                    logger.debug(`[GoogleVertex] Generate executing ${chunkResult.stepFunctionCalls.length} function calls`);
-                    pushModelResponseToHistory(currentContents, chunkResult.rawResponseParts, chunkResult.stepFunctionCalls);
-                    const functionResponses = await executeNativeToolCalls("[GoogleVertex]", chunkResult.stepFunctionCalls, executeMap, failedTools, allToolCalls, { toolExecutions, abortSignal: composedSignal });
-                    // Add function responses to history
-                    currentContents.push({
-                        role: "function",
-                        parts: functionResponses,
-                    });
-                }
-                catch (error) {
-                    logger.error("[GoogleVertex] Native SDK generate error", error);
-                    throw this.handleProviderError(error);
+                    step++;
+                    logger.debug(`[GoogleVertex] Native SDK generate step ${step}/${maxSteps}`);
+                    try {
+                        // Use generateContentStream and collect all chunks (same as GoogleAIStudio)
+                        const stream = await client.models.generateContentStream({
+                            model: modelName,
+                            contents: currentContents,
+                            config,
+                            ...(composedSignal
+                                ? { httpOptions: { signal: composedSignal } }
+                                : {}),
+                        });
+                        const chunkResult = await collectStreamChunks(stream);
+                        totalInputTokens += chunkResult.inputTokens;
+                        totalOutputTokens += chunkResult.outputTokens;
+                        const stepText = extractTextFromParts(chunkResult.rawResponseParts);
+                        if (chunkResult.stepFunctionCalls.length === 0) {
+                            finalText = stepText;
+                            break;
+                        }
+                        lastStepText = stepText;
+                        // Record tool call events on the span
+                        for (const fc of chunkResult.stepFunctionCalls) {
+                            span.addEvent("gen_ai.tool_call", {
+                                "tool.name": fc.name,
+                                "tool.step": step,
+                            });
+                        }
+                        logger.debug(`[GoogleVertex] Generate executing ${chunkResult.stepFunctionCalls.length} function calls`);
+                        pushModelResponseToHistory(currentContents, chunkResult.rawResponseParts, chunkResult.stepFunctionCalls);
+                        const functionResponses = await executeNativeToolCalls("[GoogleVertex]", chunkResult.stepFunctionCalls, executeMap, failedTools, allToolCalls, { toolExecutions, abortSignal: composedSignal });
+                        // Add function responses to history
+                        currentContents.push({
+                            role: "function",
+                            parts: functionResponses,
+                        });
+                    }
+                    catch (error) {
+                        logger.error("[GoogleVertex] Native SDK generate error", error);
+                        throw this.handleProviderError(error);
+                    }
                 }
             }
-        }
-        finally {
-            timeoutController?.cleanup();
-        }
-        finalText = handleMaxStepsTermination("[GoogleVertex]", step, maxSteps, finalText, lastStepText);
-        const responseTime = Date.now() - startTime;
-        // Build EnhancedGenerateResult
-        return {
-            content: finalText,
-            provider: this.providerName,
-            model: modelName,
-            usage: {
-                input: totalInputTokens,
-                output: totalOutputTokens,
-                total: totalInputTokens + totalOutputTokens,
-            },
-            responseTime,
-            toolsUsed: allToolCalls.map((tc) => tc.toolName),
-            toolExecutions: toolExecutions,
-            enhancedWithTools: allToolCalls.length > 0,
-        };
+            finally {
+                timeoutController?.cleanup();
+            }
+            finalText = handleMaxStepsTermination("[GoogleVertex]", step, maxSteps, finalText, lastStepText);
+            const responseTime = Date.now() - startTime;
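+            // Set token usage and finish reason on the span. NOTE(review): step >= maxSteps is also true when the last permitted step ended without tool calls, so "max_steps" may be recorded for a normal stop, and a timeout break before that is recorded as "stop" — confirm intended.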
+            span.setAttribute(ATTR.GEN_AI_INPUT_TOKENS, totalInputTokens);
+            span.setAttribute(ATTR.GEN_AI_OUTPUT_TOKENS, totalOutputTokens);
+            span.setAttribute(ATTR.GEN_AI_FINISH_REASON, step >= maxSteps ? "max_steps" : "stop");
+            // Build EnhancedGenerateResult
+            return {
+                content: finalText,
+                provider: this.providerName,
+                model: modelName,
+                usage: {
+                    input: totalInputTokens,
+                    output: totalOutputTokens,
+                    total: totalInputTokens + totalOutputTokens,
+                },
+                responseTime,
+                toolsUsed: allToolCalls.map((tc) => tc.toolName),
+                toolExecutions: toolExecutions,
+                enhancedWithTools: allToolCalls.length > 0,
+            };
+        });
     }
     /**
      * Process CSV files and append content to options.input.text
@@ -1298,7 +1495,7 @@ export class GoogleVertexProvider extends BaseProvider {
         const options = typeof optionsOrPrompt === "string"
             ? { prompt: optionsOrPrompt }
             : optionsOrPrompt;
-        const modelName = options.model || this.modelName || getDefaultVertexModel();
+        const modelName = this.resolveAlias(options.model || this.modelName || getDefaultVertexModel());
         // Check if we should use native SDK for Gemini 3 with tools
         const shouldUseTools = !options.disableTools && this.supportsTools();
         const sdkTools = shouldUseTools ? await this.getAllTools() : {};
@@ -1458,6 +1655,23 @@ export class GoogleVertexProvider extends BaseProvider {
     async hasAnthropicSupport() {
         return hasAnthropicSupport();
     }
+    /**
+     * Resolve a shorthand model name to its full Vertex AI identifier by
+     * looking it up as a key in VERTEX_MODEL_ALIASES.
+     * Returns the original name unchanged if no alias exists, i.e. when the
+     * lookup yields null or undefined (the `??` fallback).
+     *
+     * NOTE(review): other methods visible in this diff call
+     * `this.resolveAlias(...)`, not `this.resolveModelAlias(...)` — confirm
+     * that `resolveAlias` is defined elsewhere on the class.
+     * NOTE(review): if VERTEX_MODEL_ALIASES is a plain object literal, names
+     * such as "constructor" would match inherited properties and return a
+     * non-string value — confirm how the alias table is declared.
+     *
+     * @param modelName - A model name, possibly a shorthand alias
+     * @returns The alias target when one exists, otherwise `modelName` itself
+     *
+     * @example
+     * ```typescript
+     * provider.resolveModelAlias("claude-sonnet-4-5"); // "claude-sonnet-4-5@20250929"
+     * provider.resolveModelAlias("gemini-3-pro");      // "gemini-3-pro-latest"
+     * provider.resolveModelAlias("gemini-2.5-flash");  // "gemini-2.5-flash" (unchanged)
+     * ```
+     */
+    resolveModelAlias(modelName) {
+        return VERTEX_MODEL_ALIASES[modelName] ?? modelName;
+    }
     /**
      * Create an Anthropic model instance using vertexAnthropic provider
      * Uses fresh vertex settings for each request with comprehensive validation
@@ -1544,11 +1758,11 @@ export class GoogleVertexProvider extends BaseProvider {
                 modelName,
                 issue: modelValidation.issue,
                 recommendedModels: [
+                    "claude-sonnet-4-6",
+                    "claude-opus-4-6",
                     "claude-sonnet-4-5@20250929",
-                    "claude-sonnet-4@20250514",
                     "claude-opus-4@20250514",
                     "claude-3-5-sonnet-20241022",
-                    "claude-3-5-haiku-20241022",
                 ],
             });
             return null;
@@ -1749,6 +1963,8 @@ export class GoogleVertexProvider extends BaseProvider {
     async checkVertexRegionalSupport(region = "us-central1") {
         // Based on Google Cloud documentation, these regions support Anthropic models
         const supportedRegions = [
+            // Global endpoint (routed automatically)
+            "global",
             // North America
             "us-central1",
             "us-east1",
@@ -1810,10 +2026,17 @@ export class GoogleVertexProvider extends BaseProvider {
         }
         // Validate against known Claude model patterns
         const validPatterns = [
+            // Claude 4.6 — versionless IDs (no @YYYYMMDD suffix)
+            /^claude-opus-4-6$/,
+            /^claude-sonnet-4-6$/,
+            // Claude 4.x versioned
             /^claude-sonnet-4@\d{8}$/,
             /^claude-sonnet-4-5@\d{8}$/,
             /^claude-opus-4@\d{8}$/,
             /^claude-opus-4-1@\d{8}$/,
+            /^claude-opus-4-5@\d{8}$/,
+            /^claude-haiku-4-5@\d{8}$/,
+            // Claude 3.x
             /^claude-3-7-sonnet@\d{8}$/,
             /^claude-3-5-sonnet-\d{8}$/,
             /^claude-3-5-haiku-\d{8}$/,
@@ -2063,11 +2286,10 @@ export class GoogleVertexProvider extends BaseProvider {
         return "image/png";
     }
     /**
-     * Estimate token count from text (simple character-based estimation)
+     * Estimate token count from text using centralized estimation with provider multipliers (delegates to estimateTokens with the "vertex" provider key)
      */
     estimateTokenCount(text) {
-        // Rough estimation: ~4 characters per token
-        return Math.ceil(text.length / 4);
+        return estimateTokens(text, "vertex");
     }
     /**
      * Obtain a Google Auth access token for Vertex AI REST API calls.
@@ -2123,7 +2345,7 @@ export class GoogleVertexProvider extends BaseProvider {
     /**
      * Build request parts for image generation from prompt, PDFs, and images.
      */
-    buildImageGenerationParts(prompt, pdfFiles, inputImages) {
+    async buildImageGenerationParts(prompt, pdfFiles, inputImages) {
         const parts = [];
         if (prompt) {
             parts.push({ text: prompt });
@@ -2213,6 +2435,77 @@ export class GoogleVertexProvider extends BaseProvider {
                         continue;
                     }
                 }
+                else if (image.startsWith("http://") ||
+                    image.startsWith("https://")) {
+                    // Download URL image and convert to base64
+                    try {
+                        // Validate URL to prevent SSRF attacks
+                        const parsedUrl = new URL(image);
+                        const hostname = parsedUrl.hostname;
+                        const blockedHosts = ["localhost", "127.0.0.1", "0.0.0.0", "[::1]"];
+                        if (blockedHosts.some((h) => hostname === h) ||
+                            /^(10\.|172\.(1[6-9]|2\d|3[01])\.|192\.168\.)/.test(hostname)) {
+                            logger.warn(`[GoogleVertexProvider] Blocked fetch to private/local URL: ${hostname}`, { index: i });
+                            continue;
+                        }
+                        // DNS resolution check — verify resolved IPs are not private/loopback
+                        try {
+                            const { resolve4, resolve6 } = dns.promises;
+                            const addresses = [];
+                            try {
+                                addresses.push(...(await resolve4(hostname)));
+                            }
+                            catch {
+                                /* hostname may not have A records */
+                            }
+                            try {
+                                addresses.push(...(await resolve6(hostname)));
+                            }
+                            catch {
+                                /* hostname may not have AAAA records */
+                            }
+                            if (addresses.length > 0 &&
+                                addresses.every((addr) => isPrivateOrLoopbackAddress(addr))) {
+                                logger.warn(`[GoogleVertexProvider] Blocked fetch: hostname ${hostname} resolves to private/loopback address`, { index: i, addresses });
+                                continue;
+                            }
+                        }
+                        catch (dnsError) {
+                            logger.warn(`[GoogleVertexProvider] DNS resolution failed for ${hostname}, blocking fetch`, {
+                                index: i,
+                                error: dnsError instanceof Error
+                                    ? dnsError.message
+                                    : String(dnsError),
+                            });
+                            continue;
+                        }
+                        const response = await fetch(image, {
+                            signal: AbortSignal.timeout(15_000),
+                        });
+                        if (!response.ok) {
+                            logger.warn(`Failed to fetch image URL (${response.status}), skipping`, { index: i, url: image });
+                            continue;
+                        }
+                        // Size guard — reject downloads exceeding 10 MB
+                        const contentLength = response.headers.get("content-length");
+                        if (contentLength &&
+                            Number(contentLength) > MAX_IMAGE_DOWNLOAD_BYTES) {
+                            logger.warn(`[GoogleVertexProvider] Image URL exceeds ${MAX_IMAGE_DOWNLOAD_BYTES} byte limit (Content-Length: ${contentLength}), skipping`, { index: i, url: image });
+                            continue;
+                        }
+                        const buffer = Buffer.from(await response.arrayBuffer());
+                        if (buffer.byteLength > MAX_IMAGE_DOWNLOAD_BYTES) {
+                            logger.warn(`[GoogleVertexProvider] Downloaded image exceeds ${MAX_IMAGE_DOWNLOAD_BYTES} byte limit (${buffer.byteLength} bytes), skipping`, { index: i, url: image });
+                            continue;
+                        }
+                        imageBase64 = buffer.toString("base64");
+                        mimeType = this.detectImageType(buffer);
+                    }
+                    catch (fetchError) {
+                        logger.warn(`Failed to download image from URL, skipping: ${fetchError instanceof Error ? fetchError.message : String(fetchError)}`, { index: i, url: image });
+                        continue;
+                    }
+                }
                 else {
                     imageBase64 = image;
                     const decodedBuffer = Buffer.from(imageBase64, "base64");
@@ -2309,7 +2602,7 @@ export class GoogleVertexProvider extends BaseProvider {
         });
         try {
             const token = await this.getImageGenerationAccessToken();
-            const parts = this.buildImageGenerationParts(prompt, pdfFiles, inputImages);
+            const parts = await this.buildImageGenerationParts(prompt, pdfFiles, inputImages);
             // Build request body with CRITICAL response_modalities setting
             const requestBody = {
                 contents: [{ role: "user", parts }],