npm - @juspay/neurolink - Versions diffs - 9.50.0 → 9.50.1 - Mend

@juspay/neurolink 9.50.0 → 9.50.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

package/CHANGELOG.md +6 -0
package/dist/browser/neurolink.min.js +270 -270
package/dist/lib/providers/litellm.js +2 -2
package/dist/lib/proxy/proxyTracer.d.ts +14 -0
package/dist/lib/proxy/proxyTracer.js +43 -0
package/dist/lib/server/routes/claudeProxyRoutes.js +112 -33
package/dist/providers/litellm.js +2 -2
package/dist/proxy/proxyTracer.d.ts +14 -0
package/dist/proxy/proxyTracer.js +43 -0
package/dist/server/routes/claudeProxyRoutes.js +112 -33
package/package.json +1 -1

package/dist/lib/providers/litellm.js CHANGED

@@ -356,8 +356,8 @@ export class LiteLLMProvider extends BaseProvider {
         }
         catch (streamError) {
             if (NoOutputGeneratedError.isInstance(streamError)) {
-                logger.warn("LiteLLM: Stream produced no output (NoOutputGeneratedError)");
-                return;
+                logger.warn("LiteLLM: Stream produced no output (NoOutputGeneratedError) — propagating to fallback chain");
+                throw streamError;
             }
             throw streamError;
         }

package/dist/lib/proxy/proxyTracer.d.ts CHANGED

@@ -90,6 +90,13 @@ declare class ProxyTracer {
      * Sets span attributes and increments the substitution metric counter.
      */
     setModelSubstitution(requestedModel: string, actualModel: string): void;
+    setFallbackInfo(info: {
+        triggered: boolean;
+        provider?: string;
+        model?: string;
+        attemptCount: number;
+        reason: string;
+    }): void;
     /** Log the incoming client request body (redacted). */
     logRequestBody(body: string): void;
     /** Log the incoming client request headers (redacted). */
@@ -129,5 +136,12 @@ declare class ProxyTracer {
      */
     getTraceHeaders(): Record<string, string>;
 }
+export declare function recordFallbackAttempt(attrs: {
+    provider: string;
+    model: string;
+    status: "success" | "failure";
+    errorMessage?: string;
+    durationMs: number;
+}): void;
 export { ProxyTracer };
 export type { ProxyRequestContext, AccountSelectionContext, UpstreamAttemptContext, UsageContext, };

package/dist/lib/proxy/proxyTracer.js CHANGED

@@ -79,6 +79,18 @@ function getProxyMetrics() {
             description: "Response body size in bytes received from upstream",
             unit: "By",
         }),
+        fallbackAttemptsTotal: meter.createCounter("proxy_fallback_attempts_total", {
+            description: "Total fallback provider attempts",
+            unit: "{attempt}",
+        }),
+        fallbackSuccessTotal: meter.createCounter("proxy_fallback_success_total", {
+            description: "Total successful fallback provider responses",
+            unit: "{success}",
+        }),
+        fallbackFailureTotal: meter.createCounter("proxy_fallback_failure_total", {
+            description: "Total failed fallback provider responses",
+            unit: "{failure}",
+        }),
     };
     _metrics = createdMetrics;
     return createdMetrics;
@@ -396,6 +408,18 @@ class ProxyTracer {
             actual_model: actualModel,
         });
     }
+    setFallbackInfo(info) {
+        if (!this.rootSpan) {
+            return;
+        }
+        this.rootSpan.setAttributes({
+            "proxy.fallback.triggered": info.triggered,
+            ...(info.provider ? { "proxy.fallback.provider": info.provider } : {}),
+            ...(info.model ? { "proxy.fallback.model": info.model } : {}),
+            "proxy.fallback.attempt_count": info.attemptCount,
+            "proxy.fallback.reason": info.reason,
+        });
+    }
     // -------------------------------------------------------------------------
     // Log payloads as span events
     // -------------------------------------------------------------------------
@@ -641,5 +665,24 @@ class ProxyTracer {
         return this.bridge.injectContext({}, trace.setSpan(context.active(), this.rootSpan));
     }
 }
+export function recordFallbackAttempt(attrs) {
+    try {
+        const m = getProxyMetrics();
+        const labels = { provider: attrs.provider, model: attrs.model };
+        m.fallbackAttemptsTotal.add(1, labels);
+        if (attrs.status === "success") {
+            m.fallbackSuccessTotal.add(1, labels);
+        }
+        else {
+            m.fallbackFailureTotal.add(1, {
+                ...labels,
+                error: attrs.errorMessage?.slice(0, 100) ?? "unknown",
+            });
+        }
+    }
+    catch {
+        // metrics are best-effort
+    }
+}
 export { ProxyTracer };
 //# sourceMappingURL=proxyTracer.js.map

package/dist/lib/server/routes/claudeProxyRoutes.js CHANGED

@@ -15,7 +15,7 @@ import { join } from "node:path";
 import { buildStableClaudeCodeBillingHeader, CLAUDE_CLI_USER_AGENT, CLAUDE_CODE_OAUTH_BETAS, getOrCreateClaudeCodeIdentity, parseClaudeCodeUserId, } from "../../auth/anthropicOAuth.js";
 import { parseQuotaHeaders, saveAccountQuota, } from "../../proxy/accountQuota.js";
 import { buildClaudeError, ClaudeStreamSerializer, generateToolUseId, parseClaudeRequest, serializeClaudeResponse, } from "../../proxy/claudeFormat.js";
-import { ProxyTracer } from "../../proxy/proxyTracer.js";
+import { ProxyTracer, recordFallbackAttempt } from "../../proxy/proxyTracer.js";
 import { createRawStreamCapture } from "../../proxy/rawStreamCapture.js";
 import { logBodyCapture, logRequest, logRequestAttempt, logStreamError, } from "../../proxy/requestLogger.js";
 import { createSSEInterceptor } from "../../proxy/sseInterceptor.js";
@@ -1246,43 +1246,64 @@ async function executeClaudeFallbackTranslation(args) {
     if (body.stream) {
         const streamResult = await ctx.neurolink.stream(options);
         const serializer = new ClaudeStreamSerializer(body.model, 0);
-        async function* sseGenerator() {
-            for (const frame of serializer.start()) {
-                yield frame;
-            }
-            let collectedText = "";
-            for await (const chunk of streamResult.stream) {
-                const text = extractText(chunk);
-                if (text) {
-                    collectedText += text;
-                    for (const frame of serializer.pushDelta(text)) {
-                        yield frame;
-                    }
+        // Eagerly consume stream so errors fire synchronously and the
+        // fallback loop in tryConfiguredClaudeFallbackChain can catch them.
+        const frames = [];
+        let collectedText = "";
+        for (const frame of serializer.start()) {
+            frames.push(frame);
+        }
+        for await (const chunk of streamResult.stream) {
+            const text = extractText(chunk);
+            if (text) {
+                collectedText += text;
+                for (const frame of serializer.pushDelta(text)) {
+                    frames.push(frame);
                 }
             }
-            const toolCalls = streamResult.toolCalls ?? [];
-            if (!hasTranslatedOutput(collectedText, toolCalls)) {
-                throw new Error(`Translated provider ${providerLabel} returned no content or tool calls`);
-            }
-            if (toolCalls.length) {
-                for (const toolCall of toolCalls) {
-                    const toolName = toolCall.toolName ??
-                        toolCall.name ??
-                        "unknown";
-                    for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, extractToolArgs(toolCall))) {
-                        yield frame;
-                    }
+        }
+        const toolCalls = streamResult.toolCalls ?? [];
+        if (!hasTranslatedOutput(collectedText, toolCalls)) {
+            throw new Error(`Translated provider ${providerLabel} returned no content or tool calls`);
+        }
+        if (toolCalls.length) {
+            for (const toolCall of toolCalls) {
+                const toolName = toolCall.toolName ??
+                    toolCall.name ??
+                    "unknown";
+                for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, extractToolArgs(toolCall))) {
+                    frames.push(frame);
                 }
             }
-            const reason = streamResult.finishReason ?? "end_turn";
-            const resolvedUsage = extractUsageFromStreamResult(streamResult.usage);
-            for (const frame of serializer.finish(resolvedUsage.output, reason)) {
-                yield frame;
-            }
         }
+        const reason = streamResult.finishReason ?? "end_turn";
+        const resolvedUsage = extractUsageFromStreamResult(streamResult.usage);
+        for (const frame of serializer.finish(resolvedUsage.output, reason)) {
+            frames.push(frame);
+        }
+        // Telemetry AFTER validation — not before like the old lazy path
         tracer?.end(200, Date.now() - requestStartTime);
         recordFinalSuccess();
-        logFinalRequest(200, "", providerLabel);
+        logFinalRequest(200, "", providerLabel, undefined, undefined, {
+            inputTokens: resolvedUsage.input,
+            outputTokens: resolvedUsage.output,
+        });
+        const bufferedBody = frames.join("");
+        logProxyBody({
+            phase: "client_response",
+            headers: { "content-type": "text/event-stream" },
+            body: bufferedBody,
+            bodySize: Buffer.byteLength(bufferedBody, "utf8"),
+            contentType: "text/event-stream",
+            responseStatus: 200,
+            durationMs: Date.now() - requestStartTime,
+        });
+        // Return generator that yields pre-buffered frames
+        async function* sseGenerator() {
+            for (const frame of frames) {
+                yield frame;
+            }
+        }
         return sseGenerator();
     }
     const streamResult = await ctx.neurolink.stream(options);
@@ -1346,6 +1367,11 @@ async function tryConfiguredClaudeFallbackChain(args) {
             : "auto-provider";
         logger.always(`[proxy] skipping fallback ${label}: ${skipped.reason}`);
     }
+    tracer?.setFallbackInfo({
+        triggered: true,
+        attemptCount: fallbackPlan.attempts.slice(1).length,
+        reason: fallbackPolicyReason ?? "all_anthropic_accounts_exhausted",
+    });
     for (const fallback of fallbackPlan.attempts.slice(1)) {
         if (!fallback.provider || !fallback.model) {
             continue;
@@ -1354,6 +1380,7 @@ async function tryConfiguredClaudeFallbackChain(args) {
         if (!availability.available) {
             logger.always(`[proxy] fallback ${fallback.provider}/${fallback.model} health-check failed (${availability.reason ?? "provider unavailable"}), attempting anyway`);
         }
+        const fallbackStart = Date.now();
         try {
             logger.always(`[proxy] fallback → ${fallback.provider}/${fallback.model}`);
             const options = buildProxyFallbackOptions(parsedFallbackRequest, {
@@ -1370,13 +1397,57 @@ async function tryConfiguredClaudeFallbackChain(args) {
                 options: options,
                 providerLabel: fallback.provider,
             });
+            recordFallbackAttempt({
+                provider: fallback.provider,
+                model: fallback.model,
+                status: "success",
+                durationMs: Date.now() - fallbackStart,
+            });
+            tracer?.setFallbackInfo({
+                triggered: true,
+                provider: fallback.provider,
+                model: fallback.model,
+                attemptCount: fallbackPlan.attempts.slice(1).length,
+                reason: "fallback_success",
+            });
             return {
                 response,
                 fallbackPolicyReason,
             };
         }
         catch (fallbackErr) {
-            logger.always(`[proxy] fallback ${fallback.provider}/${fallback.model} failed: ${fallbackErr instanceof Error ? fallbackErr.message : String(fallbackErr)}`);
+            const errMsg = fallbackErr instanceof Error
+                ? fallbackErr.message
+                : String(fallbackErr);
+            let errorClass = "unknown";
+            if (errMsg.includes("Rate limit") ||
+                errMsg.includes("rate_limit") ||
+                errMsg.includes("max_parallel_requests")) {
+                errorClass = "rate_limit";
+            }
+            else if (errMsg.includes("context length") ||
+                errMsg.includes("ContextWindowExceeded")) {
+                errorClass = "context_overflow";
+            }
+            else if (errMsg.includes("no content or tool calls") ||
+                errMsg.includes("NoOutputGenerated")) {
+                errorClass = "empty_response";
+            }
+            else if (errMsg.includes("thinking_level") ||
+                errMsg.includes("Field required")) {
+                errorClass = "schema_mismatch";
+            }
+            else if (errMsg.includes("Resource exhausted")) {
+                errorClass = "provider_quota";
+            }
+            logger.always(`[proxy] fallback ${fallback.provider}/${fallback.model} failed [${errorClass}]: ${errMsg}`);
+            recordFallbackAttempt({
+                provider: fallback.provider,
+                model: fallback.model,
+                status: "failure",
+                errorMessage: `[${errorClass}] ${errMsg}`,
+                durationMs: Date.now() - fallbackStart,
+            });
         }
     }
     return {
@@ -3541,7 +3612,15 @@ function shouldOmitImagesForTarget(provider, model) {
     return provider === "litellm" && model === "open-large";
 }
 function shouldOmitThinkingConfigForTarget(provider, model) {
-    return provider === "vertex" && model === "gemini-2.5-flash";
+    if (provider === "litellm") {
+        return true;
+    }
+    if (provider !== "vertex") {
+        return false;
+    }
+    // Only Gemini 2.5+ and 3.x support thinking_level on Vertex.
+    const m = model?.toLowerCase() ?? "";
+    return !/gemini-(2\.5|3)/.test(m);
 }
 function extractToolArgs(toolCall) {
     return (toolCall.args ??

package/dist/providers/litellm.js CHANGED

@@ -356,8 +356,8 @@ export class LiteLLMProvider extends BaseProvider {
         }
         catch (streamError) {
             if (NoOutputGeneratedError.isInstance(streamError)) {
-                logger.warn("LiteLLM: Stream produced no output (NoOutputGeneratedError)");
-                return;
+                logger.warn("LiteLLM: Stream produced no output (NoOutputGeneratedError) — propagating to fallback chain");
+                throw streamError;
             }
             throw streamError;
         }

package/dist/proxy/proxyTracer.d.ts CHANGED

@@ -90,6 +90,13 @@ declare class ProxyTracer {
      * Sets span attributes and increments the substitution metric counter.
      */
     setModelSubstitution(requestedModel: string, actualModel: string): void;
+    setFallbackInfo(info: {
+        triggered: boolean;
+        provider?: string;
+        model?: string;
+        attemptCount: number;
+        reason: string;
+    }): void;
     /** Log the incoming client request body (redacted). */
     logRequestBody(body: string): void;
     /** Log the incoming client request headers (redacted). */
@@ -129,5 +136,12 @@ declare class ProxyTracer {
      */
     getTraceHeaders(): Record<string, string>;
 }
+export declare function recordFallbackAttempt(attrs: {
+    provider: string;
+    model: string;
+    status: "success" | "failure";
+    errorMessage?: string;
+    durationMs: number;
+}): void;
 export { ProxyTracer };
 export type { ProxyRequestContext, AccountSelectionContext, UpstreamAttemptContext, UsageContext, };

package/dist/proxy/proxyTracer.js CHANGED

@@ -79,6 +79,18 @@ function getProxyMetrics() {
             description: "Response body size in bytes received from upstream",
             unit: "By",
         }),
+        fallbackAttemptsTotal: meter.createCounter("proxy_fallback_attempts_total", {
+            description: "Total fallback provider attempts",
+            unit: "{attempt}",
+        }),
+        fallbackSuccessTotal: meter.createCounter("proxy_fallback_success_total", {
+            description: "Total successful fallback provider responses",
+            unit: "{success}",
+        }),
+        fallbackFailureTotal: meter.createCounter("proxy_fallback_failure_total", {
+            description: "Total failed fallback provider responses",
+            unit: "{failure}",
+        }),
     };
     _metrics = createdMetrics;
     return createdMetrics;
@@ -396,6 +408,18 @@ class ProxyTracer {
             actual_model: actualModel,
         });
     }
+    setFallbackInfo(info) {
+        if (!this.rootSpan) {
+            return;
+        }
+        this.rootSpan.setAttributes({
+            "proxy.fallback.triggered": info.triggered,
+            ...(info.provider ? { "proxy.fallback.provider": info.provider } : {}),
+            ...(info.model ? { "proxy.fallback.model": info.model } : {}),
+            "proxy.fallback.attempt_count": info.attemptCount,
+            "proxy.fallback.reason": info.reason,
+        });
+    }
     // -------------------------------------------------------------------------
     // Log payloads as span events
     // -------------------------------------------------------------------------
@@ -641,4 +665,23 @@ class ProxyTracer {
         return this.bridge.injectContext({}, trace.setSpan(context.active(), this.rootSpan));
     }
 }
+export function recordFallbackAttempt(attrs) {
+    try {
+        const m = getProxyMetrics();
+        const labels = { provider: attrs.provider, model: attrs.model };
+        m.fallbackAttemptsTotal.add(1, labels);
+        if (attrs.status === "success") {
+            m.fallbackSuccessTotal.add(1, labels);
+        }
+        else {
+            m.fallbackFailureTotal.add(1, {
+                ...labels,
+                error: attrs.errorMessage?.slice(0, 100) ?? "unknown",
+            });
+        }
+    }
+    catch {
+        // metrics are best-effort
+    }
+}
 export { ProxyTracer };

package/dist/server/routes/claudeProxyRoutes.js CHANGED

@@ -15,7 +15,7 @@ import { join } from "node:path";
 import { buildStableClaudeCodeBillingHeader, CLAUDE_CLI_USER_AGENT, CLAUDE_CODE_OAUTH_BETAS, getOrCreateClaudeCodeIdentity, parseClaudeCodeUserId, } from "../../auth/anthropicOAuth.js";
 import { parseQuotaHeaders, saveAccountQuota, } from "../../proxy/accountQuota.js";
 import { buildClaudeError, ClaudeStreamSerializer, generateToolUseId, parseClaudeRequest, serializeClaudeResponse, } from "../../proxy/claudeFormat.js";
-import { ProxyTracer } from "../../proxy/proxyTracer.js";
+import { ProxyTracer, recordFallbackAttempt } from "../../proxy/proxyTracer.js";
 import { createRawStreamCapture } from "../../proxy/rawStreamCapture.js";
 import { logBodyCapture, logRequest, logRequestAttempt, logStreamError, } from "../../proxy/requestLogger.js";
 import { createSSEInterceptor } from "../../proxy/sseInterceptor.js";
@@ -1246,43 +1246,64 @@ async function executeClaudeFallbackTranslation(args) {
     if (body.stream) {
         const streamResult = await ctx.neurolink.stream(options);
         const serializer = new ClaudeStreamSerializer(body.model, 0);
-        async function* sseGenerator() {
-            for (const frame of serializer.start()) {
-                yield frame;
-            }
-            let collectedText = "";
-            for await (const chunk of streamResult.stream) {
-                const text = extractText(chunk);
-                if (text) {
-                    collectedText += text;
-                    for (const frame of serializer.pushDelta(text)) {
-                        yield frame;
-                    }
+        // Eagerly consume stream so errors fire synchronously and the
+        // fallback loop in tryConfiguredClaudeFallbackChain can catch them.
+        const frames = [];
+        let collectedText = "";
+        for (const frame of serializer.start()) {
+            frames.push(frame);
+        }
+        for await (const chunk of streamResult.stream) {
+            const text = extractText(chunk);
+            if (text) {
+                collectedText += text;
+                for (const frame of serializer.pushDelta(text)) {
+                    frames.push(frame);
                 }
             }
-            const toolCalls = streamResult.toolCalls ?? [];
-            if (!hasTranslatedOutput(collectedText, toolCalls)) {
-                throw new Error(`Translated provider ${providerLabel} returned no content or tool calls`);
-            }
-            if (toolCalls.length) {
-                for (const toolCall of toolCalls) {
-                    const toolName = toolCall.toolName ??
-                        toolCall.name ??
-                        "unknown";
-                    for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, extractToolArgs(toolCall))) {
-                        yield frame;
-                    }
+        }
+        const toolCalls = streamResult.toolCalls ?? [];
+        if (!hasTranslatedOutput(collectedText, toolCalls)) {
+            throw new Error(`Translated provider ${providerLabel} returned no content or tool calls`);
+        }
+        if (toolCalls.length) {
+            for (const toolCall of toolCalls) {
+                const toolName = toolCall.toolName ??
+                    toolCall.name ??
+                    "unknown";
+                for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, extractToolArgs(toolCall))) {
+                    frames.push(frame);
                 }
             }
-            const reason = streamResult.finishReason ?? "end_turn";
-            const resolvedUsage = extractUsageFromStreamResult(streamResult.usage);
-            for (const frame of serializer.finish(resolvedUsage.output, reason)) {
-                yield frame;
-            }
         }
+        const reason = streamResult.finishReason ?? "end_turn";
+        const resolvedUsage = extractUsageFromStreamResult(streamResult.usage);
+        for (const frame of serializer.finish(resolvedUsage.output, reason)) {
+            frames.push(frame);
+        }
+        // Telemetry AFTER validation — not before like the old lazy path
         tracer?.end(200, Date.now() - requestStartTime);
         recordFinalSuccess();
-        logFinalRequest(200, "", providerLabel);
+        logFinalRequest(200, "", providerLabel, undefined, undefined, {
+            inputTokens: resolvedUsage.input,
+            outputTokens: resolvedUsage.output,
+        });
+        const bufferedBody = frames.join("");
+        logProxyBody({
+            phase: "client_response",
+            headers: { "content-type": "text/event-stream" },
+            body: bufferedBody,
+            bodySize: Buffer.byteLength(bufferedBody, "utf8"),
+            contentType: "text/event-stream",
+            responseStatus: 200,
+            durationMs: Date.now() - requestStartTime,
+        });
+        // Return generator that yields pre-buffered frames
+        async function* sseGenerator() {
+            for (const frame of frames) {
+                yield frame;
+            }
+        }
         return sseGenerator();
     }
     const streamResult = await ctx.neurolink.stream(options);
@@ -1346,6 +1367,11 @@ async function tryConfiguredClaudeFallbackChain(args) {
             : "auto-provider";
         logger.always(`[proxy] skipping fallback ${label}: ${skipped.reason}`);
     }
+    tracer?.setFallbackInfo({
+        triggered: true,
+        attemptCount: fallbackPlan.attempts.slice(1).length,
+        reason: fallbackPolicyReason ?? "all_anthropic_accounts_exhausted",
+    });
     for (const fallback of fallbackPlan.attempts.slice(1)) {
         if (!fallback.provider || !fallback.model) {
             continue;
@@ -1354,6 +1380,7 @@ async function tryConfiguredClaudeFallbackChain(args) {
         if (!availability.available) {
             logger.always(`[proxy] fallback ${fallback.provider}/${fallback.model} health-check failed (${availability.reason ?? "provider unavailable"}), attempting anyway`);
         }
+        const fallbackStart = Date.now();
         try {
             logger.always(`[proxy] fallback → ${fallback.provider}/${fallback.model}`);
             const options = buildProxyFallbackOptions(parsedFallbackRequest, {
@@ -1370,13 +1397,57 @@ async function tryConfiguredClaudeFallbackChain(args) {
                 options: options,
                 providerLabel: fallback.provider,
             });
+            recordFallbackAttempt({
+                provider: fallback.provider,
+                model: fallback.model,
+                status: "success",
+                durationMs: Date.now() - fallbackStart,
+            });
+            tracer?.setFallbackInfo({
+                triggered: true,
+                provider: fallback.provider,
+                model: fallback.model,
+                attemptCount: fallbackPlan.attempts.slice(1).length,
+                reason: "fallback_success",
+            });
             return {
                 response,
                 fallbackPolicyReason,
             };
         }
         catch (fallbackErr) {
-            logger.always(`[proxy] fallback ${fallback.provider}/${fallback.model} failed: ${fallbackErr instanceof Error ? fallbackErr.message : String(fallbackErr)}`);
+            const errMsg = fallbackErr instanceof Error
+                ? fallbackErr.message
+                : String(fallbackErr);
+            let errorClass = "unknown";
+            if (errMsg.includes("Rate limit") ||
+                errMsg.includes("rate_limit") ||
+                errMsg.includes("max_parallel_requests")) {
+                errorClass = "rate_limit";
+            }
+            else if (errMsg.includes("context length") ||
+                errMsg.includes("ContextWindowExceeded")) {
+                errorClass = "context_overflow";
+            }
+            else if (errMsg.includes("no content or tool calls") ||
+                errMsg.includes("NoOutputGenerated")) {
+                errorClass = "empty_response";
+            }
+            else if (errMsg.includes("thinking_level") ||
+                errMsg.includes("Field required")) {
+                errorClass = "schema_mismatch";
+            }
+            else if (errMsg.includes("Resource exhausted")) {
+                errorClass = "provider_quota";
+            }
+            logger.always(`[proxy] fallback ${fallback.provider}/${fallback.model} failed [${errorClass}]: ${errMsg}`);
+            recordFallbackAttempt({
+                provider: fallback.provider,
+                model: fallback.model,
+                status: "failure",
+                errorMessage: `[${errorClass}] ${errMsg}`,
+                durationMs: Date.now() - fallbackStart,
+            });
         }
     }
     return {
@@ -3541,7 +3612,15 @@ function shouldOmitImagesForTarget(provider, model) {
     return provider === "litellm" && model === "open-large";
 }
 function shouldOmitThinkingConfigForTarget(provider, model) {
-    return provider === "vertex" && model === "gemini-2.5-flash";
+    if (provider === "litellm") {
+        return true;
+    }
+    if (provider !== "vertex") {
+        return false;
+    }
+    // Only Gemini 2.5+ and 3.x support thinking_level on Vertex.
+    const m = model?.toLowerCase() ?? "";
+    return !/gemini-(2\.5|3)/.test(m);
 }
 function extractToolArgs(toolCall) {
     return (toolCall.args ??

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@juspay/neurolink",
-  "version": "9.50.0",
+  "version": "9.50.1",
   "packageManager": "pnpm@10.15.1",
   "description": "Universal AI Development Platform with working MCP integration, multi-provider support, and professional CLI. Built-in tools operational, 58+ external MCP servers discoverable. Connect to filesystem, GitHub, database operations, and more. Build, test, and deploy AI applications with 13 providers: OpenAI, Anthropic, Google AI, AWS Bedrock, Azure, Hugging Face, Ollama, and Mistral AI.",
   "author": {