npm - @ai-sdk/gateway - Versions diffs - 4.0.0-beta.45 → 4.0.0-beta.47 - Mend

@ai-sdk/gateway 4.0.0-beta.45 → 4.0.0-beta.47

This diff shows the contents of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (14)

package/CHANGELOG.md +14 -0
package/dist/index.d.mts +2 -1
package/dist/index.d.ts +2 -1
package/dist/index.js +2 -7
package/dist/index.js.map +1 -1
package/dist/index.mjs +2 -7
package/dist/index.mjs.map +1 -1
package/docs/00-ai-gateway.mdx +14 -0
package/package.json +2 -2
package/src/errors/create-gateway-error.ts +0 -1
package/src/errors/gateway-authentication-error.ts +0 -1
package/src/gateway-image-model.ts +1 -5
package/src/gateway-language-model.ts +0 -1
package/src/gateway-provider-options.ts +8 -0

package/docs/00-ai-gateway.mdx CHANGED Viewed

@@ -778,6 +778,20 @@ The following gateway provider options are available:
   Example: `only: ['anthropic', 'vertex']` will only allow routing to Anthropic or Vertex AI.
+- **sort** _'cost' | 'ttft' | 'tps'_
+  Sorts available providers by a performance or cost metric before routing. The gateway will try the best-scoring provider first and fall back through the rest in sorted order. If unspecified, providers are ordered using the gateway's default system ranking.
+  - `'cost'` — lowest input cost per token first
+  - `'ttft'` — lowest time-to-first-token first
+  - `'tps'` — highest tokens-per-second first
+  When combined with `order`, the user-specified providers are promoted to the front while remaining providers follow the sorted order.
+  Example: `sort: 'ttft'` will route to the provider with the fastest time-to-first-token.
+  When `sort` is active, the response's `providerMetadata.gateway.routing.sort` object contains the sort option used, the resulting execution order, per-provider metric values, and any providers that were deprioritized.
 - **models** _string[]_
   Specifies fallback models to use when the primary model fails or is unavailable. The gateway will try the primary model first (specified in the `model` parameter), then try each model in this array in order until one succeeds.

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "@ai-sdk/gateway",
   "private": false,
-  "version": "4.0.0-beta.45",
+  "version": "4.0.0-beta.47",
   "license": "Apache-2.0",
   "sideEffects": false,
   "main": "./dist/index.js",
@@ -32,7 +32,7 @@
   "dependencies": {
     "@vercel/oidc": "3.2.0",
     "@ai-sdk/provider": "4.0.0-beta.10",
-    "@ai-sdk/provider-utils": "5.0.0-beta.17"
+    "@ai-sdk/provider-utils": "5.0.0-beta.18"
   },
   "devDependencies": {
     "@types/node": "18.15.11",

package/src/errors/create-gateway-error.ts CHANGED Viewed

@@ -13,7 +13,6 @@ import {
   InferSchema,
   lazySchema,
   safeValidateTypes,
-  validateTypes,
   zodSchema,
 } from '@ai-sdk/provider-utils';

package/src/errors/gateway-authentication-error.ts CHANGED Viewed

@@ -37,7 +37,6 @@ export class GatewayAuthenticationError extends GatewayError {
   static createContextualError({
     apiKeyProvided,
     oidcTokenProvided,
-    message = 'Authentication failed',
     statusCode = 401,
     cause,
     generationId,

package/src/gateway-image-model.ts CHANGED Viewed

@@ -50,11 +50,7 @@ export class GatewayImageModel implements ImageModelV4 {
   > {
     const resolvedHeaders = await resolve(this.config.headers());
     try {
-      const {
-        responseHeaders,
-        value: responseBody,
-        rawValue,
-      } = await postJsonToApi({
+      const { responseHeaders, value: responseBody } = await postJsonToApi({
         url: this.getUrl(),
         headers: combineHeaders(
           resolvedHeaders,

package/src/gateway-language-model.ts CHANGED Viewed

@@ -1,7 +1,6 @@
 import type {
   LanguageModelV4,
   LanguageModelV4CallOptions,
-  SharedV4Warning,
   LanguageModelV4FilePart,
   LanguageModelV4StreamPart,
   LanguageModelV4GenerateResult,

package/src/gateway-provider-options.ts CHANGED Viewed

@@ -17,6 +17,14 @@ const gatewayProviderOptions = lazySchema(() =>
        * Example: `['bedrock', 'anthropic']` will try Amazon Bedrock first, then Anthropic as fallback.
        */
       order: z.array(z.string()).optional(),
+      /**
+       * Sort providers by a performance or cost metric before routing.
+       *
+       * - `'cost'`: lowest input cost first
+       * - `'ttft'`: lowest time-to-first-token first
+       * - `'tps'`: highest tokens-per-second first
+       */
+      sort: z.enum(['cost', 'ttft', 'tps']).optional(),
       /**
        * The unique identifier for the end user on behalf of whom the request was made.
        *