npm - @ai-sdk/gateway - Versions diffs - 4.0.0-canary.101 → 4.0.0-canary.103 - Mend

@ai-sdk/gateway 4.0.0-canary.101 → 4.0.0-canary.103

This diff shows the contents of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (12)

package/CHANGELOG.md +38 -0
package/dist/index.d.ts +98 -19
package/dist/index.js +153 -2
package/dist/index.js.map +1 -1
package/docs/00-ai-gateway.mdx +70 -0
package/package.json +3 -3
package/src/gateway-provider-options.ts +50 -116
package/src/gateway-provider.ts +56 -0
package/src/gateway-realtime-auth.ts +126 -0
package/src/gateway-realtime-model-settings.ts +1 -0
package/src/gateway-realtime-model.ts +107 -0
package/src/index.ts +9 -0

package/CHANGELOG.md CHANGED

@@ -1,5 +1,43 @@
 # @ai-sdk/gateway
+## 4.0.0-canary.103
+### Patch Changes
+- Updated dependencies [bae5e2b]
+  - @ai-sdk/provider-utils@5.0.0-canary.47
+## 4.0.0-canary.102
+### Patch Changes
+- a3bb04a: feat(gateway): add experimental realtime model support
+  Adds `gateway.experimental_realtime()` for bidirectional audio/text realtime
+  sessions routed through the AI Gateway. Like every other Gateway modality, the
+  client speaks the normalized AI SDK realtime protocol and the Gateway
+  translates to/from the upstream provider server-side, so `GatewayRealtimeModel`
+  is a thin identity codec. Gateway realtime is server-side only for v0 and throws
+  if used in a browser because it returns the resolved Gateway auth token rather
+  than a minted ephemeral client secret. Because the browser `WebSocket` API
+  cannot set request headers, the Gateway auth token is carried via the
+  `Sec-WebSocket-Protocol` subprotocol (the same workaround used for OpenAI) and
+  the model id rides the `?ai-model-id=` query — the WS transport of the
+  `ai-model-id` header used by the HTTP routes. The model id is passed through
+  verbatim; the Gateway owns resolution. Provider options (including BYOK) flow
+  through the normalized `session.update`, exactly as they ride the request body
+  on the non-realtime routes.
+  The versioned subprotocol auth contract is centralized so the client and the
+  Gateway server share one definition: `getGatewayRealtimeProtocols` (client
+  encode) and `getGatewayRealtimeAuthToken` (server decode), plus the
+  `GATEWAY_REALTIME_SUBPROTOCOL` / `GATEWAY_AUTH_SUBPROTOCOL_PREFIX` constants.
+  `GatewayProviderOptions` documents the stable client-facing option fields while
+  remaining open to service-owned options. Runtime validation lives in the Gateway
+  service so the server can evolve without requiring an SDK release for every new
+  option.
 ## 4.0.0-canary.101
 ### Patch Changes

package/dist/index.d.ts CHANGED

@@ -1,9 +1,64 @@
-import { LanguageModelV4, ProviderV4, EmbeddingModelV4, ImageModelV4, Experimental_VideoModelV4, RerankingModelV4, SpeechModelV4, TranscriptionModelV4, TypeValidationError } from '@ai-sdk/provider';
+import { LanguageModelV4, ProviderV4, EmbeddingModelV4, ImageModelV4, Experimental_VideoModelV4, RerankingModelV4, SpeechModelV4, TranscriptionModelV4, Experimental_RealtimeFactoryV4, TypeValidationError } from '@ai-sdk/provider';
 import * as _ai_sdk_provider_utils from '@ai-sdk/provider-utils';
 import { FetchFunction, InferSchema } from '@ai-sdk/provider-utils';
 type GatewayModelId = 'alibaba/qwen-3-14b' | 'alibaba/qwen-3-235b' | 'alibaba/qwen-3-30b' | 'alibaba/qwen-3-32b' | 'alibaba/qwen-3.6-max-preview' | 'alibaba/qwen3-235b-a22b-thinking' | 'alibaba/qwen3-coder' | 'alibaba/qwen3-coder-30b-a3b' | 'alibaba/qwen3-coder-next' | 'alibaba/qwen3-coder-plus' | 'alibaba/qwen3-max' | 'alibaba/qwen3-max-preview' | 'alibaba/qwen3-max-thinking' | 'alibaba/qwen3-next-80b-a3b-instruct' | 'alibaba/qwen3-next-80b-a3b-thinking' | 'alibaba/qwen3-vl-235b-a22b-instruct' | 'alibaba/qwen3-vl-instruct' | 'alibaba/qwen3-vl-thinking' | 'alibaba/qwen3.5-flash' | 'alibaba/qwen3.5-plus' | 'alibaba/qwen3.6-27b' | 'alibaba/qwen3.6-plus' | 'alibaba/qwen3.7-max' | 'alibaba/qwen3.7-plus' | 'amazon/nova-2-lite' | 'amazon/nova-lite' | 'amazon/nova-micro' | 'amazon/nova-pro' | 'anthropic/claude-3-haiku' | 'anthropic/claude-3.5-haiku' | 'anthropic/claude-fable-5' | 'anthropic/claude-haiku-4.5' | 'anthropic/claude-opus-4' | 'anthropic/claude-opus-4.1' | 'anthropic/claude-opus-4.5' | 'anthropic/claude-opus-4.6' | 'anthropic/claude-opus-4.7' | 'anthropic/claude-opus-4.8' | 'anthropic/claude-sonnet-4' | 'anthropic/claude-sonnet-4.5' | 'anthropic/claude-sonnet-4.6' | 'arcee-ai/trinity-large-preview' | 'arcee-ai/trinity-large-thinking' | 'arcee-ai/trinity-mini' | 'bytedance/seed-1.6' | 'bytedance/seed-1.8' | 'cohere/command-a' | 'deepseek/deepseek-r1' | 'deepseek/deepseek-v3' | 'deepseek/deepseek-v3.1' | 'deepseek/deepseek-v3.1-terminus' | 'deepseek/deepseek-v3.2' | 'deepseek/deepseek-v3.2-thinking' | 'deepseek/deepseek-v4-flash' | 'deepseek/deepseek-v4-pro' | 'google/gemini-2.5-flash' | 'google/gemini-2.5-flash-image' | 'google/gemini-2.5-flash-lite' | 'google/gemini-2.5-pro' | 'google/gemini-3-flash' | 'google/gemini-3-pro-image' | 'google/gemini-3-pro-preview' | 'google/gemini-3.1-flash-image' | 'google/gemini-3.1-flash-image-preview' | 'google/gemini-3.1-flash-lite' | 'google/gemini-3.1-flash-lite-preview' | 'google/gemini-3.1-pro-preview' | 
'google/gemini-3.5-flash' | 'google/gemma-4-26b-a4b-it' | 'google/gemma-4-31b-it' | 'inception/mercury-2' | 'inception/mercury-coder-small' | 'interfaze/interfaze-beta' | 'kwaipilot/kat-coder-pro-v1' | 'kwaipilot/kat-coder-pro-v2' | 'meituan/longcat-flash-chat' | 'meituan/longcat-flash-thinking-2601' | 'meta/llama-3.1-70b' | 'meta/llama-3.1-8b' | 'meta/llama-3.2-11b' | 'meta/llama-3.2-1b' | 'meta/llama-3.2-3b' | 'meta/llama-3.2-90b' | 'meta/llama-3.3-70b' | 'meta/llama-4-maverick' | 'meta/llama-4-scout' | 'minimax/minimax-m2' | 'minimax/minimax-m2.1' | 'minimax/minimax-m2.1-lightning' | 'minimax/minimax-m2.5' | 'minimax/minimax-m2.5-highspeed' | 'minimax/minimax-m2.7' | 'minimax/minimax-m2.7-highspeed' | 'minimax/minimax-m3' | 'mistral/codestral' | 'mistral/devstral-2' | 'mistral/devstral-small' | 'mistral/devstral-small-2' | 'mistral/magistral-medium' | 'mistral/magistral-small' | 'mistral/ministral-14b' | 'mistral/ministral-3b' | 'mistral/ministral-8b' | 'mistral/mistral-large-3' | 'mistral/mistral-medium' | 'mistral/mistral-medium-3.5' | 'mistral/mistral-nemo' | 'mistral/mistral-small' | 'mistral/pixtral-12b' | 'mistral/pixtral-large' | 'moonshotai/kimi-k2' | 'moonshotai/kimi-k2-thinking' | 'moonshotai/kimi-k2-thinking-turbo' | 'moonshotai/kimi-k2-turbo' | 'moonshotai/kimi-k2.5' | 'moonshotai/kimi-k2.6' | 'morph/morph-v3-fast' | 'morph/morph-v3-large' | 'nvidia/nemotron-3-nano-30b-a3b' | 'nvidia/nemotron-3-super-120b-a12b' | 'nvidia/nemotron-3-ultra-550b-a55b' | 'nvidia/nemotron-nano-12b-v2-vl' | 'nvidia/nemotron-nano-9b-v2' | 'openai/gpt-3.5-turbo' | 'openai/gpt-3.5-turbo-instruct' | 'openai/gpt-4-turbo' | 'openai/gpt-4.1' | 'openai/gpt-4.1-mini' | 'openai/gpt-4.1-nano' | 'openai/gpt-4o' | 'openai/gpt-4o-mini' | 'openai/gpt-4o-mini-search-preview' | 'openai/gpt-5' | 'openai/gpt-5-chat' | 'openai/gpt-5-codex' | 'openai/gpt-5-mini' | 'openai/gpt-5-nano' | 'openai/gpt-5-pro' | 'openai/gpt-5.1-codex' | 'openai/gpt-5.1-codex-max' | 'openai/gpt-5.1-codex-mini' | 
'openai/gpt-5.1-instant' | 'openai/gpt-5.1-thinking' | 'openai/gpt-5.2' | 'openai/gpt-5.2-chat' | 'openai/gpt-5.2-codex' | 'openai/gpt-5.2-pro' | 'openai/gpt-5.3-chat' | 'openai/gpt-5.3-codex' | 'openai/gpt-5.4' | 'openai/gpt-5.4-mini' | 'openai/gpt-5.4-nano' | 'openai/gpt-5.4-pro' | 'openai/gpt-5.5' | 'openai/gpt-5.5-pro' | 'openai/gpt-oss-120b' | 'openai/gpt-oss-20b' | 'openai/gpt-oss-safeguard-20b' | 'openai/o1' | 'openai/o3' | 'openai/o3-deep-research' | 'openai/o3-mini' | 'openai/o3-pro' | 'openai/o4-mini' | 'perplexity/sonar' | 'perplexity/sonar-pro' | 'perplexity/sonar-reasoning-pro' | 'stepfun/step-3.5-flash' | 'stepfun/step-3.7-flash' | 'xai/grok-4.1-fast-non-reasoning' | 'xai/grok-4.1-fast-reasoning' | 'xai/grok-4.20-multi-agent' | 'xai/grok-4.20-multi-agent-beta' | 'xai/grok-4.20-non-reasoning' | 'xai/grok-4.20-non-reasoning-beta' | 'xai/grok-4.20-reasoning' | 'xai/grok-4.20-reasoning-beta' | 'xai/grok-4.3' | 'xai/grok-build-0.1' | 'xiaomi/mimo-v2-flash' | 'xiaomi/mimo-v2-pro' | 'xiaomi/mimo-v2.5' | 'xiaomi/mimo-v2.5-pro' | 'zai/glm-4.5' | 'zai/glm-4.5-air' | 'zai/glm-4.5v' | 'zai/glm-4.6' | 'zai/glm-4.6v' | 'zai/glm-4.6v-flash' | 'zai/glm-4.7' | 'zai/glm-4.7-flash' | 'zai/glm-4.7-flashx' | 'zai/glm-5' | 'zai/glm-5-turbo' | 'zai/glm-5.1' | 'zai/glm-5v-turbo' | (string & {});
+/**
+ * Shared WebSocket subprotocol contract for AI Gateway realtime auth.
+ *
+ * The browser `WebSocket` API cannot set request headers, so the Gateway auth
+ * (bearer) token is carried through the `Sec-WebSocket-Protocol` handshake
+ * instead of an `Authorization` header — the same workaround OpenAI uses for
+ * `openai-insecure-api-key.<token>`.
+ *
+ * This module is the single source of truth for that contract so the client and
+ * the Gateway server can't drift: the client encodes values with
+ * `getGatewayRealtimeProtocols`, and the Gateway server decodes them with
+ * `getGatewayRealtimeAuthToken` / `getGatewayRealtimeTeamIdOrSlug`.
+ *
+ * WebSocket subprotocol values must fit the RFC token grammar. The auth token is
+ * sent as-is, so callers must use tokens that are valid subprotocol tokens; the
+ * optional team scope is base64url-encoded by this module. Keep the complete
+ * `Sec-WebSocket-Protocol` header compact (target under an 8 KiB safe header
+ * budget) because intermediaries may reject large upgrade headers.
+ */
+/**
+ * Marker subprotocol offered on every handshake so the Gateway can echo a
+ * negotiated subprotocol on the 101 response (some clients require the server to
+ * select one of the offered subprotocols).
+ */
+declare const GATEWAY_REALTIME_SUBPROTOCOL = "ai-gateway-realtime.v1";
+/** Subprotocol prefix that carries the Gateway auth (bearer) token. */
+declare const GATEWAY_AUTH_SUBPROTOCOL_PREFIX = "ai-gateway-auth.";
+/** Subprotocol prefix that carries optional Vercel team scoping. */
+declare const GATEWAY_TEAM_SUBPROTOCOL_PREFIX = "ai-gateway-team.";
+/**
+ * Client-side: build the WebSocket subprotocols that carry `token` to the
+ * Gateway. Pass the result as the second argument to `new WebSocket(url, ...)`.
+ */
+declare function getGatewayRealtimeProtocols(token: string, options?: {
+    teamIdOrSlug?: string;
+}): string[];
+/**
+ * Server-side: extract the Gateway auth (bearer) token from a
+ * `Sec-WebSocket-Protocol` header value, or `undefined` when it is absent or
+ * empty. The Gateway upgrade handler turns this into an
+ * `Authorization: Bearer <token>` before its normal auth path.
+ *
+ * Accepts the raw header value (subprotocols are comma-separated and may carry
+ * surrounding whitespace).
+ */
+declare function getGatewayRealtimeAuthToken(secWebSocketProtocol: string | null | undefined): string | undefined;
+/**
+ * Server-side: extract the optional Vercel team ID or slug from the
+ * `Sec-WebSocket-Protocol` header value. Team scoping is base64url-encoded so
+ * arbitrary team slugs stay within the WebSocket subprotocol token grammar.
+ */
+declare function getGatewayRealtimeTeamIdOrSlug(secWebSocketProtocol: string | null | undefined): string | undefined;
+type GatewayRealtimeModelId = string & {};
 type GatewayRerankingModelId = 'cohere/rerank-v3.5' | 'cohere/rerank-v4-fast' | 'cohere/rerank-v4-pro' | 'voyage/rerank-2.5' | 'voyage/rerank-2.5-lite' | (string & {});
 type GatewaySpeechModelId = string & {};
@@ -539,6 +594,11 @@ interface GatewayProvider extends ProviderV4 {
      * Creates a model for audio transcription.
      */
     transcriptionModel(modelId: GatewayTranscriptionModelId): TranscriptionModelV4;
+    /**
+     * Creates an experimental realtime model for bidirectional audio/text
+     * communication over WebSocket, normalized through the AI Gateway.
+     */
+    experimental_realtime: Experimental_RealtimeFactoryV4;
     /**
      * Gateway-specific tools executed server-side.
      */
@@ -579,24 +639,43 @@ interface GatewayProviderSettings {
 declare function createGateway(options?: GatewayProviderSettings): GatewayProvider;
 declare const gateway: GatewayProvider;
-declare const gatewayProviderOptions: _ai_sdk_provider_utils.LazySchema<{
-    only?: string[] | undefined;
-    order?: string[] | undefined;
-    sort?: "cost" | "ttft" | "tps" | undefined;
-    user?: string | undefined;
-    tags?: string[] | undefined;
-    models?: string[] | undefined;
-    byok?: Record<string, Record<string, unknown>[]> | undefined;
-    zeroDataRetention?: boolean | undefined;
-    disallowPromptTraining?: boolean | undefined;
-    hipaaCompliant?: boolean | undefined;
-    quotaEntityId?: string | undefined;
+type GatewayProviderOptions = {
+    /**
+     * Service-owned options may be added by the Gateway without requiring an SDK
+     * release. The Gateway service validates and applies the runtime schema.
+     */
+    [key: string]: unknown;
+    /** Request-scoped BYOK credentials to use instead of cached credentials. */
+    byok?: Record<string, Array<Record<string, unknown>>>;
+    /** Enables automatic caching behavior when supported by the Gateway. */
+    caching?: 'auto';
+    /** Filter to providers that do not train on prompt data. */
+    disallowPromptTraining?: boolean;
+    /** Filter to providers that are HIPAA compliant with Vercel AI Gateway. */
+    hipaaCompliant?: boolean;
+    /** Array of model slugs specifying fallback models to use in order. */
+    models?: string[];
+    /** Array of provider slugs that are the only ones allowed to be used. */
+    only?: string[];
+    /** Array of provider slugs specifying the provider attempt order. */
+    order?: string[];
+    /** Per-provider timeouts for BYOK credentials in milliseconds. */
     providerTimeouts?: {
-        byok?: Record<string, number> | undefined;
-    } | undefined;
-    serviceTier?: "flex" | "priority" | undefined;
-}>;
-type GatewayProviderOptions = InferSchema<typeof gatewayProviderOptions>;
+        byok?: Record<string, number>;
+    };
+    /** Entity identifier against which quota is tracked. */
+    quotaEntityId?: string;
+    /** Unified service tier intent. */
+    serviceTier?: 'flex' | 'priority';
+    /** Sort providers by a performance or cost metric before routing. */
+    sort?: 'cost' | 'tps' | 'ttft';
+    /** User-specified tags for reporting and filtering usage. */
+    tags?: string[];
+    /** End-user identifier for spend tracking and attribution. */
+    user?: string;
+    /** Filter to providers with zero data retention agreements. */
+    zeroDataRetention?: boolean;
+};
 declare const symbol$7: unique symbol;
 declare abstract class GatewayError extends Error {
@@ -774,4 +853,4 @@ declare class GatewayResponseError extends GatewayError {
 declare const VERSION: string;
-export { GatewayAuthenticationError, type GatewayCreditsResponse, GatewayError, type GatewayErrorResponse, GatewayFailedDependencyError, type GatewayGenerationInfo, type GatewayGenerationInfoParams, GatewayInternalServerError, GatewayInvalidRequestError, type GatewayLanguageModelEntry, type GatewayProviderOptions as GatewayLanguageModelOptions, type GatewayLanguageModelSpecification, type GatewayLanguageModelEntry as GatewayModelEntry, type GatewayModelId, GatewayModelNotFoundError, type GatewayProvider, type GatewayProviderOptions, type GatewayProviderSettings, GatewayRateLimitError, type GatewayRerankingModelId, GatewayResponseError, type GatewaySpeechModelId, type GatewaySpendReportParams, type GatewaySpendReportResponse, type GatewaySpendReportRow, type GatewayTranscriptionModelId, type GatewayVideoModelId, VERSION, createGateway, createGateway as createGatewayProvider, gateway };
+export { GATEWAY_AUTH_SUBPROTOCOL_PREFIX, GATEWAY_REALTIME_SUBPROTOCOL, GATEWAY_TEAM_SUBPROTOCOL_PREFIX, GatewayAuthenticationError, type GatewayCreditsResponse, GatewayError, type GatewayErrorResponse, GatewayFailedDependencyError, type GatewayGenerationInfo, type GatewayGenerationInfoParams, GatewayInternalServerError, GatewayInvalidRequestError, type GatewayLanguageModelEntry, type GatewayProviderOptions as GatewayLanguageModelOptions, type GatewayLanguageModelSpecification, type GatewayLanguageModelEntry as GatewayModelEntry, type GatewayModelId, GatewayModelNotFoundError, type GatewayProvider, type GatewayProviderOptions, type GatewayProviderSettings, GatewayRateLimitError, type GatewayRealtimeModelId, type GatewayRerankingModelId, GatewayResponseError, type GatewaySpeechModelId, type GatewaySpendReportParams, type GatewaySpendReportResponse, type GatewaySpendReportRow, type GatewayTranscriptionModelId, type GatewayVideoModelId, VERSION, createGateway, createGateway as createGatewayProvider, gateway, getGatewayRealtimeAuthToken, getGatewayRealtimeProtocols, getGatewayRealtimeTeamIdOrSlug };

package/dist/index.js CHANGED

@@ -1,3 +1,57 @@
+// src/gateway-realtime-auth.ts
+var GATEWAY_REALTIME_SUBPROTOCOL = "ai-gateway-realtime.v1";
+var GATEWAY_AUTH_SUBPROTOCOL_PREFIX = "ai-gateway-auth.";
+var GATEWAY_TEAM_SUBPROTOCOL_PREFIX = "ai-gateway-team.";
+function getGatewayRealtimeProtocols(token, options) {
+  const protocols = [
+    GATEWAY_REALTIME_SUBPROTOCOL,
+    `${GATEWAY_AUTH_SUBPROTOCOL_PREFIX}${token}`
+  ];
+  if (options == null ? void 0 : options.teamIdOrSlug) {
+    protocols.push(
+      `${GATEWAY_TEAM_SUBPROTOCOL_PREFIX}${encodeSubprotocolValue(options.teamIdOrSlug)}`
+    );
+  }
+  return protocols;
+}
+function getGatewayRealtimeAuthToken(secWebSocketProtocol) {
+  var _a10;
+  return ((_a10 = findProtocol(secWebSocketProtocol, GATEWAY_AUTH_SUBPROTOCOL_PREFIX)) == null ? void 0 : _a10.slice(
+    GATEWAY_AUTH_SUBPROTOCOL_PREFIX.length
+  )) || void 0;
+}
+function getGatewayRealtimeTeamIdOrSlug(secWebSocketProtocol) {
+  var _a10;
+  const encoded = (_a10 = findProtocol(
+    secWebSocketProtocol,
+    GATEWAY_TEAM_SUBPROTOCOL_PREFIX
+  )) == null ? void 0 : _a10.slice(GATEWAY_TEAM_SUBPROTOCOL_PREFIX.length);
+  if (!encoded) return void 0;
+  try {
+    return decodeSubprotocolValue(encoded) || void 0;
+  } catch (e) {
+    return void 0;
+  }
+}
+function findProtocol(secWebSocketProtocol, prefix) {
+  return secWebSocketProtocol == null ? void 0 : secWebSocketProtocol.split(",").map((protocol) => protocol.trim()).find((protocol) => protocol.startsWith(prefix));
+}
+function encodeSubprotocolValue(value) {
+  const bytes = new TextEncoder().encode(value);
+  let binary = "";
+  for (const byte of bytes) {
+    binary += String.fromCharCode(byte);
+  }
+  return btoa(binary).replace(/\+/g, "-").replace(/\//g, "_").replace(/=+$/u, "");
+}
+function decodeSubprotocolValue(value) {
+  const base64 = value.replace(/-/g, "+").replace(/_/g, "/");
+  const padding = "=".repeat((4 - base64.length % 4) % 4);
+  const binary = atob(`${base64}${padding}`);
+  const bytes = Uint8Array.from(binary, (char) => char.charCodeAt(0));
+  return new TextDecoder().decode(bytes);
+}
 // src/gateway-provider.ts
 import {
   loadOptionalSetting,
@@ -1801,6 +1855,55 @@ var gatewayTranscriptionResponseSchema = z13.object({
   providerMetadata: z13.record(z13.string(), providerMetadataEntrySchema4).optional()
 });
+// src/gateway-realtime-model.ts
+var GatewayRealtimeModel = class {
+  constructor(modelId, config) {
+    this.specificationVersion = "v4";
+    this.modelId = modelId;
+    this.provider = config.provider;
+    this.config = config;
+  }
+  /**
+   * Unlike providers with a dedicated ephemeral-secret endpoint (e.g. OpenAI),
+   * the Gateway v0 realtime path does not mint a new client secret. The returned
+   * token is the Gateway credential resolved by the provider (`apiKey`,
+   * `AI_GATEWAY_API_KEY`, or Vercel OIDC token) and the WebSocket upgrade is
+   * authenticated directly with that credential. The
+   * `RealtimeModelV4ClientSecretOptions` are therefore intentionally unused:
+   * `sessionConfig` is applied later via the normalized `session-update` event,
+   * and `expiresAfterSeconds` has no Gateway-side equivalent.
+   */
+  async doCreateClientSecret() {
+    const { token } = await this.config.getAuthToken();
+    return {
+      token,
+      url: toGatewayRealtimeUrl(this.config.baseURL, this.modelId)
+    };
+  }
+  getWebSocketConfig(options) {
+    return {
+      url: options.url,
+      protocols: getGatewayRealtimeProtocols(options.token, {
+        teamIdOrSlug: this.config.teamIdOrSlug
+      })
+    };
+  }
+  parseServerEvent(raw) {
+    return raw;
+  }
+  serializeClientEvent(event) {
+    return event;
+  }
+  buildSessionConfig(config) {
+    return config;
+  }
+};
+function toGatewayRealtimeUrl(baseURL, modelId) {
+  const url = new URL(`${baseURL.replace(/^http/, "ws")}/realtime-model`);
+  url.searchParams.set("ai-model-id", modelId);
+  return url.toString();
+}
 // src/tool/parallel-search.ts
 import {
   createProviderExecutedToolFactory,
@@ -2000,7 +2103,7 @@ async function getVercelRequestId() {
 }
 // src/version.ts
-var VERSION = true ? "4.0.0-canary.101" : "0.0.0-test";
+var VERSION = true ? "4.0.0-canary.103" : "0.0.0-test";
 // src/gateway-provider.ts
 var AI_GATEWAY_PROTOCOL_VERSION = "0.0.1";
@@ -2033,6 +2136,18 @@ function createGateway(options = {}) {
       });
     }
   };
+  const getRealtimeAuthToken = async () => {
+    try {
+      return await getGatewayAuthToken(options);
+    } catch (error) {
+      throw GatewayAuthenticationError.createContextualError({
+        apiKeyProvided: false,
+        oidcTokenProvided: false,
+        statusCode: 401,
+        cause: error
+      });
+    }
+  };
   const createO11yHeaders = () => {
     const deploymentId = loadOptionalSetting({
       settingValue: void 0,
@@ -2203,6 +2318,29 @@ function createGateway(options = {}) {
   };
   provider.transcriptionModel = createTranscriptionModel;
   provider.transcription = createTranscriptionModel;
+  const createRealtimeModel = (modelId) => {
+    assertGatewayRealtimeServerEnvironment();
+    return new GatewayRealtimeModel(modelId, {
+      provider: "gateway.realtime",
+      baseURL,
+      teamIdOrSlug: options.teamIdOrSlug,
+      getAuthToken: getRealtimeAuthToken
+    });
+  };
+  provider.experimental_realtime = Object.assign(
+    (modelId) => createRealtimeModel(modelId),
+    {
+      getToken: async (tokenOptions) => {
+        const model = createRealtimeModel(tokenOptions.model);
+        const secret = await model.doCreateClientSecret();
+        return {
+          token: secret.token,
+          url: secret.url,
+          ...secret.expiresAt != null && { expiresAt: secret.expiresAt }
+        };
+      }
+    }
+  );
   provider.chat = provider.languageModel;
   provider.embedding = provider.embeddingModel;
   provider.image = provider.imageModel;
@@ -2228,7 +2366,17 @@ async function getGatewayAuthToken(options) {
     authMethod: "oidc"
   };
 }
+function assertGatewayRealtimeServerEnvironment() {
+  if (typeof globalThis.window !== "undefined") {
+    throw new Error(
+      "AI Gateway realtime models cannot be used in browsers yet. Use gateway.experimental_realtime from server-side code only."
+    );
+  }
+}
 export {
+  GATEWAY_AUTH_SUBPROTOCOL_PREFIX,
+  GATEWAY_REALTIME_SUBPROTOCOL,
+  GATEWAY_TEAM_SUBPROTOCOL_PREFIX,
   GatewayAuthenticationError,
   GatewayError,
   GatewayFailedDependencyError,
@@ -2240,6 +2388,9 @@ export {
   VERSION,
   createGateway,
   createGateway as createGatewayProvider,
-  gateway
+  gateway,
+  getGatewayRealtimeAuthToken,
+  getGatewayRealtimeProtocols,
+  getGatewayRealtimeTeamIdOrSlug
 };
 //# sourceMappingURL=index.js.map