npm - @ai-sdk/provider - Versions diffs - 4.0.0-beta.13 → 4.0.0-beta.19 - Mend

@ai-sdk/provider 4.0.0-beta.13 → 4.0.0-beta.19

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (132) hide show

package/dist/index.d.ts CHANGED Viewed

@@ -1,6 +1,69 @@
 import { JSONSchema7 } from 'json-schema';
 export { JSONSchema7, JSONSchema7Definition } from 'json-schema';
+/**
+ * A mapping of provider names to provider-specific file identifiers.
+ *
+ * Provider references allow files to be identified across different
+ * providers without re-uploading, by storing each provider's own
+ * identifier for the same logical file.
+ *
+ * ```ts
+ * {
+ *   "openai": "file-abc123",
+ *   "anthropic": "file-xyz789"
+ * }
+ * ```
+ *
+ * The `type?: never` constraint excludes any object that has a `type`
+ * property, so a `SharedV4ProviderReference` cannot be confused with a
+ * tagged file-data shape (e.g. `{ type: 'data', data }` or
+ * `{ type: 'reference', reference }`) when both appear in the same union.
+ */
+type SharedV4ProviderReference = Record<string, string> & {
+    type?: never;
+};
+/**
+ * File data variant containing raw bytes (`Uint8Array`) or a base64-encoded
+ * string.
+ */
+interface SharedV4FileDataData {
+    type: 'data';
+    data: Uint8Array | string;
+}
+/**
+ * File data variant containing a URL that points to the file.
+ */
+interface SharedV4FileDataUrl {
+    type: 'url';
+    url: URL;
+}
+/**
+ * File data variant containing a provider reference (`{ [provider]: id }`).
+ */
+interface SharedV4FileDataReference {
+    type: 'reference';
+    reference: SharedV4ProviderReference;
+}
+/**
+ * File data variant containing inline text content (e.g. an inline text
+ * document).
+ */
+interface SharedV4FileDataText {
+    type: 'text';
+    text: string;
+}
+/**
+ * File data as a tagged discriminated union:
+ *
+ * - `{ type: 'data', data }`: raw bytes (`Uint8Array`) or base64-encoded string.
+ * - `{ type: 'url', url }`: a URL that points to the file.
+ * - `{ type: 'reference', reference }`: a provider reference (`{ [provider]: id }`).
+ * - `{ type: 'text', text }`: inline text content (e.g. an inline text document).
+ */
+type SharedV4FileData = SharedV4FileDataData | SharedV4FileDataUrl | SharedV4FileDataReference | SharedV4FileDataText;
 type SharedV4Headers = Record<string, string>;
 /**
@@ -59,22 +122,6 @@ type SharedV4ProviderMetadata = Record<string, JSONObject>;
  */
 type SharedV4ProviderOptions = Record<string, JSONObject>;
-/**
- * A mapping of provider names to provider-specific file identifiers.
- *
- * Provider references allow files to be identified across different
- * providers without re-uploading, by storing each provider's own
- * identifier for the same logical file.
- *
- * ```ts
- * {
- *   "openai": "file-abc123",
- *   "anthropic": "file-xyz789"
- * }
- * ```
- */
-type SharedV4ProviderReference = Record<string, string>;
 /**
  * Warning from the model.
  *
@@ -850,9 +897,12 @@ declare class UnsupportedFunctionalityError extends AISDKError {
  */
 type FilesV4UploadFileCallOptions = {
     /**
-     * The file data as raw bytes or a base64-encoded string.
+     * The file data.
+     *
+     * - `{ type: 'data', data }`: raw bytes (`Uint8Array`) or a base64-encoded string.
+     * - `{ type: 'text', text }`: inline text (UTF-8).
      */
-    data: Uint8Array | string;
+    data: SharedV4FileDataData | SharedV4FileDataText;
     /**
      * The IANA media type of the file (e.g. `'application/pdf'`).
      */
@@ -1655,11 +1705,6 @@ type LanguageModelV4FunctionTool = {
     providerOptions?: SharedV4ProviderOptions;
 };
-/**
- * Data content. Can be a Uint8Array, base64 encoded data as a string or a URL.
- */
-type LanguageModelV4DataContent = Uint8Array | string | URL;
 /**
  * A prompt is a list of messages.
  *
@@ -1728,9 +1773,12 @@ interface LanguageModelV4ReasoningPart {
 interface LanguageModelV4ReasoningFilePart {
     type: 'reasoning-file';
     /**
-     * File data. Can be a Uint8Array or base64 encoded data as a string.
+     * File data as a tagged discriminated union:
+     *
+     * - `{ type: 'data', data }`: raw bytes (Uint8Array) or base64-encoded string.
+     * - `{ type: 'url', url }`: a URL that points to the file.
      */
-    data: LanguageModelV4DataContent;
+    data: SharedV4FileDataData | SharedV4FileDataUrl;
     /**
      * IANA media type of the file.
      *
@@ -1771,14 +1819,23 @@ interface LanguageModelV4FilePart {
      */
     filename?: string;
     /**
-     * File data. Can be a Uint8Array, base64 encoded data as a string, a URL,
-     * or a provider reference mapping provider names to provider-specific file IDs.
+     * File data as a tagged discriminated union:
+     *
+     * - `{ type: 'data', data }`: raw bytes (Uint8Array) or base64-encoded string.
+     * - `{ type: 'url', url }`: a URL that points to the file.
+     * - `{ type: 'reference', reference }`: a provider reference (`{ [provider]: id }`).
+     * - `{ type: 'text', text }`: inline text content (e.g. an inline text document).
      */
-    data: LanguageModelV4DataContent | SharedV4ProviderReference;
+    data: SharedV4FileData;
     /**
-     * IANA media type of the file.
+     * Either a full IANA media type (`type/subtype`, e.g. `image/png`) or just
+     * the top-level IANA segment (e.g. `image`, `audio`, `video`, `text`).
      *
-     * Can support wildcards, e.g. `image/*` (in which case the provider needs to take appropriate action).
+     * `*`-subtype wildcards (e.g. `image/*`) are normalized as equivalent to the
+     * top-level segment alone (e.g. `image`). Providers can use the helpers in
+     * `@ai-sdk/provider-utils` (`isFullMediaType`, `getTopLevelMediaType`,
+     * `detectMediaType`) to resolve the field according to their API
+     * requirements.
      *
      * @see https://www.iana.org/assignments/media-types/media-types.xhtml
      */
@@ -1928,13 +1985,26 @@ type LanguageModelV4ToolResultOutput = {
          */
         providerOptions?: SharedV4ProviderOptions;
     } | {
-        type: 'file-data';
+        type: 'file';
         /**
-         * Base-64 encoded media data.
+         * File data as a tagged discriminated union:
+         *
+         * - `{ type: 'data', data }`: raw bytes (Uint8Array) or base64-encoded string.
+         * - `{ type: 'url', url }`: a URL that points to the file.
+         * - `{ type: 'reference', reference }`: a provider reference (`{ [provider]: id }`).
+         * - `{ type: 'text', text }`: inline text content (e.g. an inline text document).
          */
-        data: string;
+        data: SharedV4FileData;
         /**
-         * IANA media type.
+         * Either a full IANA media type (`type/subtype`, e.g. `image/png`) or just
+         * the top-level IANA segment (e.g. `image`, `audio`, `video`, `text`).
+         *
+         * `*`-subtype wildcards (e.g. `image/*`) are normalized as equivalent to the
+         * top-level segment alone (e.g. `image`). Providers can use the helpers in
+         * `@ai-sdk/provider-utils` (`isFullMediaType`, `getTopLevelMediaType`,
+         * `detectMediaType`) to resolve the field according to their API
+         * requirements.
+         *
          * @see https://www.iana.org/assignments/media-types/media-types.xhtml
          */
         mediaType: string;
@@ -1946,32 +2016,6 @@ type LanguageModelV4ToolResultOutput = {
          * Provider-specific options.
          */
         providerOptions?: SharedV4ProviderOptions;
-    } | {
-        type: 'file-url';
-        /**
-         * URL of the file.
-         */
-        url: string;
-        /**
-         * IANA media type.
-         * @see https://www.iana.org/assignments/media-types/media-types.xhtml
-         */
-        mediaType: string;
-        /**
-         * Provider-specific options.
-         */
-        providerOptions?: SharedV4ProviderOptions;
-    } | {
-        type: 'file-reference';
-        /**
-         * Provider-specific references for the file.
-         * The key is the provider name, e.g. 'openai' or 'anthropic'.
-         */
-        providerReference: SharedV4ProviderReference;
-        /**
-         * Provider-specific options.
-         */
-        providerOptions?: SharedV4ProviderOptions;
     } | {
         /**
          * Custom content part. This can be used to implement
@@ -2160,14 +2204,17 @@ type LanguageModelV4File = {
      */
     mediaType: string;
     /**
-     * Generated file data as base64 encoded strings or binary data.
+     * Generated file data as a tagged discriminated union:
+     *
+     * - `{ type: 'data', data }`: raw bytes (Uint8Array) or base64-encoded string.
+     * - `{ type: 'url', url }`: a URL that points to the file.
      *
      * The file data should be returned without any unnecessary conversion.
      * If the API returns base64 encoded strings, the file data should be returned
      * as base64 encoded strings. If the API returns binary data, the file data should
      * be returned as binary data.
      */
-    data: string | Uint8Array;
+    data: SharedV4FileDataData | SharedV4FileDataUrl;
     /**
      * Optional provider-specific metadata for the file part.
      */
@@ -2200,14 +2247,17 @@ type LanguageModelV4ReasoningFile = {
      */
     mediaType: string;
     /**
-     * Generated file data as base64 encoded strings or binary data.
+     * Generated file data as a tagged discriminated union:
+     *
+     * - `{ type: 'data', data }`: raw bytes (Uint8Array) or base64-encoded string.
+     * - `{ type: 'url', url }`: a URL that points to the file.
      *
      * The file data should be returned without any unnecessary conversion.
      * If the API returns base64 encoded strings, the file data should be returned
      * as base64 encoded strings. If the API returns binary data, the file data should
      * be returned as binary data.
      */
-    data: string | Uint8Array;
+    data: SharedV4FileDataData | SharedV4FileDataUrl;
     /**
      * Optional provider-specific metadata for the reasoning file part.
      */
@@ -5186,9 +5236,12 @@ interface SkillsV4File {
      */
     path: string;
     /**
-     * The content of the file, either as a base64 string or binary data.
+     * The file data.
+     *
+     * - `{ type: 'data', data }`: raw bytes (`Uint8Array`) or a base64-encoded string.
+     * - `{ type: 'text', text }`: inline text (UTF-8).
      */
-    content: string | Uint8Array;
+    data: SharedV4FileDataData | SharedV4FileDataText;
 }
 interface SkillsV4UploadSkillCallOptions {
     /**
@@ -6139,6 +6192,512 @@ interface ProviderV2 {
     speechModel?(modelId: string): SpeechModelV2;
 }
+/**
+ * A tool definition for realtime models. Sent as part of the session
+ * configuration so the model knows which functions it can call.
+ */
+type RealtimeModelV4ToolDefinition = {
+    /**
+     * The type of the tool (always 'function').
+     */
+    type: 'function';
+    /**
+     * The name of the tool. Unique within the session.
+     */
+    name: string;
+    /**
+     * A description of what the tool does. The model uses this to decide
+     * whether to call the tool.
+     */
+    description?: string;
+    /**
+     * JSON Schema describing the parameters the tool expects.
+     */
+    parameters: JSONSchema7;
+};
+/**
+ * Provider-neutral configuration for a realtime session.
+ * Each provider maps this to their specific session.update payload.
+ */
+type RealtimeModelV4SessionConfig = {
+    /**
+     * System instructions for the model.
+     */
+    instructions?: string;
+    /**
+     * Voice to use for audio output.
+     */
+    voice?: string;
+    /**
+     * Which output modalities the model should produce.
+     */
+    outputModalities?: Array<'text' | 'audio'>;
+    /**
+     * Audio format configuration for input audio.
+     */
+    inputAudioFormat?: {
+        /**
+         * Audio format type (e.g. "audio/pcm", "audio/pcmu", "audio/pcma").
+         */
+        type: string;
+        /**
+         * Sample rate in Hz. Only applicable for PCM format.
+         */
+        rate?: number;
+    };
+    /**
+     * Input audio transcription configuration.
+     *
+     * When enabled, providers that support input transcription emit normalized
+     * `input-transcription-completed` events that can be rendered as user
+     * messages.
+     */
+    inputAudioTranscription?: {
+        /**
+         * Provider-specific transcription model.
+         */
+        model?: string;
+        /**
+         * Optional language hint for the input audio.
+         */
+        language?: string;
+        /**
+         * Optional prompt to guide transcription.
+         */
+        prompt?: string;
+    };
+    /**
+     * Output audio transcription configuration.
+     *
+     * When enabled, providers that support output transcription emit normalized
+     * `audio-transcript-delta` / `audio-transcript-done` events for the model's
+     * spoken response. Some providers transcribe output by default; setting this
+     * makes the behavior explicit rather than relying on that default.
+     */
+    outputAudioTranscription?: {
+        /**
+         * Provider-specific transcription model.
+         */
+        model?: string;
+        /**
+         * Optional language hint for the output audio.
+         */
+        language?: string;
+        /**
+         * Optional prompt to guide transcription.
+         */
+        prompt?: string;
+    };
+    /**
+     * Audio format configuration for output audio.
+     */
+    outputAudioFormat?: {
+        /**
+         * Audio format type (e.g. "audio/pcm", "audio/pcmu", "audio/pcma").
+         */
+        type: string;
+        /**
+         * Sample rate in Hz. Only applicable for PCM format.
+         */
+        rate?: number;
+    };
+    /**
+     * Voice activity detection configuration.
+     * Set to null or type 'disabled' to turn off VAD (push-to-talk mode).
+     */
+    turnDetection?: {
+        /**
+         * VAD mode. 'server-vad' for automatic detection,
+         * 'semantic-vad' for OpenAI's semantic detection,
+         * 'disabled' to turn off VAD.
+         */
+        type: 'server-vad' | 'semantic-vad' | 'disabled';
+        /**
+         * VAD activation threshold (0.0-1.0).
+         * Higher values require louder audio to trigger.
+         */
+        threshold?: number;
+        /**
+         * How long the user must be silent (in ms) before
+         * the server ends the turn.
+         */
+        silenceDurationMs?: number;
+        /**
+         * Amount of audio (in ms) to include before the
+         * detected start of speech.
+         */
+        prefixPaddingMs?: number;
+    } | null;
+    /**
+     * Tool definitions available to the model in this session.
+     */
+    tools?: RealtimeModelV4ToolDefinition[];
+    /**
+     * Provider-specific options that are passed through to the provider.
+     */
+    providerOptions?: Record<string, unknown>;
+};
+/**
+ * Options for creating an ephemeral client secret for browser-side
+ * WebSocket connections to a realtime model.
+ */
+type RealtimeModelV4ClientSecretOptions = {
+    /**
+     * Number of seconds until the client secret expires.
+     */
+    expiresAfterSeconds?: number;
+    /**
+     * Optional session configuration to embed in the token request.
+     * Some providers (e.g. Google) require the full session config at token creation time.
+     */
+    sessionConfig?: RealtimeModelV4SessionConfig;
+};
+/**
+ * Result of creating an ephemeral client secret.
+ */
+type RealtimeModelV4ClientSecretResult = {
+    /**
+     * The ephemeral token value. Used as a Bearer token or in the
+     * WebSocket subprotocol header for authentication.
+     */
+    token: string;
+    /**
+     * The WebSocket URL to connect to. Includes any provider-specific
+     * query parameters (e.g. model ID).
+     */
+    url: string;
+    /**
+     * Unix timestamp (seconds) when this client secret expires.
+     */
+    expiresAt?: number;
+};
+/**
+ * A conversation item that can be created by the client and sent to
+ * the model via the conversation.item.create event.
+ */
+type RealtimeModelV4ConversationItem = RealtimeModelV4TextMessage | RealtimeModelV4AudioMessage | RealtimeModelV4FunctionCallOutput;
+/**
+ * A text message from the user.
+ */
+type RealtimeModelV4TextMessage = {
+    type: 'text-message';
+    role: 'user';
+    text: string;
+};
+/**
+ * An audio message from the user (complete audio, not streamed).
+ */
+type RealtimeModelV4AudioMessage = {
+    type: 'audio-message';
+    role: 'user';
+    /**
+     * Base64-encoded audio data.
+     */
+    audio: string;
+};
+/**
+ * The output of a function call, sent back to the model so it can
+ * continue generating a response using the tool result.
+ */
+type RealtimeModelV4FunctionCallOutput = {
+    type: 'function-call-output';
+    /**
+     * The call ID from the function-call-arguments-done event.
+     * Must match so the model knows which function call this result is for.
+     */
+    callId: string;
+    /**
+     * The name of the function that was called.
+     * Required by some providers (e.g. Google) in the tool response routing.
+     */
+    name?: string;
+    /**
+     * JSON string containing the function call result.
+     */
+    output: string;
+};
+/**
+ * Normalized events sent from the browser to the realtime model.
+ * Each provider maps this to its native event format before sending
+ * over the WebSocket.
+ */
+type RealtimeModelV4ClientEvent = {
+    type: 'session-update';
+    config: RealtimeModelV4SessionConfig;
+} | {
+    type: 'input-audio-append';
+    /**
+     * Base64-encoded audio chunk to append to the input buffer.
+     */
+    audio: string;
+} | {
+    type: 'input-audio-commit';
+} | {
+    type: 'input-audio-clear';
+} | {
+    type: 'conversation-item-create';
+    item: RealtimeModelV4ConversationItem;
+} | {
+    type: 'conversation-item-truncate';
+    /**
+     * The ID of the assistant message item to truncate.
+     */
+    itemId: string;
+    /**
+     * The index of the content part to truncate.
+     */
+    contentIndex: number;
+    /**
+     * Truncate audio after this many milliseconds.
+     */
+    audioEndMs: number;
+} | {
+    type: 'response-create';
+    options?: {
+        modalities?: string[];
+        instructions?: string;
+        metadata?: Record<string, unknown>;
+    };
+} | {
+    type: 'response-cancel';
+};
+/**
+ * Normalized events emitted by the realtime model (model → browser).
+ * Each provider maps its native event format to this discriminated union.
+ *
+ * Every event includes a `raw` field with the original provider-specific
+ * event data for debugging and provider-specific access.
+ */
+type RealtimeModelV4ServerEvent = {
+    type: 'session-created';
+    sessionId?: string;
+    raw: unknown;
+} | {
+    type: 'session-updated';
+    raw: unknown;
+} | {
+    type: 'speech-started';
+    itemId?: string;
+    raw: unknown;
+} | {
+    type: 'speech-stopped';
+    itemId?: string;
+    raw: unknown;
+} | {
+    type: 'audio-committed';
+    itemId?: string;
+    previousItemId?: string;
+    raw: unknown;
+} | {
+    type: 'conversation-item-added';
+    itemId: string;
+    item: unknown;
+    raw: unknown;
+} | {
+    type: 'input-transcription-completed';
+    itemId: string;
+    transcript: string;
+    raw: unknown;
+} | {
+    type: 'response-created';
+    responseId: string;
+    raw: unknown;
+} | {
+    type: 'response-done';
+    responseId: string;
+    status: string;
+    raw: unknown;
+} | {
+    type: 'output-item-added';
+    responseId: string;
+    itemId: string;
+    raw: unknown;
+} | {
+    type: 'output-item-done';
+    responseId: string;
+    itemId: string;
+    raw: unknown;
+} | {
+    type: 'content-part-added';
+    responseId: string;
+    itemId: string;
+    raw: unknown;
+} | {
+    type: 'content-part-done';
+    responseId: string;
+    itemId: string;
+    raw: unknown;
+} | {
+    type: 'audio-delta';
+    responseId: string;
+    itemId: string;
+    /**
+     * Base64-encoded audio chunk.
+     */
+    delta: string;
+    raw: unknown;
+} | {
+    type: 'audio-done';
+    responseId: string;
+    itemId: string;
+    raw: unknown;
+} | {
+    type: 'audio-transcript-delta';
+    responseId: string;
+    itemId: string;
+    /**
+     * Text chunk of the audio transcript.
+     */
+    delta: string;
+    raw: unknown;
+} | {
+    type: 'audio-transcript-done';
+    responseId: string;
+    itemId: string;
+    transcript?: string;
+    raw: unknown;
+} | {
+    type: 'text-delta';
+    responseId: string;
+    itemId: string;
+    /**
+     * Text chunk of the model's text response.
+     */
+    delta: string;
+    raw: unknown;
+} | {
+    type: 'text-done';
+    responseId: string;
+    itemId: string;
+    text?: string;
+    raw: unknown;
+} | {
+    type: 'function-call-arguments-delta';
+    responseId: string;
+    itemId: string;
+    callId: string;
+    /**
+     * Partial JSON string of function call arguments.
+     */
+    delta: string;
+    raw: unknown;
+} | {
+    type: 'function-call-arguments-done';
+    responseId: string;
+    itemId: string;
+    callId: string;
+    /**
+     * The name of the function to call.
+     */
+    name: string;
+    /**
+     * Complete JSON string of function call arguments.
+     */
+    arguments: string;
+    raw: unknown;
+} | {
+    type: 'error';
+    message: string;
+    code?: string;
+    raw: unknown;
+} | {
+    type: 'custom';
+    /**
+     * The original event type string from the provider.
+     */
+    rawType: string;
+    raw: unknown;
+};
+/**
+ * Specification for a realtime model that supports bidirectional
+ * audio/text communication over WebSocket.
+ *
+ * Providers implement this interface to enable realtime voice
+ * conversations through the AI SDK.
+ */
+type RealtimeModelV4 = {
+    /**
+     * The realtime model must specify which interface version it implements.
+     */
+    readonly specificationVersion: 'v4';
+    /**
+     * Provider ID (e.g. 'openai', 'xai').
+     */
+    readonly provider: string;
+    /**
+     * Provider-specific model ID (e.g. 'gpt-4o-realtime', 'grok-3').
+     */
+    readonly modelId: string;
+    /**
+     * Server-side: Creates an ephemeral client secret for authenticating
+     * browser-side WebSocket connections. The secret is short-lived and
+     * safe to expose to client code.
+     *
+     * Naming: "do" prefix to prevent accidental direct usage by the user.
+     */
+    doCreateClientSecret(options: RealtimeModelV4ClientSecretOptions): PromiseLike<RealtimeModelV4ClientSecretResult>;
+    /**
+     * Browser-side: Returns the WebSocket URL and subprotocols to use
+     * when connecting. Each provider has its own authentication mechanism
+     * (e.g. OpenAI uses subprotocol headers, xAI may use query params).
+     */
+    getWebSocketConfig(options: {
+        token: string;
+        url: string;
+    }): {
+        url: string;
+        protocols?: string[];
+    };
+    /**
+     * Browser-side: Parses a raw JSON event received over the WebSocket
+     * and returns one or more normalized events. Providers map their native
+     * event format to the common RealtimeModelV4ServerEvent union.
+     *
+     * Returns an array when a single provider message maps to multiple
+     * normalized events (e.g. Google's serverContent can contain audio,
+     * text, and turn-complete data in one message).
+     */
+    parseServerEvent(raw: unknown): RealtimeModelV4ServerEvent | RealtimeModelV4ServerEvent[];
+    /**
+     * Browser-side: Serializes a normalized client event into the
+     * provider's native JSON format for sending over the WebSocket.
+     */
+    serializeClientEvent(event: RealtimeModelV4ClientEvent): unknown | PromiseLike<unknown>;
+    /**
+     * Browser-side: Builds the provider-specific session configuration
+     * payload from a normalized session config. Used to construct the
+     * session.update event sent after WebSocket connection.
+     */
+    buildSessionConfig(config: RealtimeModelV4SessionConfig): unknown;
+    /**
+     * Browser-side: Returns a message to auto-send back over the WebSocket
+     * in response to a raw incoming message, or null if no response is needed.
+     *
+     * Used for provider-specific keepalive protocols (e.g. ping/pong).
+     * Called by the session layer before parseServerEvent.
+     */
+    getHealthCheckResponse?(raw: unknown): unknown | null;
+};
+type RealtimeFactoryV4GetTokenOptions = {
+    model: string;
+} & RealtimeModelV4ClientSecretOptions;
+type RealtimeFactoryV4GetTokenResult = {
+    token: string;
+    url: string;
+    expiresAt?: number;
+};
+interface RealtimeFactoryV4 {
+    (modelId: string): RealtimeModelV4;
+    getToken(options: RealtimeFactoryV4GetTokenOptions): Promise<RealtimeFactoryV4GetTokenResult>;
+}
 /**
  * A video or image file that can be used for video editing or image-to-video generation.
  * Supports both image inputs (for image-to-video) and video inputs (for editing).
@@ -6576,4 +7135,4 @@ type VideoModelV3 = {
     }>;
 };
-export { AISDKError, APICallError, type EmbeddingModelV2, type EmbeddingModelV2Embedding, type EmbeddingModelV3, type EmbeddingModelV3CallOptions, type EmbeddingModelV3Embedding, type EmbeddingModelV3Middleware, type EmbeddingModelV3Result, type EmbeddingModelV4, type EmbeddingModelV4CallOptions, type EmbeddingModelV4Embedding, type EmbeddingModelV4Middleware, type EmbeddingModelV4Result, EmptyResponseBodyError, type VideoModelV3 as Experimental_VideoModelV3, type VideoModelV3CallOptions as Experimental_VideoModelV3CallOptions, type VideoModelV3File as Experimental_VideoModelV3File, type VideoModelV3VideoData as Experimental_VideoModelV3VideoData, type VideoModelV4 as Experimental_VideoModelV4, type VideoModelV4CallOptions as Experimental_VideoModelV4CallOptions, type VideoModelV4File as Experimental_VideoModelV4File, type VideoModelV4Result as Experimental_VideoModelV4Result, type VideoModelV4VideoData as Experimental_VideoModelV4VideoData, type FilesV4, type FilesV4UploadFileCallOptions, type FilesV4UploadFileResult, type ImageModelV2, type ImageModelV2CallOptions, type ImageModelV2CallWarning, type ImageModelV2ProviderMetadata, type ImageModelV3, type ImageModelV3CallOptions, type ImageModelV3File, type ImageModelV3Middleware, type ImageModelV3ProviderMetadata, type ImageModelV3Usage, type ImageModelV4, type ImageModelV4CallOptions, type ImageModelV4File, type ImageModelV4Middleware, type ImageModelV4ProviderMetadata, type ImageModelV4Result, type ImageModelV4Usage, InvalidArgumentError, InvalidPromptError, InvalidResponseDataError, type JSONArray, type JSONObject, JSONParseError, type JSONValue, type LanguageModelV2, type LanguageModelV2CallOptions, type LanguageModelV2CallWarning, type LanguageModelV2Content, type LanguageModelV2DataContent, type LanguageModelV2File, type LanguageModelV2FilePart, type LanguageModelV2FinishReason, type LanguageModelV2FunctionTool, type LanguageModelV2Message, type LanguageModelV2Middleware, type LanguageModelV2Prompt, type LanguageModelV2ProviderDefinedTool, type LanguageModelV2Reasoning, type LanguageModelV2ReasoningPart, type LanguageModelV2ResponseMetadata, type LanguageModelV2Source, type LanguageModelV2StreamPart, type LanguageModelV2Text, type LanguageModelV2TextPart, type LanguageModelV2ToolCall, type LanguageModelV2ToolCallPart, type LanguageModelV2ToolChoice, type LanguageModelV2ToolResultOutput, type LanguageModelV2ToolResultPart, type LanguageModelV2Usage, type LanguageModelV3, type LanguageModelV3CallOptions, type LanguageModelV3Content, type LanguageModelV3DataContent, type LanguageModelV3File, type LanguageModelV3FilePart, type LanguageModelV3FinishReason, type LanguageModelV3FunctionTool, type LanguageModelV3GenerateResult, type LanguageModelV3Message, type LanguageModelV3Middleware, type LanguageModelV3Prompt, type LanguageModelV3ProviderTool, type LanguageModelV3Reasoning, type LanguageModelV3ReasoningPart, type LanguageModelV3ResponseMetadata, type LanguageModelV3Source, type LanguageModelV3StreamPart, type LanguageModelV3StreamResult, type LanguageModelV3Text, type LanguageModelV3TextPart, type LanguageModelV3ToolApprovalRequest, type LanguageModelV3ToolApprovalResponsePart, type LanguageModelV3ToolCall, type LanguageModelV3ToolCallPart, type LanguageModelV3ToolChoice, type LanguageModelV3ToolResult, type LanguageModelV3ToolResultOutput, type LanguageModelV3ToolResultPart, type LanguageModelV3Usage, type LanguageModelV4, type LanguageModelV4CallOptions, type LanguageModelV4Content, type LanguageModelV4CustomContent, type LanguageModelV4CustomPart, type LanguageModelV4DataContent, type LanguageModelV4File, type LanguageModelV4FilePart, type LanguageModelV4FinishReason, type LanguageModelV4FunctionTool, type LanguageModelV4GenerateResult, type LanguageModelV4Message, type LanguageModelV4Middleware, type LanguageModelV4Prompt, type LanguageModelV4ProviderTool, type LanguageModelV4Reasoning, type LanguageModelV4ReasoningFile, type LanguageModelV4ReasoningFilePart, type LanguageModelV4ReasoningPart, type LanguageModelV4ResponseMetadata, type LanguageModelV4Source, type LanguageModelV4StreamPart, type LanguageModelV4StreamResult, type LanguageModelV4Text, type LanguageModelV4TextPart, type LanguageModelV4ToolApprovalRequest, type LanguageModelV4ToolApprovalResponsePart, type LanguageModelV4ToolCall, type LanguageModelV4ToolCallPart, type LanguageModelV4ToolChoice, type LanguageModelV4ToolResult, type LanguageModelV4ToolResultOutput, type LanguageModelV4ToolResultPart, type LanguageModelV4Usage, LoadAPIKeyError, LoadSettingError, NoContentGeneratedError, NoSuchModelError, NoSuchProviderReferenceError, type ProviderV2, type ProviderV3, type ProviderV4, type RerankingModelV3, type RerankingModelV3CallOptions, type RerankingModelV4, type RerankingModelV4CallOptions, type RerankingModelV4Result, type SharedV2Headers, type SharedV2ProviderMetadata, type SharedV2ProviderOptions, type SharedV3Headers, type SharedV3ProviderMetadata, type SharedV3ProviderOptions, type SharedV3Warning, type SharedV4Headers, type SharedV4ProviderMetadata, type SharedV4ProviderOptions, type SharedV4ProviderReference, type SharedV4Warning, type SkillsV4, type SkillsV4File, type SkillsV4UploadSkillCallOptions, type SkillsV4UploadSkillResult, type SpeechModelV2, type SpeechModelV2CallOptions, type SpeechModelV2CallWarning, type SpeechModelV3, type SpeechModelV3CallOptions, type SpeechModelV4, type SpeechModelV4CallOptions, type SpeechModelV4Result, TooManyEmbeddingValuesForCallError, type TranscriptionModelV2, type TranscriptionModelV2CallOptions, type TranscriptionModelV2CallWarning, type TranscriptionModelV3, type TranscriptionModelV3CallOptions, type TranscriptionModelV4, type TranscriptionModelV4CallOptions, type TranscriptionModelV4Result, type TypeValidationContext, TypeValidationError, UnsupportedFunctionalityError, getErrorMessage, isJSONArray, isJSONObject, isJSONValue };
+export { AISDKError, APICallError, type EmbeddingModelV2, type EmbeddingModelV2Embedding, type EmbeddingModelV3, type EmbeddingModelV3CallOptions, type EmbeddingModelV3Embedding, type EmbeddingModelV3Middleware, type EmbeddingModelV3Result, type EmbeddingModelV4, type EmbeddingModelV4CallOptions, type EmbeddingModelV4Embedding, type EmbeddingModelV4Middleware, type EmbeddingModelV4Result, EmptyResponseBodyError, type RealtimeFactoryV4 as Experimental_RealtimeFactoryV4, type RealtimeFactoryV4GetTokenOptions as Experimental_RealtimeFactoryV4GetTokenOptions, type RealtimeFactoryV4GetTokenResult as Experimental_RealtimeFactoryV4GetTokenResult, type RealtimeModelV4 as Experimental_RealtimeModelV4, type RealtimeModelV4AudioMessage as Experimental_RealtimeModelV4AudioMessage, type RealtimeModelV4ClientEvent as Experimental_RealtimeModelV4ClientEvent, type RealtimeModelV4ClientSecretOptions as Experimental_RealtimeModelV4ClientSecretOptions, type RealtimeModelV4ClientSecretResult as Experimental_RealtimeModelV4ClientSecretResult, type RealtimeModelV4ConversationItem as Experimental_RealtimeModelV4ConversationItem, type RealtimeModelV4FunctionCallOutput as Experimental_RealtimeModelV4FunctionCallOutput, type RealtimeModelV4ServerEvent as Experimental_RealtimeModelV4ServerEvent, type RealtimeModelV4SessionConfig as Experimental_RealtimeModelV4SessionConfig, type RealtimeModelV4TextMessage as Experimental_RealtimeModelV4TextMessage, type RealtimeModelV4ToolDefinition as Experimental_RealtimeModelV4ToolDefinition, type VideoModelV3 as Experimental_VideoModelV3, type VideoModelV3CallOptions as Experimental_VideoModelV3CallOptions, type VideoModelV3File as Experimental_VideoModelV3File, type VideoModelV3VideoData as Experimental_VideoModelV3VideoData, type VideoModelV4 as Experimental_VideoModelV4, type VideoModelV4CallOptions as Experimental_VideoModelV4CallOptions, type VideoModelV4File as Experimental_VideoModelV4File, type VideoModelV4Result as Experimental_VideoModelV4Result, type VideoModelV4VideoData as Experimental_VideoModelV4VideoData, type FilesV4, type FilesV4UploadFileCallOptions, type FilesV4UploadFileResult, type ImageModelV2, type ImageModelV2CallOptions, type ImageModelV2CallWarning, type ImageModelV2ProviderMetadata, type ImageModelV3, type ImageModelV3CallOptions, type ImageModelV3File, type ImageModelV3Middleware, type ImageModelV3ProviderMetadata, type ImageModelV3Usage, type ImageModelV4, type ImageModelV4CallOptions, type ImageModelV4File, type ImageModelV4Middleware, type ImageModelV4ProviderMetadata, type ImageModelV4Result, type ImageModelV4Usage, InvalidArgumentError, InvalidPromptError, InvalidResponseDataError, type JSONArray, type JSONObject, JSONParseError, type JSONValue, type LanguageModelV2, type LanguageModelV2CallOptions, type LanguageModelV2CallWarning, type LanguageModelV2Content, type LanguageModelV2DataContent, type LanguageModelV2File, type LanguageModelV2FilePart, type LanguageModelV2FinishReason, type LanguageModelV2FunctionTool, type LanguageModelV2Message, type LanguageModelV2Middleware, type LanguageModelV2Prompt, type LanguageModelV2ProviderDefinedTool, type LanguageModelV2Reasoning, type LanguageModelV2ReasoningPart, type LanguageModelV2ResponseMetadata, type LanguageModelV2Source, type LanguageModelV2StreamPart, type LanguageModelV2Text, type LanguageModelV2TextPart, type LanguageModelV2ToolCall, type LanguageModelV2ToolCallPart, type LanguageModelV2ToolChoice, type LanguageModelV2ToolResultOutput, type LanguageModelV2ToolResultPart, type LanguageModelV2Usage, type LanguageModelV3, type LanguageModelV3CallOptions, type LanguageModelV3Content, type LanguageModelV3DataContent, type LanguageModelV3File, type LanguageModelV3FilePart, type LanguageModelV3FinishReason, type LanguageModelV3FunctionTool, type LanguageModelV3GenerateResult, type LanguageModelV3Message, type LanguageModelV3Middleware, type LanguageModelV3Prompt, type LanguageModelV3ProviderTool, type LanguageModelV3Reasoning, type LanguageModelV3ReasoningPart, type LanguageModelV3ResponseMetadata, type LanguageModelV3Source, type LanguageModelV3StreamPart, type LanguageModelV3StreamResult, type LanguageModelV3Text, type LanguageModelV3TextPart, type LanguageModelV3ToolApprovalRequest, type LanguageModelV3ToolApprovalResponsePart, type LanguageModelV3ToolCall, type LanguageModelV3ToolCallPart, type LanguageModelV3ToolChoice, type LanguageModelV3ToolResult, type LanguageModelV3ToolResultOutput, type LanguageModelV3ToolResultPart, type LanguageModelV3Usage, type LanguageModelV4, type LanguageModelV4CallOptions, type LanguageModelV4Content, type LanguageModelV4CustomContent, type LanguageModelV4CustomPart, type LanguageModelV4File, type LanguageModelV4FilePart, type LanguageModelV4FinishReason, type LanguageModelV4FunctionTool, type LanguageModelV4GenerateResult, type LanguageModelV4Message, type LanguageModelV4Middleware, type LanguageModelV4Prompt, type LanguageModelV4ProviderTool, type LanguageModelV4Reasoning, type LanguageModelV4ReasoningFile, type LanguageModelV4ReasoningFilePart, type LanguageModelV4ReasoningPart, type LanguageModelV4ResponseMetadata, type LanguageModelV4Source, type LanguageModelV4StreamPart, type LanguageModelV4StreamResult, type LanguageModelV4Text, type LanguageModelV4TextPart, type LanguageModelV4ToolApprovalRequest, type LanguageModelV4ToolApprovalResponsePart, type LanguageModelV4ToolCall, type LanguageModelV4ToolCallPart, type LanguageModelV4ToolChoice, type LanguageModelV4ToolResult, type LanguageModelV4ToolResultOutput, type LanguageModelV4ToolResultPart, type LanguageModelV4Usage, LoadAPIKeyError, LoadSettingError, NoContentGeneratedError, NoSuchModelError, NoSuchProviderReferenceError, type ProviderV2, type ProviderV3, type ProviderV4, type RerankingModelV3, type RerankingModelV3CallOptions, type RerankingModelV4, type RerankingModelV4CallOptions, type RerankingModelV4Result, type SharedV2Headers, type SharedV2ProviderMetadata, type SharedV2ProviderOptions, type SharedV3Headers, type SharedV3ProviderMetadata, type SharedV3ProviderOptions, type SharedV3Warning, type SharedV4FileData, type SharedV4FileDataData, type SharedV4FileDataReference, type SharedV4FileDataText, type SharedV4FileDataUrl, type SharedV4Headers, type SharedV4ProviderMetadata, type SharedV4ProviderOptions, type SharedV4ProviderReference, type SharedV4Warning, type SkillsV4, type SkillsV4File, type SkillsV4UploadSkillCallOptions, type SkillsV4UploadSkillResult, type SpeechModelV2, type SpeechModelV2CallOptions, type SpeechModelV2CallWarning, type SpeechModelV3, type SpeechModelV3CallOptions, type SpeechModelV4, type SpeechModelV4CallOptions, type SpeechModelV4Result, TooManyEmbeddingValuesForCallError, type TranscriptionModelV2, type TranscriptionModelV2CallOptions, type TranscriptionModelV2CallWarning, type TranscriptionModelV3, type TranscriptionModelV3CallOptions, type TranscriptionModelV4, type TranscriptionModelV4CallOptions, type TranscriptionModelV4Result, type TypeValidationContext, TypeValidationError, UnsupportedFunctionalityError, getErrorMessage, isJSONArray, isJSONObject, isJSONValue };