ai 4.3.1 → 4.3.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +18 -0
- package/dist/index.d.mts +134 -3
- package/dist/index.d.ts +134 -3
- package/dist/index.js +156 -24
- package/dist/index.js.map +1 -1
- package/dist/index.mjs +145 -14
- package/dist/index.mjs.map +1 -1
- package/mcp-stdio/dist/index.js +1 -1
- package/mcp-stdio/dist/index.js.map +1 -1
- package/mcp-stdio/dist/index.mjs +1 -1
- package/mcp-stdio/dist/index.mjs.map +1 -1
- package/mcp-stdio/get-environment.test.ts +13 -0
- package/mcp-stdio/get-environment.ts +1 -1
- package/package.json +5 -5
- package/rsc/dist/rsc-server.mjs +12 -6
- package/rsc/dist/rsc-server.mjs.map +1 -1
package/CHANGELOG.md
CHANGED
@@ -1,5 +1,23 @@
|
|
1
1
|
# ai
|
2
2
|
|
3
|
+
## 4.3.3
|
4
|
+
|
5
|
+
### Patch Changes
|
6
|
+
|
7
|
+
- 3e88f4d: fix (ai/mcp): prevent mutation of customEnv
|
8
|
+
- c21fa6d: feat: add transcription with experimental_transcribe
|
9
|
+
- Updated dependencies [c21fa6d]
|
10
|
+
- @ai-sdk/provider-utils@2.2.5
|
11
|
+
- @ai-sdk/provider@1.1.1
|
12
|
+
- @ai-sdk/react@1.2.7
|
13
|
+
- @ai-sdk/ui-utils@1.2.6
|
14
|
+
|
15
|
+
## 4.3.2
|
16
|
+
|
17
|
+
### Patch Changes
|
18
|
+
|
19
|
+
- 665a567: fix (core): improve error handling in streamText's consumeStream method
|
20
|
+
|
3
21
|
## 4.3.1
|
4
22
|
|
5
23
|
### Patch Changes
|
package/dist/index.d.mts
CHANGED
@@ -2,7 +2,7 @@ import { IDGenerator } from '@ai-sdk/provider-utils';
|
|
2
2
|
export { CoreToolCall, CoreToolResult, IDGenerator, ToolCall, ToolResult, createIdGenerator, generateId } from '@ai-sdk/provider-utils';
|
3
3
|
import { DataStreamString, Message, Schema, DeepPartial, JSONValue as JSONValue$1, AssistantMessage, DataMessage } from '@ai-sdk/ui-utils';
|
4
4
|
export { AssistantMessage, AssistantStatus, Attachment, ChatRequest, ChatRequestOptions, CreateMessage, DataMessage, DataStreamPart, DeepPartial, IdGenerator, JSONValue, Message, RequestOptions, Schema, ToolInvocation, UIMessage, UseAssistantOptions, formatAssistantStreamPart, formatDataStreamPart, jsonSchema, parseAssistantStreamPart, parseDataStreamPart, processDataStream, processTextStream, zodSchema } from '@ai-sdk/ui-utils';
|
5
|
-
import { LanguageModelV1, LanguageModelV1FinishReason, LanguageModelV1LogProbs, LanguageModelV1CallWarning, LanguageModelV1Source, JSONValue, EmbeddingModelV1, EmbeddingModelV1Embedding, ImageModelV1, ImageModelV1CallWarning, LanguageModelV1ProviderMetadata, LanguageModelV1CallOptions, AISDKError, LanguageModelV1FunctionToolCall, JSONSchema7, JSONParseError, TypeValidationError, ProviderV1, NoSuchModelError } from '@ai-sdk/provider';
|
5
|
+
import { LanguageModelV1, LanguageModelV1FinishReason, LanguageModelV1LogProbs, LanguageModelV1CallWarning, LanguageModelV1Source, JSONValue, EmbeddingModelV1, EmbeddingModelV1Embedding, ImageModelV1, ImageModelV1CallWarning, LanguageModelV1ProviderMetadata, LanguageModelV1CallOptions, AISDKError, LanguageModelV1FunctionToolCall, JSONSchema7, JSONParseError, TypeValidationError, TranscriptionModelV1CallWarning, TranscriptionModelV1, ProviderV1, NoSuchModelError } from '@ai-sdk/provider';
|
6
6
|
export { AISDKError, APICallError, EmptyResponseBodyError, InvalidPromptError, InvalidResponseDataError, JSONParseError, LanguageModelV1, LanguageModelV1CallOptions, LanguageModelV1Prompt, LanguageModelV1StreamPart, LoadAPIKeyError, NoContentGeneratedError, NoSuchModelError, TypeValidationError, UnsupportedFunctionalityError } from '@ai-sdk/provider';
|
7
7
|
import { ServerResponse } from 'node:http';
|
8
8
|
import { AttributeValue, Tracer } from '@opentelemetry/api';
|
@@ -2539,6 +2539,9 @@ type DataStreamOptions = {
|
|
2539
2539
|
*/
|
2540
2540
|
experimental_sendStart?: boolean;
|
2541
2541
|
};
|
2542
|
+
type ConsumeStreamOptions = {
|
2543
|
+
onError?: (error: unknown) => void;
|
2544
|
+
};
|
2542
2545
|
/**
|
2543
2546
|
A result object for accessing different stream types and additional information.
|
2544
2547
|
*/
|
@@ -2659,8 +2662,10 @@ interface StreamTextResult<TOOLS extends ToolSet, PARTIAL_OUTPUT> {
|
|
2659
2662
|
This is useful to force the stream to finish.
|
2660
2663
|
It effectively removes the backpressure and allows the stream to finish,
|
2661
2664
|
triggering the `onFinish` callback and the promise resolution.
|
2665
|
+
|
2666
|
+
If an error occurs, it is passed to the optional `onError` callback.
|
2662
2667
|
*/
|
2663
|
-
consumeStream(): Promise<void>;
|
2668
|
+
consumeStream(options?: ConsumeStreamOptions): Promise<void>;
|
2664
2669
|
/**
|
2665
2670
|
Converts the result to a data stream.
|
2666
2671
|
|
@@ -3787,6 +3792,132 @@ Callback that is called when the LLM response and the final object validation ar
|
|
3787
3792
|
};
|
3788
3793
|
}): StreamObjectResult<JSONValue, JSONValue, never>;
|
3789
3794
|
|
3795
|
+
/**
|
3796
|
+
Warning from the model provider for this call. The call will proceed, but e.g.
|
3797
|
+
some settings might not be supported, which can lead to suboptimal results.
|
3798
|
+
*/
|
3799
|
+
type TranscriptionWarning = TranscriptionModelV1CallWarning;
|
3800
|
+
|
3801
|
+
type TranscriptionModelResponseMetadata = {
|
3802
|
+
/**
|
3803
|
+
Timestamp for the start of the generated response.
|
3804
|
+
*/
|
3805
|
+
timestamp: Date;
|
3806
|
+
/**
|
3807
|
+
The ID of the response model that was used to generate the response.
|
3808
|
+
*/
|
3809
|
+
modelId: string;
|
3810
|
+
/**
|
3811
|
+
Response headers.
|
3812
|
+
*/
|
3813
|
+
headers?: Record<string, string>;
|
3814
|
+
};
|
3815
|
+
|
3816
|
+
/**
|
3817
|
+
The result of a `transcribe` call.
|
3818
|
+
It contains the transcript and additional information.
|
3819
|
+
*/
|
3820
|
+
interface TranscriptionResult {
|
3821
|
+
/**
|
3822
|
+
* The complete transcribed text from the audio.
|
3823
|
+
*/
|
3824
|
+
readonly text: string;
|
3825
|
+
/**
|
3826
|
+
* Array of transcript segments with timing information.
|
3827
|
+
* Each segment represents a portion of the transcribed text with start and end times.
|
3828
|
+
*/
|
3829
|
+
readonly segments: Array<{
|
3830
|
+
/**
|
3831
|
+
* The text content of this segment.
|
3832
|
+
*/
|
3833
|
+
readonly text: string;
|
3834
|
+
/**
|
3835
|
+
* The start time of this segment in seconds.
|
3836
|
+
*/
|
3837
|
+
readonly startSecond: number;
|
3838
|
+
/**
|
3839
|
+
* The end time of this segment in seconds.
|
3840
|
+
*/
|
3841
|
+
readonly endSecond: number;
|
3842
|
+
}>;
|
3843
|
+
/**
|
3844
|
+
* The detected language of the audio content, as an ISO-639-1 code (e.g., 'en' for English).
|
3845
|
+
* May be undefined if the language couldn't be detected.
|
3846
|
+
*/
|
3847
|
+
readonly language: string | undefined;
|
3848
|
+
/**
|
3849
|
+
* The total duration of the audio file in seconds.
|
3850
|
+
* May be undefined if the duration couldn't be determined.
|
3851
|
+
*/
|
3852
|
+
readonly durationInSeconds: number | undefined;
|
3853
|
+
/**
|
3854
|
+
Warnings for the call, e.g. unsupported settings.
|
3855
|
+
*/
|
3856
|
+
readonly warnings: Array<TranscriptionWarning>;
|
3857
|
+
/**
|
3858
|
+
Response metadata from the provider. There may be multiple responses if we made multiple calls to the model.
|
3859
|
+
*/
|
3860
|
+
readonly responses: Array<TranscriptionModelResponseMetadata>;
|
3861
|
+
/**
|
3862
|
+
Provider metadata from the provider.
|
3863
|
+
*/
|
3864
|
+
readonly providerMetadata: Record<string, Record<string, JSONValue>>;
|
3865
|
+
}
|
3866
|
+
|
3867
|
+
/**
|
3868
|
+
Generates transcripts using a transcription model.
|
3869
|
+
|
3870
|
+
@param model - The transcription model to use.
|
3871
|
+
@param audio - The audio data to transcribe as DataContent (string | Uint8Array | ArrayBuffer | Buffer) or a URL.
|
3872
|
+
@param providerOptions - Additional provider-specific options that are passed through to the provider
|
3873
|
+
as body parameters.
|
3874
|
+
@param maxRetries - Maximum number of retries. Set to 0 to disable retries. Default: 2.
|
3875
|
+
@param abortSignal - An optional abort signal that can be used to cancel the call.
|
3876
|
+
@param headers - Additional HTTP headers to be sent with the request. Only applicable for HTTP-based providers.
|
3877
|
+
|
3878
|
+
@returns A result object that contains the generated transcript.
|
3879
|
+
*/
|
3880
|
+
declare function transcribe({ model, audio, providerOptions, maxRetries: maxRetriesArg, abortSignal, headers, }: {
|
3881
|
+
/**
|
3882
|
+
The transcription model to use.
|
3883
|
+
*/
|
3884
|
+
model: TranscriptionModelV1;
|
3885
|
+
/**
|
3886
|
+
The audio data to transcribe.
|
3887
|
+
*/
|
3888
|
+
audio: DataContent | URL;
|
3889
|
+
/**
|
3890
|
+
Additional provider-specific options that are passed through to the provider
|
3891
|
+
as body parameters.
|
3892
|
+
|
3893
|
+
The outer record is keyed by the provider name, and the inner
|
3894
|
+
record is keyed by the provider-specific metadata key.
|
3895
|
+
```ts
|
3896
|
+
{
|
3897
|
+
"openai": {
|
3898
|
+
"temperature": 0
|
3899
|
+
}
|
3900
|
+
}
|
3901
|
+
```
|
3902
|
+
*/
|
3903
|
+
providerOptions?: ProviderOptions;
|
3904
|
+
/**
|
3905
|
+
Maximum number of retries per transcript model call. Set to 0 to disable retries.
|
3906
|
+
|
3907
|
+
@default 2
|
3908
|
+
*/
|
3909
|
+
maxRetries?: number;
|
3910
|
+
/**
|
3911
|
+
Abort signal.
|
3912
|
+
*/
|
3913
|
+
abortSignal?: AbortSignal;
|
3914
|
+
/**
|
3915
|
+
Additional headers to include in the request.
|
3916
|
+
Only applicable for HTTP-based providers.
|
3917
|
+
*/
|
3918
|
+
headers?: Record<string, string>;
|
3919
|
+
}): Promise<TranscriptionResult>;
|
3920
|
+
|
3790
3921
|
/**
|
3791
3922
|
* Experimental middleware for LanguageModelV1.
|
3792
3923
|
* This type defines the structure for middleware that can be used to modify
|
@@ -4390,4 +4521,4 @@ declare namespace llamaindexAdapter {
|
|
4390
4521
|
};
|
4391
4522
|
}
|
4392
4523
|
|
4393
|
-
export { AssistantContent, AssistantResponse, CallWarning, ChunkDetector, CoreAssistantMessage, CoreMessage, CoreSystemMessage, CoreTool, CoreToolCallUnion, CoreToolChoice, CoreToolMessage, CoreToolResultUnion, CoreUserMessage, DataContent, DataStreamOptions, DataStreamWriter, DownloadError, EmbedManyResult, EmbedResult, Embedding, EmbeddingModel, EmbeddingModelUsage, GenerateImageResult as Experimental_GenerateImageResult, GeneratedFile as Experimental_GeneratedImage, Experimental_LanguageModelV1Middleware, FilePart, FinishReason, GenerateObjectResult, GenerateTextOnStepFinishCallback, GenerateTextResult, GeneratedFile, ImageModel, ImageGenerationWarning as ImageModelCallWarning, ImageModelResponseMetadata, ImagePart, InvalidArgumentError, InvalidDataContentError, InvalidMessageRoleError, InvalidStreamPartError, InvalidToolArgumentsError, JSONRPCError, JSONRPCMessage, JSONRPCNotification, JSONRPCRequest, JSONRPCResponse, langchainAdapter as LangChainAdapter, LanguageModel, LanguageModelRequestMetadata, LanguageModelResponseMetadata, LanguageModelUsage, LanguageModelV1Middleware, llamaindexAdapter as LlamaIndexAdapter, LogProbs, MCPClientError, MCPTransport, MessageConversionError, NoImageGeneratedError, NoObjectGeneratedError, NoOutputSpecifiedError, NoSuchProviderError, NoSuchToolError, ObjectStreamPart, output as Output, Provider, ProviderMetadata, ProviderRegistryProvider, RepairTextFunction, RetryError, StepResult, StreamData, StreamObjectOnFinishCallback, StreamObjectResult, StreamTextOnChunkCallback, StreamTextOnErrorCallback, StreamTextOnFinishCallback, StreamTextOnStepFinishCallback, StreamTextResult, StreamTextTransform, TelemetrySettings, TextPart, TextStreamPart, Tool, ToolCallPart, ToolCallRepairError, ToolCallRepairFunction, ToolCallUnion, ToolChoice, ToolContent, ToolExecutionError, ToolExecutionOptions, ToolResultPart, ToolResultUnion, ToolSet, UserContent, appendClientMessage, appendResponseMessages, convertToCoreMessages, coreAssistantMessageSchema, coreMessageSchema, coreSystemMessageSchema, coreToolMessageSchema, coreUserMessageSchema, cosineSimilarity, createDataStream, createDataStreamResponse, createProviderRegistry, customProvider, defaultSettingsMiddleware, embed, embedMany, createMCPClient as experimental_createMCPClient, experimental_createProviderRegistry, experimental_customProvider, generateImage as experimental_generateImage, experimental_wrapLanguageModel, extractReasoningMiddleware, generateObject, generateText, pipeDataStreamToResponse, simulateReadableStream, simulateStreamingMiddleware, smoothStream, streamObject, streamText, tool, wrapLanguageModel };
|
4524
|
+
export { AssistantContent, AssistantResponse, CallWarning, ChunkDetector, CoreAssistantMessage, CoreMessage, CoreSystemMessage, CoreTool, CoreToolCallUnion, CoreToolChoice, CoreToolMessage, CoreToolResultUnion, CoreUserMessage, DataContent, DataStreamOptions, DataStreamWriter, DownloadError, EmbedManyResult, EmbedResult, Embedding, EmbeddingModel, EmbeddingModelUsage, GenerateImageResult as Experimental_GenerateImageResult, GeneratedFile as Experimental_GeneratedImage, Experimental_LanguageModelV1Middleware, TranscriptionResult as Experimental_TranscriptionResult, FilePart, FinishReason, GenerateObjectResult, GenerateTextOnStepFinishCallback, GenerateTextResult, GeneratedFile, ImageModel, ImageGenerationWarning as ImageModelCallWarning, ImageModelResponseMetadata, ImagePart, InvalidArgumentError, InvalidDataContentError, InvalidMessageRoleError, InvalidStreamPartError, InvalidToolArgumentsError, JSONRPCError, JSONRPCMessage, JSONRPCNotification, JSONRPCRequest, JSONRPCResponse, langchainAdapter as LangChainAdapter, LanguageModel, LanguageModelRequestMetadata, LanguageModelResponseMetadata, LanguageModelUsage, LanguageModelV1Middleware, llamaindexAdapter as LlamaIndexAdapter, LogProbs, MCPClientError, MCPTransport, MessageConversionError, NoImageGeneratedError, NoObjectGeneratedError, NoOutputSpecifiedError, NoSuchProviderError, NoSuchToolError, ObjectStreamPart, output as Output, Provider, ProviderMetadata, ProviderRegistryProvider, RepairTextFunction, RetryError, StepResult, StreamData, StreamObjectOnFinishCallback, StreamObjectResult, StreamTextOnChunkCallback, StreamTextOnErrorCallback, StreamTextOnFinishCallback, StreamTextOnStepFinishCallback, StreamTextResult, StreamTextTransform, TelemetrySettings, TextPart, TextStreamPart, Tool, ToolCallPart, ToolCallRepairError, ToolCallRepairFunction, ToolCallUnion, ToolChoice, ToolContent, ToolExecutionError, ToolExecutionOptions, ToolResultPart, ToolResultUnion, ToolSet, UserContent, appendClientMessage, appendResponseMessages, convertToCoreMessages, coreAssistantMessageSchema, coreMessageSchema, coreSystemMessageSchema, coreToolMessageSchema, coreUserMessageSchema, cosineSimilarity, createDataStream, createDataStreamResponse, createProviderRegistry, customProvider, defaultSettingsMiddleware, embed, embedMany, createMCPClient as experimental_createMCPClient, experimental_createProviderRegistry, experimental_customProvider, generateImage as experimental_generateImage, transcribe as experimental_transcribe, experimental_wrapLanguageModel, extractReasoningMiddleware, generateObject, generateText, pipeDataStreamToResponse, simulateReadableStream, simulateStreamingMiddleware, smoothStream, streamObject, streamText, tool, wrapLanguageModel };
|
package/dist/index.d.ts
CHANGED
@@ -2,7 +2,7 @@ import { IDGenerator } from '@ai-sdk/provider-utils';
|
|
2
2
|
export { CoreToolCall, CoreToolResult, IDGenerator, ToolCall, ToolResult, createIdGenerator, generateId } from '@ai-sdk/provider-utils';
|
3
3
|
import { DataStreamString, Message, Schema, DeepPartial, JSONValue as JSONValue$1, AssistantMessage, DataMessage } from '@ai-sdk/ui-utils';
|
4
4
|
export { AssistantMessage, AssistantStatus, Attachment, ChatRequest, ChatRequestOptions, CreateMessage, DataMessage, DataStreamPart, DeepPartial, IdGenerator, JSONValue, Message, RequestOptions, Schema, ToolInvocation, UIMessage, UseAssistantOptions, formatAssistantStreamPart, formatDataStreamPart, jsonSchema, parseAssistantStreamPart, parseDataStreamPart, processDataStream, processTextStream, zodSchema } from '@ai-sdk/ui-utils';
|
5
|
-
import { LanguageModelV1, LanguageModelV1FinishReason, LanguageModelV1LogProbs, LanguageModelV1CallWarning, LanguageModelV1Source, JSONValue, EmbeddingModelV1, EmbeddingModelV1Embedding, ImageModelV1, ImageModelV1CallWarning, LanguageModelV1ProviderMetadata, LanguageModelV1CallOptions, AISDKError, LanguageModelV1FunctionToolCall, JSONSchema7, JSONParseError, TypeValidationError, ProviderV1, NoSuchModelError } from '@ai-sdk/provider';
|
5
|
+
import { LanguageModelV1, LanguageModelV1FinishReason, LanguageModelV1LogProbs, LanguageModelV1CallWarning, LanguageModelV1Source, JSONValue, EmbeddingModelV1, EmbeddingModelV1Embedding, ImageModelV1, ImageModelV1CallWarning, LanguageModelV1ProviderMetadata, LanguageModelV1CallOptions, AISDKError, LanguageModelV1FunctionToolCall, JSONSchema7, JSONParseError, TypeValidationError, TranscriptionModelV1CallWarning, TranscriptionModelV1, ProviderV1, NoSuchModelError } from '@ai-sdk/provider';
|
6
6
|
export { AISDKError, APICallError, EmptyResponseBodyError, InvalidPromptError, InvalidResponseDataError, JSONParseError, LanguageModelV1, LanguageModelV1CallOptions, LanguageModelV1Prompt, LanguageModelV1StreamPart, LoadAPIKeyError, NoContentGeneratedError, NoSuchModelError, TypeValidationError, UnsupportedFunctionalityError } from '@ai-sdk/provider';
|
7
7
|
import { ServerResponse } from 'node:http';
|
8
8
|
import { AttributeValue, Tracer } from '@opentelemetry/api';
|
@@ -2539,6 +2539,9 @@ type DataStreamOptions = {
|
|
2539
2539
|
*/
|
2540
2540
|
experimental_sendStart?: boolean;
|
2541
2541
|
};
|
2542
|
+
type ConsumeStreamOptions = {
|
2543
|
+
onError?: (error: unknown) => void;
|
2544
|
+
};
|
2542
2545
|
/**
|
2543
2546
|
A result object for accessing different stream types and additional information.
|
2544
2547
|
*/
|
@@ -2659,8 +2662,10 @@ interface StreamTextResult<TOOLS extends ToolSet, PARTIAL_OUTPUT> {
|
|
2659
2662
|
This is useful to force the stream to finish.
|
2660
2663
|
It effectively removes the backpressure and allows the stream to finish,
|
2661
2664
|
triggering the `onFinish` callback and the promise resolution.
|
2665
|
+
|
2666
|
+
If an error occurs, it is passed to the optional `onError` callback.
|
2662
2667
|
*/
|
2663
|
-
consumeStream(): Promise<void>;
|
2668
|
+
consumeStream(options?: ConsumeStreamOptions): Promise<void>;
|
2664
2669
|
/**
|
2665
2670
|
Converts the result to a data stream.
|
2666
2671
|
|
@@ -3787,6 +3792,132 @@ Callback that is called when the LLM response and the final object validation ar
|
|
3787
3792
|
};
|
3788
3793
|
}): StreamObjectResult<JSONValue, JSONValue, never>;
|
3789
3794
|
|
3795
|
+
/**
|
3796
|
+
Warning from the model provider for this call. The call will proceed, but e.g.
|
3797
|
+
some settings might not be supported, which can lead to suboptimal results.
|
3798
|
+
*/
|
3799
|
+
type TranscriptionWarning = TranscriptionModelV1CallWarning;
|
3800
|
+
|
3801
|
+
type TranscriptionModelResponseMetadata = {
|
3802
|
+
/**
|
3803
|
+
Timestamp for the start of the generated response.
|
3804
|
+
*/
|
3805
|
+
timestamp: Date;
|
3806
|
+
/**
|
3807
|
+
The ID of the response model that was used to generate the response.
|
3808
|
+
*/
|
3809
|
+
modelId: string;
|
3810
|
+
/**
|
3811
|
+
Response headers.
|
3812
|
+
*/
|
3813
|
+
headers?: Record<string, string>;
|
3814
|
+
};
|
3815
|
+
|
3816
|
+
/**
|
3817
|
+
The result of a `transcribe` call.
|
3818
|
+
It contains the transcript and additional information.
|
3819
|
+
*/
|
3820
|
+
interface TranscriptionResult {
|
3821
|
+
/**
|
3822
|
+
* The complete transcribed text from the audio.
|
3823
|
+
*/
|
3824
|
+
readonly text: string;
|
3825
|
+
/**
|
3826
|
+
* Array of transcript segments with timing information.
|
3827
|
+
* Each segment represents a portion of the transcribed text with start and end times.
|
3828
|
+
*/
|
3829
|
+
readonly segments: Array<{
|
3830
|
+
/**
|
3831
|
+
* The text content of this segment.
|
3832
|
+
*/
|
3833
|
+
readonly text: string;
|
3834
|
+
/**
|
3835
|
+
* The start time of this segment in seconds.
|
3836
|
+
*/
|
3837
|
+
readonly startSecond: number;
|
3838
|
+
/**
|
3839
|
+
* The end time of this segment in seconds.
|
3840
|
+
*/
|
3841
|
+
readonly endSecond: number;
|
3842
|
+
}>;
|
3843
|
+
/**
|
3844
|
+
* The detected language of the audio content, as an ISO-639-1 code (e.g., 'en' for English).
|
3845
|
+
* May be undefined if the language couldn't be detected.
|
3846
|
+
*/
|
3847
|
+
readonly language: string | undefined;
|
3848
|
+
/**
|
3849
|
+
* The total duration of the audio file in seconds.
|
3850
|
+
* May be undefined if the duration couldn't be determined.
|
3851
|
+
*/
|
3852
|
+
readonly durationInSeconds: number | undefined;
|
3853
|
+
/**
|
3854
|
+
Warnings for the call, e.g. unsupported settings.
|
3855
|
+
*/
|
3856
|
+
readonly warnings: Array<TranscriptionWarning>;
|
3857
|
+
/**
|
3858
|
+
Response metadata from the provider. There may be multiple responses if we made multiple calls to the model.
|
3859
|
+
*/
|
3860
|
+
readonly responses: Array<TranscriptionModelResponseMetadata>;
|
3861
|
+
/**
|
3862
|
+
Provider metadata from the provider.
|
3863
|
+
*/
|
3864
|
+
readonly providerMetadata: Record<string, Record<string, JSONValue>>;
|
3865
|
+
}
|
3866
|
+
|
3867
|
+
/**
|
3868
|
+
Generates transcripts using a transcription model.
|
3869
|
+
|
3870
|
+
@param model - The transcription model to use.
|
3871
|
+
@param audio - The audio data to transcribe as DataContent (string | Uint8Array | ArrayBuffer | Buffer) or a URL.
|
3872
|
+
@param providerOptions - Additional provider-specific options that are passed through to the provider
|
3873
|
+
as body parameters.
|
3874
|
+
@param maxRetries - Maximum number of retries. Set to 0 to disable retries. Default: 2.
|
3875
|
+
@param abortSignal - An optional abort signal that can be used to cancel the call.
|
3876
|
+
@param headers - Additional HTTP headers to be sent with the request. Only applicable for HTTP-based providers.
|
3877
|
+
|
3878
|
+
@returns A result object that contains the generated transcript.
|
3879
|
+
*/
|
3880
|
+
declare function transcribe({ model, audio, providerOptions, maxRetries: maxRetriesArg, abortSignal, headers, }: {
|
3881
|
+
/**
|
3882
|
+
The transcription model to use.
|
3883
|
+
*/
|
3884
|
+
model: TranscriptionModelV1;
|
3885
|
+
/**
|
3886
|
+
The audio data to transcribe.
|
3887
|
+
*/
|
3888
|
+
audio: DataContent | URL;
|
3889
|
+
/**
|
3890
|
+
Additional provider-specific options that are passed through to the provider
|
3891
|
+
as body parameters.
|
3892
|
+
|
3893
|
+
The outer record is keyed by the provider name, and the inner
|
3894
|
+
record is keyed by the provider-specific metadata key.
|
3895
|
+
```ts
|
3896
|
+
{
|
3897
|
+
"openai": {
|
3898
|
+
"temperature": 0
|
3899
|
+
}
|
3900
|
+
}
|
3901
|
+
```
|
3902
|
+
*/
|
3903
|
+
providerOptions?: ProviderOptions;
|
3904
|
+
/**
|
3905
|
+
Maximum number of retries per transcript model call. Set to 0 to disable retries.
|
3906
|
+
|
3907
|
+
@default 2
|
3908
|
+
*/
|
3909
|
+
maxRetries?: number;
|
3910
|
+
/**
|
3911
|
+
Abort signal.
|
3912
|
+
*/
|
3913
|
+
abortSignal?: AbortSignal;
|
3914
|
+
/**
|
3915
|
+
Additional headers to include in the request.
|
3916
|
+
Only applicable for HTTP-based providers.
|
3917
|
+
*/
|
3918
|
+
headers?: Record<string, string>;
|
3919
|
+
}): Promise<TranscriptionResult>;
|
3920
|
+
|
3790
3921
|
/**
|
3791
3922
|
* Experimental middleware for LanguageModelV1.
|
3792
3923
|
* This type defines the structure for middleware that can be used to modify
|
@@ -4390,4 +4521,4 @@ declare namespace llamaindexAdapter {
|
|
4390
4521
|
};
|
4391
4522
|
}
|
4392
4523
|
|
4393
|
-
export { AssistantContent, AssistantResponse, CallWarning, ChunkDetector, CoreAssistantMessage, CoreMessage, CoreSystemMessage, CoreTool, CoreToolCallUnion, CoreToolChoice, CoreToolMessage, CoreToolResultUnion, CoreUserMessage, DataContent, DataStreamOptions, DataStreamWriter, DownloadError, EmbedManyResult, EmbedResult, Embedding, EmbeddingModel, EmbeddingModelUsage, GenerateImageResult as Experimental_GenerateImageResult, GeneratedFile as Experimental_GeneratedImage, Experimental_LanguageModelV1Middleware, FilePart, FinishReason, GenerateObjectResult, GenerateTextOnStepFinishCallback, GenerateTextResult, GeneratedFile, ImageModel, ImageGenerationWarning as ImageModelCallWarning, ImageModelResponseMetadata, ImagePart, InvalidArgumentError, InvalidDataContentError, InvalidMessageRoleError, InvalidStreamPartError, InvalidToolArgumentsError, JSONRPCError, JSONRPCMessage, JSONRPCNotification, JSONRPCRequest, JSONRPCResponse, langchainAdapter as LangChainAdapter, LanguageModel, LanguageModelRequestMetadata, LanguageModelResponseMetadata, LanguageModelUsage, LanguageModelV1Middleware, llamaindexAdapter as LlamaIndexAdapter, LogProbs, MCPClientError, MCPTransport, MessageConversionError, NoImageGeneratedError, NoObjectGeneratedError, NoOutputSpecifiedError, NoSuchProviderError, NoSuchToolError, ObjectStreamPart, output as Output, Provider, ProviderMetadata, ProviderRegistryProvider, RepairTextFunction, RetryError, StepResult, StreamData, StreamObjectOnFinishCallback, StreamObjectResult, StreamTextOnChunkCallback, StreamTextOnErrorCallback, StreamTextOnFinishCallback, StreamTextOnStepFinishCallback, StreamTextResult, StreamTextTransform, TelemetrySettings, TextPart, TextStreamPart, Tool, ToolCallPart, ToolCallRepairError, ToolCallRepairFunction, ToolCallUnion, ToolChoice, ToolContent, ToolExecutionError, ToolExecutionOptions, ToolResultPart, ToolResultUnion, ToolSet, UserContent, appendClientMessage, appendResponseMessages, convertToCoreMessages, coreAssistantMessageSchema, coreMessageSchema, coreSystemMessageSchema, coreToolMessageSchema, coreUserMessageSchema, cosineSimilarity, createDataStream, createDataStreamResponse, createProviderRegistry, customProvider, defaultSettingsMiddleware, embed, embedMany, createMCPClient as experimental_createMCPClient, experimental_createProviderRegistry, experimental_customProvider, generateImage as experimental_generateImage, experimental_wrapLanguageModel, extractReasoningMiddleware, generateObject, generateText, pipeDataStreamToResponse, simulateReadableStream, simulateStreamingMiddleware, smoothStream, streamObject, streamText, tool, wrapLanguageModel };
|
4524
|
+
export { AssistantContent, AssistantResponse, CallWarning, ChunkDetector, CoreAssistantMessage, CoreMessage, CoreSystemMessage, CoreTool, CoreToolCallUnion, CoreToolChoice, CoreToolMessage, CoreToolResultUnion, CoreUserMessage, DataContent, DataStreamOptions, DataStreamWriter, DownloadError, EmbedManyResult, EmbedResult, Embedding, EmbeddingModel, EmbeddingModelUsage, GenerateImageResult as Experimental_GenerateImageResult, GeneratedFile as Experimental_GeneratedImage, Experimental_LanguageModelV1Middleware, TranscriptionResult as Experimental_TranscriptionResult, FilePart, FinishReason, GenerateObjectResult, GenerateTextOnStepFinishCallback, GenerateTextResult, GeneratedFile, ImageModel, ImageGenerationWarning as ImageModelCallWarning, ImageModelResponseMetadata, ImagePart, InvalidArgumentError, InvalidDataContentError, InvalidMessageRoleError, InvalidStreamPartError, InvalidToolArgumentsError, JSONRPCError, JSONRPCMessage, JSONRPCNotification, JSONRPCRequest, JSONRPCResponse, langchainAdapter as LangChainAdapter, LanguageModel, LanguageModelRequestMetadata, LanguageModelResponseMetadata, LanguageModelUsage, LanguageModelV1Middleware, llamaindexAdapter as LlamaIndexAdapter, LogProbs, MCPClientError, MCPTransport, MessageConversionError, NoImageGeneratedError, NoObjectGeneratedError, NoOutputSpecifiedError, NoSuchProviderError, NoSuchToolError, ObjectStreamPart, output as Output, Provider, ProviderMetadata, ProviderRegistryProvider, RepairTextFunction, RetryError, StepResult, StreamData, StreamObjectOnFinishCallback, StreamObjectResult, StreamTextOnChunkCallback, StreamTextOnErrorCallback, StreamTextOnFinishCallback, StreamTextOnStepFinishCallback, StreamTextResult, StreamTextTransform, TelemetrySettings, TextPart, TextStreamPart, Tool, ToolCallPart, ToolCallRepairError, ToolCallRepairFunction, ToolCallUnion, ToolChoice, ToolContent, ToolExecutionError, ToolExecutionOptions, ToolResultPart, ToolResultUnion, ToolSet, UserContent, appendClientMessage, appendResponseMessages, convertToCoreMessages, coreAssistantMessageSchema, coreMessageSchema, coreSystemMessageSchema, coreToolMessageSchema, coreUserMessageSchema, cosineSimilarity, createDataStream, createDataStreamResponse, createProviderRegistry, customProvider, defaultSettingsMiddleware, embed, embedMany, createMCPClient as experimental_createMCPClient, experimental_createProviderRegistry, experimental_customProvider, generateImage as experimental_generateImage, transcribe as experimental_transcribe, experimental_wrapLanguageModel, extractReasoningMiddleware, generateObject, generateText, pipeDataStreamToResponse, simulateReadableStream, simulateStreamingMiddleware, smoothStream, streamObject, streamText, tool, wrapLanguageModel };
|