@cloudflare/workers-types 4.20251121.0 → 4.20251125.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -4002,6 +4002,427 @@ declare abstract class BaseAiTranslation {
4002
4002
  inputs: AiTranslationInput;
4003
4003
  postProcessedOutputs: AiTranslationOutput;
4004
4004
  }
4005
+ /**
4006
+ * Workers AI support for OpenAI's Responses API
4007
+ * Reference: https://github.com/openai/openai-node/blob/master/src/resources/responses/responses.ts
4008
+ *
4009
+ * It is a stripped-down version of its source.
4010
+ * It currently supports basic function calling and JSON mode, and accepts images as input.
4011
+ *
4012
+ * It does not include types for WebSearch, CodeInterpreter, FileInputs, MCP, CustomTools.
4013
+ * We plan to add those incrementally as model + platform capabilities evolve.
4014
+ */
4015
+ type ResponsesInput = {
4016
+ background?: boolean | null;
4017
+ conversation?: string | ResponseConversationParam | null;
4018
+ include?: Array<ResponseIncludable> | null;
4019
+ input?: string | ResponseInput;
4020
+ instructions?: string | null;
4021
+ max_output_tokens?: number | null;
4022
+ parallel_tool_calls?: boolean | null;
4023
+ previous_response_id?: string | null;
4024
+ prompt_cache_key?: string;
4025
+ reasoning?: Reasoning | null;
4026
+ safety_identifier?: string;
4027
+ service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
4028
+ stream?: boolean | null;
4029
+ stream_options?: StreamOptions | null;
4030
+ temperature?: number | null;
4031
+ text?: ResponseTextConfig;
4032
+ tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
4033
+ tools?: Array<Tool>;
4034
+ top_p?: number | null;
4035
+ truncation?: "auto" | "disabled" | null;
4036
+ };
4037
+ type ResponsesOutput = {
4038
+ id?: string;
4039
+ created_at?: number;
4040
+ output_text?: string;
4041
+ error?: ResponseError | null;
4042
+ incomplete_details?: ResponseIncompleteDetails | null;
4043
+ instructions?: string | Array<ResponseInputItem> | null;
4044
+ object?: "response";
4045
+ output?: Array<ResponseOutputItem>;
4046
+ parallel_tool_calls?: boolean;
4047
+ temperature?: number | null;
4048
+ tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
4049
+ tools?: Array<Tool>;
4050
+ top_p?: number | null;
4051
+ max_output_tokens?: number | null;
4052
+ previous_response_id?: string | null;
4053
+ prompt?: ResponsePrompt | null;
4054
+ reasoning?: Reasoning | null;
4055
+ safety_identifier?: string;
4056
+ service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
4057
+ status?: ResponseStatus;
4058
+ text?: ResponseTextConfig;
4059
+ truncation?: "auto" | "disabled" | null;
4060
+ usage?: ResponseUsage;
4061
+ };
4062
+ type EasyInputMessage = {
4063
+ content: string | ResponseInputMessageContentList;
4064
+ role: "user" | "assistant" | "system" | "developer";
4065
+ type?: "message";
4066
+ };
4067
+ type ResponsesFunctionTool = {
4068
+ name: string;
4069
+ parameters: {
4070
+ [key: string]: unknown;
4071
+ } | null;
4072
+ strict: boolean | null;
4073
+ type: "function";
4074
+ description?: string | null;
4075
+ };
4076
+ type ResponseIncompleteDetails = {
4077
+ reason?: "max_output_tokens" | "content_filter";
4078
+ };
4079
+ type ResponsePrompt = {
4080
+ id: string;
4081
+ variables?: {
4082
+ [key: string]: string | ResponseInputText | ResponseInputImage;
4083
+ } | null;
4084
+ version?: string | null;
4085
+ };
4086
+ type Reasoning = {
4087
+ effort?: ReasoningEffort | null;
4088
+ generate_summary?: "auto" | "concise" | "detailed" | null;
4089
+ summary?: "auto" | "concise" | "detailed" | null;
4090
+ };
4091
+ type ResponseContent =
4092
+ | ResponseInputText
4093
+ | ResponseInputImage
4094
+ | ResponseOutputText
4095
+ | ResponseOutputRefusal
4096
+ | ResponseContentReasoningText;
4097
+ type ResponseContentReasoningText = {
4098
+ text: string;
4099
+ type: "reasoning_text";
4100
+ };
4101
+ type ResponseConversationParam = {
4102
+ id: string;
4103
+ };
4104
+ type ResponseCreatedEvent = {
4105
+ response: Response;
4106
+ sequence_number: number;
4107
+ type: "response.created";
4108
+ };
4109
+ type ResponseCustomToolCallOutput = {
4110
+ call_id: string;
4111
+ output: string | Array<ResponseInputText | ResponseInputImage>;
4112
+ type: "custom_tool_call_output";
4113
+ id?: string;
4114
+ };
4115
+ type ResponseError = {
4116
+ code:
4117
+ | "server_error"
4118
+ | "rate_limit_exceeded"
4119
+ | "invalid_prompt"
4120
+ | "vector_store_timeout"
4121
+ | "invalid_image"
4122
+ | "invalid_image_format"
4123
+ | "invalid_base64_image"
4124
+ | "invalid_image_url"
4125
+ | "image_too_large"
4126
+ | "image_too_small"
4127
+ | "image_parse_error"
4128
+ | "image_content_policy_violation"
4129
+ | "invalid_image_mode"
4130
+ | "image_file_too_large"
4131
+ | "unsupported_image_media_type"
4132
+ | "empty_image_file"
4133
+ | "failed_to_download_image"
4134
+ | "image_file_not_found";
4135
+ message: string;
4136
+ };
4137
+ type ResponseErrorEvent = {
4138
+ code: string | null;
4139
+ message: string;
4140
+ param: string | null;
4141
+ sequence_number: number;
4142
+ type: "error";
4143
+ };
4144
+ type ResponseFailedEvent = {
4145
+ response: Response;
4146
+ sequence_number: number;
4147
+ type: "response.failed";
4148
+ };
4149
+ type ResponseFormatText = {
4150
+ type: "text";
4151
+ };
4152
+ type ResponseFormatJSONObject = {
4153
+ type: "json_object";
4154
+ };
4155
+ type ResponseFormatTextConfig =
4156
+ | ResponseFormatText
4157
+ | ResponseFormatTextJSONSchemaConfig
4158
+ | ResponseFormatJSONObject;
4159
+ type ResponseFormatTextJSONSchemaConfig = {
4160
+ name: string;
4161
+ schema: {
4162
+ [key: string]: unknown;
4163
+ };
4164
+ type: "json_schema";
4165
+ description?: string;
4166
+ strict?: boolean | null;
4167
+ };
4168
+ type ResponseFunctionCallArgumentsDeltaEvent = {
4169
+ delta: string;
4170
+ item_id: string;
4171
+ output_index: number;
4172
+ sequence_number: number;
4173
+ type: "response.function_call_arguments.delta";
4174
+ };
4175
+ type ResponseFunctionCallArgumentsDoneEvent = {
4176
+ arguments: string;
4177
+ item_id: string;
4178
+ name: string;
4179
+ output_index: number;
4180
+ sequence_number: number;
4181
+ type: "response.function_call_arguments.done";
4182
+ };
4183
+ type ResponseFunctionCallOutputItem =
4184
+ | ResponseInputTextContent
4185
+ | ResponseInputImageContent;
4186
+ type ResponseFunctionCallOutputItemList = Array<ResponseFunctionCallOutputItem>;
4187
+ type ResponseFunctionToolCall = {
4188
+ arguments: string;
4189
+ call_id: string;
4190
+ name: string;
4191
+ type: "function_call";
4192
+ id?: string;
4193
+ status?: "in_progress" | "completed" | "incomplete";
4194
+ };
4195
+ interface ResponseFunctionToolCallItem extends ResponseFunctionToolCall {
4196
+ id: string;
4197
+ }
4198
+ type ResponseFunctionToolCallOutputItem = {
4199
+ id: string;
4200
+ call_id: string;
4201
+ output: string | Array<ResponseInputText | ResponseInputImage>;
4202
+ type: "function_call_output";
4203
+ status?: "in_progress" | "completed" | "incomplete";
4204
+ };
4205
+ type ResponseIncludable =
4206
+ | "message.input_image.image_url"
4207
+ | "message.output_text.logprobs";
4208
+ type ResponseIncompleteEvent = {
4209
+ response: Response;
4210
+ sequence_number: number;
4211
+ type: "response.incomplete";
4212
+ };
4213
+ type ResponseInput = Array<ResponseInputItem>;
4214
+ type ResponseInputContent = ResponseInputText | ResponseInputImage;
4215
+ type ResponseInputImage = {
4216
+ detail: "low" | "high" | "auto";
4217
+ type: "input_image";
4218
+ /**
4219
+ * Base64 encoded image
4220
+ */
4221
+ image_url?: string | null;
4222
+ };
4223
+ type ResponseInputImageContent = {
4224
+ type: "input_image";
4225
+ detail?: "low" | "high" | "auto" | null;
4226
+ /**
4227
+ * Base64 encoded image
4228
+ */
4229
+ image_url?: string | null;
4230
+ };
4231
+ type ResponseInputItem =
4232
+ | EasyInputMessage
4233
+ | ResponseInputItemMessage
4234
+ | ResponseOutputMessage
4235
+ | ResponseFunctionToolCall
4236
+ | ResponseInputItemFunctionCallOutput
4237
+ | ResponseReasoningItem;
4238
+ type ResponseInputItemFunctionCallOutput = {
4239
+ call_id: string;
4240
+ output: string | ResponseFunctionCallOutputItemList;
4241
+ type: "function_call_output";
4242
+ id?: string | null;
4243
+ status?: "in_progress" | "completed" | "incomplete" | null;
4244
+ };
4245
+ type ResponseInputItemMessage = {
4246
+ content: ResponseInputMessageContentList;
4247
+ role: "user" | "system" | "developer";
4248
+ status?: "in_progress" | "completed" | "incomplete";
4249
+ type?: "message";
4250
+ };
4251
+ type ResponseInputMessageContentList = Array<ResponseInputContent>;
4252
+ type ResponseInputMessageItem = {
4253
+ id: string;
4254
+ content: ResponseInputMessageContentList;
4255
+ role: "user" | "system" | "developer";
4256
+ status?: "in_progress" | "completed" | "incomplete";
4257
+ type?: "message";
4258
+ };
4259
+ type ResponseInputText = {
4260
+ text: string;
4261
+ type: "input_text";
4262
+ };
4263
+ type ResponseInputTextContent = {
4264
+ text: string;
4265
+ type: "input_text";
4266
+ };
4267
+ type ResponseItem =
4268
+ | ResponseInputMessageItem
4269
+ | ResponseOutputMessage
4270
+ | ResponseFunctionToolCallItem
4271
+ | ResponseFunctionToolCallOutputItem;
4272
+ type ResponseOutputItem =
4273
+ | ResponseOutputMessage
4274
+ | ResponseFunctionToolCall
4275
+ | ResponseReasoningItem;
4276
+ type ResponseOutputItemAddedEvent = {
4277
+ item: ResponseOutputItem;
4278
+ output_index: number;
4279
+ sequence_number: number;
4280
+ type: "response.output_item.added";
4281
+ };
4282
+ type ResponseOutputItemDoneEvent = {
4283
+ item: ResponseOutputItem;
4284
+ output_index: number;
4285
+ sequence_number: number;
4286
+ type: "response.output_item.done";
4287
+ };
4288
+ type ResponseOutputMessage = {
4289
+ id: string;
4290
+ content: Array<ResponseOutputText | ResponseOutputRefusal>;
4291
+ role: "assistant";
4292
+ status: "in_progress" | "completed" | "incomplete";
4293
+ type: "message";
4294
+ };
4295
+ type ResponseOutputRefusal = {
4296
+ refusal: string;
4297
+ type: "refusal";
4298
+ };
4299
+ type ResponseOutputText = {
4300
+ text: string;
4301
+ type: "output_text";
4302
+ logprobs?: Array<Logprob>;
4303
+ };
4304
+ type ResponseReasoningItem = {
4305
+ id: string;
4306
+ summary: Array<ResponseReasoningSummaryItem>;
4307
+ type: "reasoning";
4308
+ content?: Array<ResponseReasoningContentItem>;
4309
+ encrypted_content?: string | null;
4310
+ status?: "in_progress" | "completed" | "incomplete";
4311
+ };
4312
+ type ResponseReasoningSummaryItem = {
4313
+ text: string;
4314
+ type: "summary_text";
4315
+ };
4316
+ type ResponseReasoningContentItem = {
4317
+ text: string;
4318
+ type: "reasoning_text";
4319
+ };
4320
+ type ResponseReasoningTextDeltaEvent = {
4321
+ content_index: number;
4322
+ delta: string;
4323
+ item_id: string;
4324
+ output_index: number;
4325
+ sequence_number: number;
4326
+ type: "response.reasoning_text.delta";
4327
+ };
4328
+ type ResponseReasoningTextDoneEvent = {
4329
+ content_index: number;
4330
+ item_id: string;
4331
+ output_index: number;
4332
+ sequence_number: number;
4333
+ text: string;
4334
+ type: "response.reasoning_text.done";
4335
+ };
4336
+ type ResponseRefusalDeltaEvent = {
4337
+ content_index: number;
4338
+ delta: string;
4339
+ item_id: string;
4340
+ output_index: number;
4341
+ sequence_number: number;
4342
+ type: "response.refusal.delta";
4343
+ };
4344
+ type ResponseRefusalDoneEvent = {
4345
+ content_index: number;
4346
+ item_id: string;
4347
+ output_index: number;
4348
+ refusal: string;
4349
+ sequence_number: number;
4350
+ type: "response.refusal.done";
4351
+ };
4352
+ type ResponseStatus =
4353
+ | "completed"
4354
+ | "failed"
4355
+ | "in_progress"
4356
+ | "cancelled"
4357
+ | "queued"
4358
+ | "incomplete";
4359
+ type ResponseStreamEvent =
4360
+ | ResponseCompletedEvent
4361
+ | ResponseCreatedEvent
4362
+ | ResponseErrorEvent
4363
+ | ResponseFunctionCallArgumentsDeltaEvent
4364
+ | ResponseFunctionCallArgumentsDoneEvent
4365
+ | ResponseFailedEvent
4366
+ | ResponseIncompleteEvent
4367
+ | ResponseOutputItemAddedEvent
4368
+ | ResponseOutputItemDoneEvent
4369
+ | ResponseReasoningTextDeltaEvent
4370
+ | ResponseReasoningTextDoneEvent
4371
+ | ResponseRefusalDeltaEvent
4372
+ | ResponseRefusalDoneEvent
4373
+ | ResponseTextDeltaEvent
4374
+ | ResponseTextDoneEvent;
4375
+ type ResponseCompletedEvent = {
4376
+ response: Response;
4377
+ sequence_number: number;
4378
+ type: "response.completed";
4379
+ };
4380
+ type ResponseTextConfig = {
4381
+ format?: ResponseFormatTextConfig;
4382
+ verbosity?: "low" | "medium" | "high" | null;
4383
+ };
4384
+ type ResponseTextDeltaEvent = {
4385
+ content_index: number;
4386
+ delta: string;
4387
+ item_id: string;
4388
+ logprobs: Array<Logprob>;
4389
+ output_index: number;
4390
+ sequence_number: number;
4391
+ type: "response.output_text.delta";
4392
+ };
4393
+ type ResponseTextDoneEvent = {
4394
+ content_index: number;
4395
+ item_id: string;
4396
+ logprobs: Array<Logprob>;
4397
+ output_index: number;
4398
+ sequence_number: number;
4399
+ text: string;
4400
+ type: "response.output_text.done";
4401
+ };
4402
+ type Logprob = {
4403
+ token: string;
4404
+ logprob: number;
4405
+ top_logprobs?: Array<TopLogprob>;
4406
+ };
4407
+ type TopLogprob = {
4408
+ token?: string;
4409
+ logprob?: number;
4410
+ };
4411
+ type ResponseUsage = {
4412
+ input_tokens: number;
4413
+ output_tokens: number;
4414
+ total_tokens: number;
4415
+ };
4416
+ type Tool = ResponsesFunctionTool;
4417
+ type ToolChoiceFunction = {
4418
+ name: string;
4419
+ type: "function";
4420
+ };
4421
+ type ToolChoiceOptions = "none";
4422
+ type ReasoningEffort = "minimal" | "low" | "medium" | "high" | null;
4423
+ type StreamOptions = {
4424
+ include_obfuscation?: boolean;
4425
+ };
4005
4426
  type Ai_Cf_Baai_Bge_Base_En_V1_5_Input =
4006
4427
  | {
4007
4428
  text: string | string[];
@@ -4034,8 +4455,8 @@ type Ai_Cf_Baai_Bge_Base_En_V1_5_Output =
4034
4455
  */
4035
4456
  pooling?: "mean" | "cls";
4036
4457
  }
4037
- | AsyncResponse;
4038
- interface AsyncResponse {
4458
+ | Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse;
4459
+ interface Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse {
4039
4460
  /**
4040
4461
  * The async request id that can be used to obtain the results.
4041
4462
  */
@@ -4117,7 +4538,13 @@ type Ai_Cf_Meta_M2M100_1_2B_Output =
4117
4538
  */
4118
4539
  translated_text?: string;
4119
4540
  }
4120
- | AsyncResponse;
4541
+ | Ai_Cf_Meta_M2M100_1_2B_AsyncResponse;
4542
+ interface Ai_Cf_Meta_M2M100_1_2B_AsyncResponse {
4543
+ /**
4544
+ * The async request id that can be used to obtain the results.
4545
+ */
4546
+ request_id?: string;
4547
+ }
4121
4548
  declare abstract class Base_Ai_Cf_Meta_M2M100_1_2B {
4122
4549
  inputs: Ai_Cf_Meta_M2M100_1_2B_Input;
4123
4550
  postProcessedOutputs: Ai_Cf_Meta_M2M100_1_2B_Output;
@@ -4154,7 +4581,13 @@ type Ai_Cf_Baai_Bge_Small_En_V1_5_Output =
4154
4581
  */
4155
4582
  pooling?: "mean" | "cls";
4156
4583
  }
4157
- | AsyncResponse;
4584
+ | Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse;
4585
+ interface Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse {
4586
+ /**
4587
+ * The async request id that can be used to obtain the results.
4588
+ */
4589
+ request_id?: string;
4590
+ }
4158
4591
  declare abstract class Base_Ai_Cf_Baai_Bge_Small_En_V1_5 {
4159
4592
  inputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Input;
4160
4593
  postProcessedOutputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Output;
@@ -4191,7 +4624,13 @@ type Ai_Cf_Baai_Bge_Large_En_V1_5_Output =
4191
4624
  */
4192
4625
  pooling?: "mean" | "cls";
4193
4626
  }
4194
- | AsyncResponse;
4627
+ | Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse;
4628
+ interface Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse {
4629
+ /**
4630
+ * The async request id that can be used to obtain the results.
4631
+ */
4632
+ request_id?: string;
4633
+ }
4195
4634
  declare abstract class Base_Ai_Cf_Baai_Bge_Large_En_V1_5 {
4196
4635
  inputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Input;
4197
4636
  postProcessedOutputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Output;
@@ -4382,15 +4821,18 @@ declare abstract class Base_Ai_Cf_Openai_Whisper_Large_V3_Turbo {
4382
4821
  postProcessedOutputs: Ai_Cf_Openai_Whisper_Large_V3_Turbo_Output;
4383
4822
  }
4384
4823
  type Ai_Cf_Baai_Bge_M3_Input =
4385
- | BGEM3InputQueryAndContexts
4386
- | BGEM3InputEmbedding
4824
+ | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts
4825
+ | Ai_Cf_Baai_Bge_M3_Input_Embedding
4387
4826
  | {
4388
4827
  /**
4389
4828
  * Batch of the embeddings requests to run using async-queue
4390
4829
  */
4391
- requests: (BGEM3InputQueryAndContexts1 | BGEM3InputEmbedding1)[];
4830
+ requests: (
4831
+ | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1
4832
+ | Ai_Cf_Baai_Bge_M3_Input_Embedding_1
4833
+ )[];
4392
4834
  };
4393
- interface BGEM3InputQueryAndContexts {
4835
+ interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts {
4394
4836
  /**
4395
4837
  * A query you wish to perform against the provided contexts. If no query is provided, the model will respond with embeddings for the contexts
4396
4838
  */
@@ -4409,14 +4851,14 @@ interface BGEM3InputQueryAndContexts {
4409
4851
  */
4410
4852
  truncate_inputs?: boolean;
4411
4853
  }
4412
- interface BGEM3InputEmbedding {
4854
+ interface Ai_Cf_Baai_Bge_M3_Input_Embedding {
4413
4855
  text: string | string[];
4414
4856
  /**
4415
4857
  * When the provided context is too long, should the model error out or truncate the context to fit?
4416
4858
  */
4417
4859
  truncate_inputs?: boolean;
4418
4860
  }
4419
- interface BGEM3InputQueryAndContexts1 {
4861
+ interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1 {
4420
4862
  /**
4421
4863
  * A query you wish to perform against the provided contexts. If no query is provided, the model will respond with embeddings for the contexts
4422
4864
  */
@@ -4435,7 +4877,7 @@ interface BGEM3InputQueryAndContexts1 {
4435
4877
  */
4436
4878
  truncate_inputs?: boolean;
4437
4879
  }
4438
- interface BGEM3InputEmbedding1 {
4880
+ interface Ai_Cf_Baai_Bge_M3_Input_Embedding_1 {
4439
4881
  text: string | string[];
4440
4882
  /**
4441
4883
  * When the provided context is too long, should the model error out or truncate the context to fit?
@@ -4443,11 +4885,11 @@ interface BGEM3InputEmbedding1 {
4443
4885
  truncate_inputs?: boolean;
4444
4886
  }
4445
4887
  type Ai_Cf_Baai_Bge_M3_Output =
4446
- | BGEM3OuputQuery
4447
- | BGEM3OutputEmbeddingForContexts
4448
- | BGEM3OuputEmbedding
4449
- | AsyncResponse;
4450
- interface BGEM3OuputQuery {
4888
+ | Ai_Cf_Baai_Bge_M3_Ouput_Query
4889
+ | Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts
4890
+ | Ai_Cf_Baai_Bge_M3_Ouput_Embedding
4891
+ | Ai_Cf_Baai_Bge_M3_AsyncResponse;
4892
+ interface Ai_Cf_Baai_Bge_M3_Ouput_Query {
4451
4893
  response?: {
4452
4894
  /**
4453
4895
  * Index of the context in the request
@@ -4459,7 +4901,7 @@ interface BGEM3OuputQuery {
4459
4901
  score?: number;
4460
4902
  }[];
4461
4903
  }
4462
- interface BGEM3OutputEmbeddingForContexts {
4904
+ interface Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts {
4463
4905
  response?: number[][];
4464
4906
  shape?: number[];
4465
4907
  /**
@@ -4467,7 +4909,7 @@ interface BGEM3OutputEmbeddingForContexts {
4467
4909
  */
4468
4910
  pooling?: "mean" | "cls";
4469
4911
  }
4470
- interface BGEM3OuputEmbedding {
4912
+ interface Ai_Cf_Baai_Bge_M3_Ouput_Embedding {
4471
4913
  shape?: number[];
4472
4914
  /**
4473
4915
  * Embeddings of the requested text values
@@ -4478,6 +4920,12 @@ interface BGEM3OuputEmbedding {
4478
4920
  */
4479
4921
  pooling?: "mean" | "cls";
4480
4922
  }
4923
+ interface Ai_Cf_Baai_Bge_M3_AsyncResponse {
4924
+ /**
4925
+ * The async request id that can be used to obtain the results.
4926
+ */
4927
+ request_id?: string;
4928
+ }
4481
4929
  declare abstract class Base_Ai_Cf_Baai_Bge_M3 {
4482
4930
  inputs: Ai_Cf_Baai_Bge_M3_Input;
4483
4931
  postProcessedOutputs: Ai_Cf_Baai_Bge_M3_Output;
@@ -4502,8 +4950,10 @@ declare abstract class Base_Ai_Cf_Black_Forest_Labs_Flux_1_Schnell {
4502
4950
  inputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Input;
4503
4951
  postProcessedOutputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Output;
4504
4952
  }
4505
- type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input = Prompt | Messages;
4506
- interface Prompt {
4953
+ type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input =
4954
+ | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt
4955
+ | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages;
4956
+ interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt {
4507
4957
  /**
4508
4958
  * The input text prompt for the model to generate a response.
4509
4959
  */
@@ -4554,7 +5004,7 @@ interface Prompt {
4554
5004
  */
4555
5005
  lora?: string;
4556
5006
  }
4557
- interface Messages {
5007
+ interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages {
4558
5008
  /**
4559
5009
  * An array of message objects representing the conversation history.
4560
5010
  */
@@ -4752,10 +5202,10 @@ declare abstract class Base_Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct {
4752
5202
  postProcessedOutputs: Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Output;
4753
5203
  }
4754
5204
  type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input =
4755
- | Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt
4756
- | Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages
4757
- | AsyncBatch;
4758
- interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
5205
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt
5206
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages
5207
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch;
5208
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
4759
5209
  /**
4760
5210
  * The input text prompt for the model to generate a response.
4761
5211
  */
@@ -4764,7 +5214,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
4764
5214
  * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
4765
5215
  */
4766
5216
  lora?: string;
4767
- response_format?: JSONMode;
5217
+ response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode;
4768
5218
  /**
4769
5219
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
4770
5220
  */
@@ -4806,11 +5256,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
4806
5256
  */
4807
5257
  presence_penalty?: number;
4808
5258
  }
4809
- interface JSONMode {
5259
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode {
4810
5260
  type?: "json_object" | "json_schema";
4811
5261
  json_schema?: unknown;
4812
5262
  }
4813
- interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
5263
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
4814
5264
  /**
4815
5265
  * An array of message objects representing the conversation history.
4816
5266
  */
@@ -4918,7 +5368,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
4918
5368
  };
4919
5369
  }
4920
5370
  )[];
4921
- response_format?: JSONMode;
5371
+ response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1;
4922
5372
  /**
4923
5373
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
4924
5374
  */
@@ -4960,7 +5410,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
4960
5410
  */
4961
5411
  presence_penalty?: number;
4962
5412
  }
4963
- interface AsyncBatch {
5413
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1 {
5414
+ type?: "json_object" | "json_schema";
5415
+ json_schema?: unknown;
5416
+ }
5417
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch {
4964
5418
  requests?: {
4965
5419
  /**
4966
5420
  * User-supplied reference. This field is also present in the response, so it can be used to match a request to its response. It's NOT validated to be unique.
@@ -5002,9 +5456,13 @@ interface AsyncBatch {
5002
5456
  * Increases the likelihood of the model introducing new topics.
5003
5457
  */
5004
5458
  presence_penalty?: number;
5005
- response_format?: JSONMode;
5459
+ response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2;
5006
5460
  }[];
5007
5461
  }
5462
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2 {
5463
+ type?: "json_object" | "json_schema";
5464
+ json_schema?: unknown;
5465
+ }
5008
5466
  type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
5009
5467
  | {
5010
5468
  /**
@@ -5043,7 +5501,13 @@ type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
5043
5501
  }[];
5044
5502
  }
5045
5503
  | string
5046
- | AsyncResponse;
5504
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse;
5505
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse {
5506
+ /**
5507
+ * The async request id that can be used to obtain the results.
5508
+ */
5509
+ request_id?: string;
5510
+ }
5047
5511
  declare abstract class Base_Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast {
5048
5512
  inputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input;
5049
5513
  postProcessedOutputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output;
@@ -5150,9 +5614,9 @@ declare abstract class Base_Ai_Cf_Baai_Bge_Reranker_Base {
5150
5614
  postProcessedOutputs: Ai_Cf_Baai_Bge_Reranker_Base_Output;
5151
5615
  }
5152
5616
  type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input =
5153
- | Qwen2_5_Coder_32B_Instruct_Prompt
5154
- | Qwen2_5_Coder_32B_Instruct_Messages;
5155
- interface Qwen2_5_Coder_32B_Instruct_Prompt {
5617
+ | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt
5618
+ | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages;
5619
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt {
5156
5620
  /**
5157
5621
  * The input text prompt for the model to generate a response.
5158
5622
  */
@@ -5161,7 +5625,7 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
5161
5625
  * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
5162
5626
  */
5163
5627
  lora?: string;
5164
- response_format?: JSONMode;
5628
+ response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode;
5165
5629
  /**
5166
5630
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
5167
5631
  */
@@ -5203,7 +5667,11 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
5203
5667
  */
5204
5668
  presence_penalty?: number;
5205
5669
  }
5206
- interface Qwen2_5_Coder_32B_Instruct_Messages {
5670
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode {
5671
+ type?: "json_object" | "json_schema";
5672
+ json_schema?: unknown;
5673
+ }
5674
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages {
5207
5675
  /**
5208
5676
  * An array of message objects representing the conversation history.
5209
5677
  */
@@ -5311,7 +5779,7 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
5311
5779
  };
5312
5780
  }
5313
5781
  )[];
5314
- response_format?: JSONMode;
5782
+ response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1;
5315
5783
  /**
5316
5784
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
5317
5785
  */
@@ -5353,6 +5821,10 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
5353
5821
  */
5354
5822
  presence_penalty?: number;
5355
5823
  }
5824
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1 {
5825
+ type?: "json_object" | "json_schema";
5826
+ json_schema?: unknown;
5827
+ }
5356
5828
  type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output = {
5357
5829
  /**
5358
5830
  * The generated text response from the model
@@ -5393,8 +5865,10 @@ declare abstract class Base_Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct {
5393
5865
  inputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input;
5394
5866
  postProcessedOutputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output;
5395
5867
  }
5396
- type Ai_Cf_Qwen_Qwq_32B_Input = Qwen_Qwq_32B_Prompt | Qwen_Qwq_32B_Messages;
5397
- interface Qwen_Qwq_32B_Prompt {
5868
+ type Ai_Cf_Qwen_Qwq_32B_Input =
5869
+ | Ai_Cf_Qwen_Qwq_32B_Prompt
5870
+ | Ai_Cf_Qwen_Qwq_32B_Messages;
5871
+ interface Ai_Cf_Qwen_Qwq_32B_Prompt {
5398
5872
  /**
5399
5873
  * The input text prompt for the model to generate a response.
5400
5874
  */
@@ -5444,7 +5918,7 @@ interface Qwen_Qwq_32B_Prompt {
5444
5918
  */
5445
5919
  presence_penalty?: number;
5446
5920
  }
5447
- interface Qwen_Qwq_32B_Messages {
5921
+ interface Ai_Cf_Qwen_Qwq_32B_Messages {
5448
5922
  /**
5449
5923
  * An array of message objects representing the conversation history.
5450
5924
  */
@@ -5666,9 +6140,9 @@ declare abstract class Base_Ai_Cf_Qwen_Qwq_32B {
5666
6140
  postProcessedOutputs: Ai_Cf_Qwen_Qwq_32B_Output;
5667
6141
  }
5668
6142
  type Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Input =
5669
- | Mistral_Small_3_1_24B_Instruct_Prompt
5670
- | Mistral_Small_3_1_24B_Instruct_Messages;
5671
- interface Mistral_Small_3_1_24B_Instruct_Prompt {
6143
+ | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt
6144
+ | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages;
6145
+ interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt {
5672
6146
  /**
5673
6147
  * The input text prompt for the model to generate a response.
5674
6148
  */
@@ -5718,7 +6192,7 @@ interface Mistral_Small_3_1_24B_Instruct_Prompt {
5718
6192
  */
5719
6193
  presence_penalty?: number;
5720
6194
  }
5721
- interface Mistral_Small_3_1_24B_Instruct_Messages {
6195
+ interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages {
5722
6196
  /**
5723
6197
  * An array of message objects representing the conversation history.
5724
6198
  */
@@ -5940,9 +6414,9 @@ declare abstract class Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct {
5940
6414
  postProcessedOutputs: Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Output;
5941
6415
  }
5942
6416
  type Ai_Cf_Google_Gemma_3_12B_It_Input =
5943
- | Google_Gemma_3_12B_It_Prompt
5944
- | Google_Gemma_3_12B_It_Messages;
5945
- interface Google_Gemma_3_12B_It_Prompt {
6417
+ | Ai_Cf_Google_Gemma_3_12B_It_Prompt
6418
+ | Ai_Cf_Google_Gemma_3_12B_It_Messages;
6419
+ interface Ai_Cf_Google_Gemma_3_12B_It_Prompt {
5946
6420
  /**
5947
6421
  * The input text prompt for the model to generate a response.
5948
6422
  */
@@ -5992,7 +6466,7 @@ interface Google_Gemma_3_12B_It_Prompt {
5992
6466
  */
5993
6467
  presence_penalty?: number;
5994
6468
  }
5995
- interface Google_Gemma_3_12B_It_Messages {
6469
+ interface Ai_Cf_Google_Gemma_3_12B_It_Messages {
5996
6470
  /**
5997
6471
  * An array of message objects representing the conversation history.
5998
6472
  */
@@ -6015,20 +6489,7 @@ interface Google_Gemma_3_12B_It_Messages {
6015
6489
  */
6016
6490
  url?: string;
6017
6491
  };
6018
- }[]
6019
- | {
6020
- /**
6021
- * Type of the content provided
6022
- */
6023
- type?: string;
6024
- text?: string;
6025
- image_url?: {
6026
- /**
6027
- * image uri with data (e.g. data:image/jpeg;base64,/9j/...). HTTP URL will not be accepted
6028
- */
6029
- url?: string;
6030
- };
6031
- };
6492
+ }[];
6032
6493
  }[];
6033
6494
  functions?: {
6034
6495
  name: string;
@@ -6210,10 +6671,10 @@ declare abstract class Base_Ai_Cf_Google_Gemma_3_12B_It {
6210
6671
  postProcessedOutputs: Ai_Cf_Google_Gemma_3_12B_It_Output;
6211
6672
  }
6212
6673
  type Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input =
6213
- | Ai_Cf_Meta_Llama_4_Prompt
6214
- | Ai_Cf_Meta_Llama_4_Messages
6215
- | Ai_Cf_Meta_Llama_4_Async_Batch;
6216
- interface Ai_Cf_Meta_Llama_4_Prompt {
6674
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt
6675
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages
6676
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch;
6677
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt {
6217
6678
  /**
6218
6679
  * The input text prompt for the model to generate a response.
6219
6680
  */
@@ -6222,7 +6683,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
6222
6683
  * JSON schema that should be fulfilled for the response.
6223
6684
  */
6224
6685
  guided_json?: object;
6225
- response_format?: JSONMode;
6686
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6226
6687
  /**
6227
6688
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6228
6689
  */
@@ -6264,7 +6725,11 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
6264
6725
  */
6265
6726
  presence_penalty?: number;
6266
6727
  }
6267
- interface Ai_Cf_Meta_Llama_4_Messages {
6728
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode {
6729
+ type?: "json_object" | "json_schema";
6730
+ json_schema?: unknown;
6731
+ }
6732
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages {
6268
6733
  /**
6269
6734
  * An array of message objects representing the conversation history.
6270
6735
  */
@@ -6400,7 +6865,7 @@ interface Ai_Cf_Meta_Llama_4_Messages {
6400
6865
  };
6401
6866
  }
6402
6867
  )[];
6403
- response_format?: JSONMode;
6868
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6404
6869
  /**
6405
6870
  * JSON schema that should be fulfilled for the response.
6406
6871
  */
@@ -6446,13 +6911,13 @@ interface Ai_Cf_Meta_Llama_4_Messages {
6446
6911
  */
6447
6912
  presence_penalty?: number;
6448
6913
  }
6449
- interface Ai_Cf_Meta_Llama_4_Async_Batch {
6914
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch {
6450
6915
  requests: (
6451
- | Ai_Cf_Meta_Llama_4_Prompt_Inner
6452
- | Ai_Cf_Meta_Llama_4_Messages_Inner
6916
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner
6917
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner
6453
6918
  )[];
6454
6919
  }
6455
- interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
6920
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner {
6456
6921
  /**
6457
6922
  * The input text prompt for the model to generate a response.
6458
6923
  */
@@ -6461,7 +6926,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
6461
6926
  * JSON schema that should be fulfilled for the response.
6462
6927
  */
6463
6928
  guided_json?: object;
6464
- response_format?: JSONMode;
6929
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6465
6930
  /**
6466
6931
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6467
6932
  */
@@ -6503,7 +6968,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
6503
6968
  */
6504
6969
  presence_penalty?: number;
6505
6970
  }
6506
- interface Ai_Cf_Meta_Llama_4_Messages_Inner {
6971
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner {
6507
6972
  /**
6508
6973
  * An array of message objects representing the conversation history.
6509
6974
  */
@@ -6639,7 +7104,7 @@ interface Ai_Cf_Meta_Llama_4_Messages_Inner {
6639
7104
  };
6640
7105
  }
6641
7106
  )[];
6642
- response_format?: JSONMode;
7107
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6643
7108
  /**
6644
7109
  * JSON schema that should be fulfilled for the response.
6645
7110
  */
@@ -6738,414 +7203,1813 @@ declare abstract class Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct {
6738
7203
  inputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input;
6739
7204
  postProcessedOutputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Output;
6740
7205
  }
6741
- interface Ai_Cf_Deepgram_Nova_3_Input {
6742
- audio: {
6743
- body: object;
6744
- contentType: string;
6745
- };
6746
- /**
6747
- * Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param.
6748
- */
6749
- custom_topic_mode?: "extended" | "strict";
6750
- /**
6751
- * Custom topics you want the model to detect within your input audio or text if present Submit up to 100
6752
- */
6753
- custom_topic?: string;
6754
- /**
6755
- * Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition those submitted using the custom_intents param
6756
- */
6757
- custom_intent_mode?: "extended" | "strict";
6758
- /**
6759
- * Custom intents you want the model to detect within your input audio if present
6760
- */
6761
- custom_intent?: string;
6762
- /**
6763
- * Identifies and extracts key entities from content in submitted audio
6764
- */
6765
- detect_entities?: boolean;
6766
- /**
6767
- * Identifies the dominant language spoken in submitted audio
6768
- */
6769
- detect_language?: boolean;
6770
- /**
6771
- * Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0
6772
- */
6773
- diarize?: boolean;
7206
+ type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input =
7207
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt
7208
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages
7209
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch;
7210
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt {
6774
7211
  /**
6775
- * Identify and extract key entities from content in submitted audio
7212
+ * The input text prompt for the model to generate a response.
6776
7213
  */
6777
- dictation?: boolean;
7214
+ prompt: string;
6778
7215
  /**
6779
- * Specify the expected encoding of your submitted audio
7216
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
6780
7217
  */
6781
- encoding?:
6782
- | "linear16"
6783
- | "flac"
6784
- | "mulaw"
6785
- | "amr-nb"
6786
- | "amr-wb"
6787
- | "opus"
6788
- | "speex"
6789
- | "g729";
7218
+ lora?: string;
7219
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode;
6790
7220
  /**
6791
- * Arbitrary key-value pairs that are attached to the API response for usage in downstream processing
7221
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6792
7222
  */
6793
- extra?: string;
7223
+ raw?: boolean;
6794
7224
  /**
6795
- * Filler Words can help transcribe interruptions in your audio, like 'uh' and 'um'
7225
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
6796
7226
  */
6797
- filler_words?: boolean;
7227
+ stream?: boolean;
6798
7228
  /**
6799
- * Key term prompting can boost or suppress specialized terminology and brands.
7229
+ * The maximum number of tokens to generate in the response.
6800
7230
  */
6801
- keyterm?: string;
7231
+ max_tokens?: number;
6802
7232
  /**
6803
- * Keywords can boost or suppress specialized terminology and brands.
7233
+ * Controls the randomness of the output; higher values produce more random results.
6804
7234
  */
6805
- keywords?: string;
7235
+ temperature?: number;
6806
7236
  /**
6807
- * The BCP-47 language tag that hints at the primary spoken language. Depending on the Model and API endpoint you choose only certain languages are available.
7237
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
6808
7238
  */
6809
- language?: string;
7239
+ top_p?: number;
6810
7240
  /**
6811
- * Spoken measurements will be converted to their corresponding abbreviations.
7241
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
6812
7242
  */
6813
- measurements?: boolean;
7243
+ top_k?: number;
6814
7244
  /**
6815
- * Opts out requests from the Deepgram Model Improvement Program. Refer to our Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip.
7245
+ * Random seed for reproducibility of the generation.
6816
7246
  */
6817
- mip_opt_out?: boolean;
7247
+ seed?: number;
6818
7248
  /**
6819
- * Mode of operation for the model representing broad area of topic that will be talked about in the supplied audio
7249
+ * Penalty for repeated tokens; higher values discourage repetition.
6820
7250
  */
6821
- mode?: "general" | "medical" | "finance";
7251
+ repetition_penalty?: number;
6822
7252
  /**
6823
- * Transcribe each audio channel independently.
7253
+ * Decreases the likelihood of the model repeating the same lines verbatim.
6824
7254
  */
6825
- multichannel?: boolean;
7255
+ frequency_penalty?: number;
6826
7256
  /**
6827
- * Numerals converts numbers from written format to numerical format.
7257
+ * Increases the likelihood of the model introducing new topics.
6828
7258
  */
6829
- numerals?: boolean;
7259
+ presence_penalty?: number;
7260
+ }
7261
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode {
7262
+ type?: "json_object" | "json_schema";
7263
+ json_schema?: unknown;
7264
+ }
7265
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages {
6830
7266
  /**
6831
- * Splits audio into paragraphs to improve transcript readability.
7267
+ * An array of message objects representing the conversation history.
6832
7268
  */
6833
- paragraphs?: boolean;
7269
+ messages: {
7270
+ /**
7271
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
7272
+ */
7273
+ role: string;
7274
+ /**
7275
+ * The content of the message as a string.
7276
+ */
7277
+ content: string;
7278
+ }[];
7279
+ functions?: {
7280
+ name: string;
7281
+ code: string;
7282
+ }[];
6834
7283
  /**
6835
- * Profanity Filter looks for recognized profanity and converts it to the nearest recognized non-profane word or removes it from the transcript completely.
7284
+ * A list of tools available for the assistant to use.
7285
+ */
7286
+ tools?: (
7287
+ | {
7288
+ /**
7289
+ * The name of the tool. More descriptive the better.
7290
+ */
7291
+ name: string;
7292
+ /**
7293
+ * A brief description of what the tool does.
7294
+ */
7295
+ description: string;
7296
+ /**
7297
+ * Schema defining the parameters accepted by the tool.
7298
+ */
7299
+ parameters: {
7300
+ /**
7301
+ * The type of the parameters object (usually 'object').
7302
+ */
7303
+ type: string;
7304
+ /**
7305
+ * List of required parameter names.
7306
+ */
7307
+ required?: string[];
7308
+ /**
7309
+ * Definitions of each parameter.
7310
+ */
7311
+ properties: {
7312
+ [k: string]: {
7313
+ /**
7314
+ * The data type of the parameter.
7315
+ */
7316
+ type: string;
7317
+ /**
7318
+ * A description of the expected parameter.
7319
+ */
7320
+ description: string;
7321
+ };
7322
+ };
7323
+ };
7324
+ }
7325
+ | {
7326
+ /**
7327
+ * Specifies the type of tool (e.g., 'function').
7328
+ */
7329
+ type: string;
7330
+ /**
7331
+ * Details of the function tool.
7332
+ */
7333
+ function: {
7334
+ /**
7335
+ * The name of the function.
7336
+ */
7337
+ name: string;
7338
+ /**
7339
+ * A brief description of what the function does.
7340
+ */
7341
+ description: string;
7342
+ /**
7343
+ * Schema defining the parameters accepted by the function.
7344
+ */
7345
+ parameters: {
7346
+ /**
7347
+ * The type of the parameters object (usually 'object').
7348
+ */
7349
+ type: string;
7350
+ /**
7351
+ * List of required parameter names.
7352
+ */
7353
+ required?: string[];
7354
+ /**
7355
+ * Definitions of each parameter.
7356
+ */
7357
+ properties: {
7358
+ [k: string]: {
7359
+ /**
7360
+ * The data type of the parameter.
7361
+ */
7362
+ type: string;
7363
+ /**
7364
+ * A description of the expected parameter.
7365
+ */
7366
+ description: string;
7367
+ };
7368
+ };
7369
+ };
7370
+ };
7371
+ }
7372
+ )[];
7373
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1;
7374
+ /**
7375
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
7376
+ */
7377
+ raw?: boolean;
7378
+ /**
7379
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
7380
+ */
7381
+ stream?: boolean;
7382
+ /**
7383
+ * The maximum number of tokens to generate in the response.
7384
+ */
7385
+ max_tokens?: number;
7386
+ /**
7387
+ * Controls the randomness of the output; higher values produce more random results.
7388
+ */
7389
+ temperature?: number;
7390
+ /**
7391
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
7392
+ */
7393
+ top_p?: number;
7394
+ /**
7395
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
7396
+ */
7397
+ top_k?: number;
7398
+ /**
7399
+ * Random seed for reproducibility of the generation.
7400
+ */
7401
+ seed?: number;
7402
+ /**
7403
+ * Penalty for repeated tokens; higher values discourage repetition.
7404
+ */
7405
+ repetition_penalty?: number;
7406
+ /**
7407
+ * Decreases the likelihood of the model repeating the same lines verbatim.
7408
+ */
7409
+ frequency_penalty?: number;
7410
+ /**
7411
+ * Increases the likelihood of the model introducing new topics.
7412
+ */
7413
+ presence_penalty?: number;
7414
+ }
7415
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1 {
7416
+ type?: "json_object" | "json_schema";
7417
+ json_schema?: unknown;
7418
+ }
7419
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch {
7420
+ requests: (
7421
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1
7422
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1
7423
+ )[];
7424
+ }
7425
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1 {
7426
+ /**
7427
+ * The input text prompt for the model to generate a response.
7428
+ */
7429
+ prompt: string;
7430
+ /**
7431
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
7432
+ */
7433
+ lora?: string;
7434
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2;
7435
+ /**
7436
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
7437
+ */
7438
+ raw?: boolean;
7439
+ /**
7440
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
7441
+ */
7442
+ stream?: boolean;
7443
+ /**
7444
+ * The maximum number of tokens to generate in the response.
7445
+ */
7446
+ max_tokens?: number;
7447
+ /**
7448
+ * Controls the randomness of the output; higher values produce more random results.
7449
+ */
7450
+ temperature?: number;
7451
+ /**
7452
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
7453
+ */
7454
+ top_p?: number;
7455
+ /**
7456
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
7457
+ */
7458
+ top_k?: number;
7459
+ /**
7460
+ * Random seed for reproducibility of the generation.
7461
+ */
7462
+ seed?: number;
7463
+ /**
7464
+ * Penalty for repeated tokens; higher values discourage repetition.
7465
+ */
7466
+ repetition_penalty?: number;
7467
+ /**
7468
+ * Decreases the likelihood of the model repeating the same lines verbatim.
7469
+ */
7470
+ frequency_penalty?: number;
7471
+ /**
7472
+ * Increases the likelihood of the model introducing new topics.
7473
+ */
7474
+ presence_penalty?: number;
7475
+ }
7476
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2 {
7477
+ type?: "json_object" | "json_schema";
7478
+ json_schema?: unknown;
7479
+ }
7480
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1 {
7481
+ /**
7482
+ * An array of message objects representing the conversation history.
7483
+ */
7484
+ messages: {
7485
+ /**
7486
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
7487
+ */
7488
+ role: string;
7489
+ /**
7490
+ * The content of the message as a string.
7491
+ */
7492
+ content: string;
7493
+ }[];
7494
+ functions?: {
7495
+ name: string;
7496
+ code: string;
7497
+ }[];
7498
+ /**
7499
+ * A list of tools available for the assistant to use.
7500
+ */
7501
+ tools?: (
7502
+ | {
7503
+ /**
7504
+ * The name of the tool. More descriptive the better.
7505
+ */
7506
+ name: string;
7507
+ /**
7508
+ * A brief description of what the tool does.
7509
+ */
7510
+ description: string;
7511
+ /**
7512
+ * Schema defining the parameters accepted by the tool.
7513
+ */
7514
+ parameters: {
7515
+ /**
7516
+ * The type of the parameters object (usually 'object').
7517
+ */
7518
+ type: string;
7519
+ /**
7520
+ * List of required parameter names.
7521
+ */
7522
+ required?: string[];
7523
+ /**
7524
+ * Definitions of each parameter.
7525
+ */
7526
+ properties: {
7527
+ [k: string]: {
7528
+ /**
7529
+ * The data type of the parameter.
7530
+ */
7531
+ type: string;
7532
+ /**
7533
+ * A description of the expected parameter.
7534
+ */
7535
+ description: string;
7536
+ };
7537
+ };
7538
+ };
7539
+ }
7540
+ | {
7541
+ /**
7542
+ * Specifies the type of tool (e.g., 'function').
7543
+ */
7544
+ type: string;
7545
+ /**
7546
+ * Details of the function tool.
7547
+ */
7548
+ function: {
7549
+ /**
7550
+ * The name of the function.
7551
+ */
7552
+ name: string;
7553
+ /**
7554
+ * A brief description of what the function does.
7555
+ */
7556
+ description: string;
7557
+ /**
7558
+ * Schema defining the parameters accepted by the function.
7559
+ */
7560
+ parameters: {
7561
+ /**
7562
+ * The type of the parameters object (usually 'object').
7563
+ */
7564
+ type: string;
7565
+ /**
7566
+ * List of required parameter names.
7567
+ */
7568
+ required?: string[];
7569
+ /**
7570
+ * Definitions of each parameter.
7571
+ */
7572
+ properties: {
7573
+ [k: string]: {
7574
+ /**
7575
+ * The data type of the parameter.
7576
+ */
7577
+ type: string;
7578
+ /**
7579
+ * A description of the expected parameter.
7580
+ */
7581
+ description: string;
7582
+ };
7583
+ };
7584
+ };
7585
+ };
7586
+ }
7587
+ )[];
7588
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3;
7589
+ /**
7590
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
7591
+ */
7592
+ raw?: boolean;
7593
+ /**
7594
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
7595
+ */
7596
+ stream?: boolean;
7597
+ /**
7598
+ * The maximum number of tokens to generate in the response.
7599
+ */
7600
+ max_tokens?: number;
7601
+ /**
7602
+ * Controls the randomness of the output; higher values produce more random results.
7603
+ */
7604
+ temperature?: number;
7605
+ /**
7606
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
7607
+ */
7608
+ top_p?: number;
7609
+ /**
7610
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
7611
+ */
7612
+ top_k?: number;
7613
+ /**
7614
+ * Random seed for reproducibility of the generation.
7615
+ */
7616
+ seed?: number;
7617
+ /**
7618
+ * Penalty for repeated tokens; higher values discourage repetition.
7619
+ */
7620
+ repetition_penalty?: number;
7621
+ /**
7622
+ * Decreases the likelihood of the model repeating the same lines verbatim.
7623
+ */
7624
+ frequency_penalty?: number;
7625
+ /**
7626
+ * Increases the likelihood of the model introducing new topics.
7627
+ */
7628
+ presence_penalty?: number;
7629
+ }
7630
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3 {
7631
+ type?: "json_object" | "json_schema";
7632
+ json_schema?: unknown;
7633
+ }
7634
+ type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output =
7635
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response
7636
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response
7637
+ | string
7638
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse;
7639
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response {
7640
+ /**
7641
+ * Unique identifier for the completion
7642
+ */
7643
+ id?: string;
7644
+ /**
7645
+ * Object type identifier
7646
+ */
7647
+ object?: "chat.completion";
7648
+ /**
7649
+ * Unix timestamp of when the completion was created
7650
+ */
7651
+ created?: number;
7652
+ /**
7653
+ * Model used for the completion
7654
+ */
7655
+ model?: string;
7656
+ /**
7657
+ * List of completion choices
7658
+ */
7659
+ choices?: {
7660
+ /**
7661
+ * Index of the choice in the list
7662
+ */
7663
+ index?: number;
7664
+ /**
7665
+ * The message generated by the model
7666
+ */
7667
+ message?: {
7668
+ /**
7669
+ * Role of the message author
7670
+ */
7671
+ role: string;
7672
+ /**
7673
+ * The content of the message
7674
+ */
7675
+ content: string;
7676
+ /**
7677
+ * Internal reasoning content (if available)
7678
+ */
7679
+ reasoning_content?: string;
7680
+ /**
7681
+ * Tool calls made by the assistant
7682
+ */
7683
+ tool_calls?: {
7684
+ /**
7685
+ * Unique identifier for the tool call
7686
+ */
7687
+ id: string;
7688
+ /**
7689
+ * Type of tool call
7690
+ */
7691
+ type: "function";
7692
+ function: {
7693
+ /**
7694
+ * Name of the function to call
7695
+ */
7696
+ name: string;
7697
+ /**
7698
+ * JSON string of arguments for the function
7699
+ */
7700
+ arguments: string;
7701
+ };
7702
+ }[];
7703
+ };
7704
+ /**
7705
+ * Reason why the model stopped generating
7706
+ */
7707
+ finish_reason?: string;
7708
+ /**
7709
+ * Stop reason (may be null)
7710
+ */
7711
+ stop_reason?: string | null;
7712
+ /**
7713
+ * Log probabilities (if requested)
7714
+ */
7715
+ logprobs?: {} | null;
7716
+ }[];
7717
+ /**
7718
+ * Usage statistics for the inference request
7719
+ */
7720
+ usage?: {
7721
+ /**
7722
+ * Total number of tokens in input
7723
+ */
7724
+ prompt_tokens?: number;
7725
+ /**
7726
+ * Total number of tokens in output
7727
+ */
7728
+ completion_tokens?: number;
7729
+ /**
7730
+ * Total number of input and output tokens
7731
+ */
7732
+ total_tokens?: number;
7733
+ };
7734
+ /**
7735
+ * Log probabilities for the prompt (if requested)
7736
+ */
7737
+ prompt_logprobs?: {} | null;
7738
+ }
7739
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response {
7740
+ /**
7741
+ * Unique identifier for the completion
7742
+ */
7743
+ id?: string;
7744
+ /**
7745
+ * Object type identifier
7746
+ */
7747
+ object?: "text_completion";
7748
+ /**
7749
+ * Unix timestamp of when the completion was created
7750
+ */
7751
+ created?: number;
7752
+ /**
7753
+ * Model used for the completion
7754
+ */
7755
+ model?: string;
7756
+ /**
7757
+ * List of completion choices
7758
+ */
7759
+ choices?: {
7760
+ /**
7761
+ * Index of the choice in the list
7762
+ */
7763
+ index: number;
7764
+ /**
7765
+ * The generated text completion
7766
+ */
7767
+ text: string;
7768
+ /**
7769
+ * Reason why the model stopped generating
7770
+ */
7771
+ finish_reason: string;
7772
+ /**
7773
+ * Stop reason (may be null)
7774
+ */
7775
+ stop_reason?: string | null;
7776
+ /**
7777
+ * Log probabilities (if requested)
7778
+ */
7779
+ logprobs?: {} | null;
7780
+ /**
7781
+ * Log probabilities for the prompt (if requested)
7782
+ */
7783
+ prompt_logprobs?: {} | null;
7784
+ }[];
7785
+ /**
7786
+ * Usage statistics for the inference request
7787
+ */
7788
+ usage?: {
7789
+ /**
7790
+ * Total number of tokens in input
7791
+ */
7792
+ prompt_tokens?: number;
7793
+ /**
7794
+ * Total number of tokens in output
7795
+ */
7796
+ completion_tokens?: number;
7797
+ /**
7798
+ * Total number of input and output tokens
7799
+ */
7800
+ total_tokens?: number;
7801
+ };
7802
+ }
7803
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse {
7804
+ /**
7805
+ * The async request id that can be used to obtain the results.
7806
+ */
7807
+ request_id?: string;
7808
+ }
7809
+ declare abstract class Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8 {
7810
+ inputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input;
7811
+ postProcessedOutputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output;
7812
+ }
7813
+ interface Ai_Cf_Deepgram_Nova_3_Input {
7814
+ audio: {
7815
+ body: object;
7816
+ contentType: string;
7817
+ };
7818
+ /**
7819
+ * Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param.
7820
+ */
7821
+ custom_topic_mode?: "extended" | "strict";
7822
+ /**
7823
+ * Custom topics you want the model to detect within your input audio or text if present. Submit up to 100.
7824
+ */
7825
+ custom_topic?: string;
7826
+ /**
7827
+ * Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition to those submitted using the custom_intent param.
7828
+ */
7829
+ custom_intent_mode?: "extended" | "strict";
7830
+ /**
7831
+ * Custom intents you want the model to detect within your input audio if present
7832
+ */
7833
+ custom_intent?: string;
7834
+ /**
7835
+ * Identifies and extracts key entities from content in submitted audio
7836
+ */
7837
+ detect_entities?: boolean;
7838
+ /**
7839
+ * Identifies the dominant language spoken in submitted audio
7840
+ */
7841
+ detect_language?: boolean;
7842
+ /**
7843
+ * Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0
7844
+ */
7845
+ diarize?: boolean;
7846
+ /**
7847
+ * Identify and extract key entities from content in submitted audio
7848
+ */
7849
+ dictation?: boolean;
7850
+ /**
7851
+ * Specify the expected encoding of your submitted audio
7852
+ */
7853
+ encoding?:
7854
+ | "linear16"
7855
+ | "flac"
7856
+ | "mulaw"
7857
+ | "amr-nb"
7858
+ | "amr-wb"
7859
+ | "opus"
7860
+ | "speex"
7861
+ | "g729";
7862
+ /**
7863
+ * Arbitrary key-value pairs that are attached to the API response for usage in downstream processing
7864
+ */
7865
+ extra?: string;
7866
+ /**
7867
+ * Filler Words can help transcribe interruptions in your audio, like 'uh' and 'um'
7868
+ */
7869
+ filler_words?: boolean;
7870
+ /**
7871
+ * Key term prompting can boost or suppress specialized terminology and brands.
7872
+ */
7873
+ keyterm?: string;
7874
+ /**
7875
+ * Keywords can boost or suppress specialized terminology and brands.
7876
+ */
7877
+ keywords?: string;
7878
+ /**
7879
+ * The BCP-47 language tag that hints at the primary spoken language. Depending on the Model and API endpoint you choose only certain languages are available.
7880
+ */
7881
+ language?: string;
7882
+ /**
7883
+ * Spoken measurements will be converted to their corresponding abbreviations.
7884
+ */
7885
+ measurements?: boolean;
7886
+ /**
7887
+ * Opts out requests from the Deepgram Model Improvement Program. Refer to our Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip.
7888
+ */
7889
+ mip_opt_out?: boolean;
7890
+ /**
7891
+ * Mode of operation for the model representing broad area of topic that will be talked about in the supplied audio
7892
+ */
7893
+ mode?: "general" | "medical" | "finance";
7894
+ /**
7895
+ * Transcribe each audio channel independently.
7896
+ */
7897
+ multichannel?: boolean;
7898
+ /**
7899
+ * Numerals converts numbers from written format to numerical format.
7900
+ */
7901
+ numerals?: boolean;
7902
+ /**
7903
+ * Splits audio into paragraphs to improve transcript readability.
7904
+ */
7905
+ paragraphs?: boolean;
7906
+ /**
7907
+ * Profanity Filter looks for recognized profanity and converts it to the nearest recognized non-profane word or removes it from the transcript completely.
6836
7908
  */
6837
7909
  profanity_filter?: boolean;
6838
7910
  /**
6839
- * Add punctuation and capitalization to the transcript.
7911
+ * Add punctuation and capitalization to the transcript.
7912
+ */
7913
+ punctuate?: boolean;
7914
+ /**
7915
+ * Redaction removes sensitive information from your transcripts.
7916
+ */
7917
+ redact?: string;
7918
+ /**
7919
+ * Search for terms or phrases in submitted audio and replaces them.
7920
+ */
7921
+ replace?: string;
7922
+ /**
7923
+ * Search for terms or phrases in submitted audio.
7924
+ */
7925
+ search?: string;
7926
+ /**
7927
+ * Recognizes the sentiment throughout a transcript or text.
7928
+ */
7929
+ sentiment?: boolean;
7930
+ /**
7931
+ * Apply formatting to transcript output. When set to true, additional formatting will be applied to transcripts to improve readability.
7932
+ */
7933
+ smart_format?: boolean;
7934
+ /**
7935
+ * Detect topics throughout a transcript or text.
7936
+ */
7937
+ topics?: boolean;
7938
+ /**
7939
+ * Segments speech into meaningful semantic units.
7940
+ */
7941
+ utterances?: boolean;
7942
+ /**
7943
+ * Seconds to wait before detecting a pause between words in submitted audio.
7944
+ */
7945
+ utt_split?: number;
7946
+ /**
7947
+ * The number of channels in the submitted audio
7948
+ */
7949
+ channels?: number;
7950
+ /**
7951
+ * Specifies whether the streaming endpoint should provide ongoing transcription updates as more audio is received. When set to true, the endpoint sends continuous updates, meaning transcription results may evolve over time. Note: Supported only for websockets.
7952
+ */
7953
+ interim_results?: boolean;
7954
+ /**
7955
+ * Indicates how long model will wait to detect whether a speaker has finished speaking or pauses for a significant period of time. When set to a value, the streaming endpoint immediately finalizes the transcription for the processed time range and returns the transcript with a speech_final parameter set to true. Can also be set to false to disable endpointing
7956
+ */
7957
+ endpointing?: string;
7958
+ /**
7959
+ * Indicates that speech has started. You'll begin receiving Speech Started messages upon speech starting. Note: Supported only for websockets.
7960
+ */
7961
+ vad_events?: boolean;
7962
+ /**
7963
+ * Indicates how long the model will wait to send an UtteranceEnd message after a word has been transcribed. Use with interim_results. Note: Supported only for websockets.
7964
+ */
7965
+ utterance_end_ms?: boolean;
7966
+ }
7967
+ interface Ai_Cf_Deepgram_Nova_3_Output {
7968
+ results?: {
7969
+ channels?: {
7970
+ alternatives?: {
7971
+ confidence?: number;
7972
+ transcript?: string;
7973
+ words?: {
7974
+ confidence?: number;
7975
+ end?: number;
7976
+ start?: number;
7977
+ word?: string;
7978
+ }[];
7979
+ }[];
7980
+ }[];
7981
+ summary?: {
7982
+ result?: string;
7983
+ short?: string;
7984
+ };
7985
+ sentiments?: {
7986
+ segments?: {
7987
+ text?: string;
7988
+ start_word?: number;
7989
+ end_word?: number;
7990
+ sentiment?: string;
7991
+ sentiment_score?: number;
7992
+ }[];
7993
+ average?: {
7994
+ sentiment?: string;
7995
+ sentiment_score?: number;
7996
+ };
7997
+ };
7998
+ };
7999
+ }
8000
+ declare abstract class Base_Ai_Cf_Deepgram_Nova_3 {
8001
+ inputs: Ai_Cf_Deepgram_Nova_3_Input;
8002
+ postProcessedOutputs: Ai_Cf_Deepgram_Nova_3_Output;
8003
+ }
8004
+ interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input {
8005
+ queries?: string | string[];
8006
+ /**
8007
+ * Optional instruction for the task
8008
+ */
8009
+ instruction?: string;
8010
+ documents?: string | string[];
8011
+ text?: string | string[];
8012
+ }
8013
+ interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output {
8014
+ data?: number[][];
8015
+ shape?: number[];
8016
+ }
8017
+ declare abstract class Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B {
8018
+ inputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input;
8019
+ postProcessedOutputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output;
8020
+ }
8021
+ type Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input =
8022
+ | {
8023
+ /**
8024
+ * readable stream with audio data and content-type specified for that data
8025
+ */
8026
+ audio: {
8027
+ body: object;
8028
+ contentType: string;
8029
+ };
8030
+ /**
8031
+ * type of PCM data that's sent to the inference server as a raw array
8032
+ */
8033
+ dtype?: "uint8" | "float32" | "float64";
8034
+ }
8035
+ | {
8036
+ /**
8037
+ * base64 encoded audio data
8038
+ */
8039
+ audio: string;
8040
+ /**
8041
+ * type of PCM data that's sent to the inference server as a raw array
8042
+ */
8043
+ dtype?: "uint8" | "float32" | "float64";
8044
+ };
8045
+ interface Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output {
8046
+ /**
8047
+ * if true, end-of-turn was detected
8048
+ */
8049
+ is_complete?: boolean;
8050
+ /**
8051
+ * probability of the end-of-turn detection
8052
+ */
8053
+ probability?: number;
8054
+ }
8055
+ declare abstract class Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2 {
8056
+ inputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input;
8057
+ postProcessedOutputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output;
8058
+ }
8059
+ declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_120B {
8060
+ inputs: ResponsesInput;
8061
+ postProcessedOutputs: ResponsesOutput;
8062
+ }
8063
+ declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_20B {
8064
+ inputs: ResponsesInput;
8065
+ postProcessedOutputs: ResponsesOutput;
8066
+ }
8067
+ interface Ai_Cf_Leonardo_Phoenix_1_0_Input {
8068
+ /**
8069
+ * A text description of the image you want to generate.
8070
+ */
8071
+ prompt: string;
8072
+ /**
8073
+ * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
8074
+ */
8075
+ guidance?: number;
8076
+ /**
8077
+ * Random seed for reproducibility of the image generation
8078
+ */
8079
+ seed?: number;
8080
+ /**
8081
+ * The height of the generated image in pixels
8082
+ */
8083
+ height?: number;
8084
+ /**
8085
+ * The width of the generated image in pixels
8086
+ */
8087
+ width?: number;
8088
+ /**
8089
+ * The number of diffusion steps; higher values can improve quality but take longer
8090
+ */
8091
+ num_steps?: number;
8092
+ /**
8093
+ * Specify what to exclude from the generated images
8094
+ */
8095
+ negative_prompt?: string;
8096
+ }
8097
+ /**
8098
+ * The generated image in JPEG format
8099
+ */
8100
+ type Ai_Cf_Leonardo_Phoenix_1_0_Output = string;
8101
+ declare abstract class Base_Ai_Cf_Leonardo_Phoenix_1_0 {
8102
+ inputs: Ai_Cf_Leonardo_Phoenix_1_0_Input;
8103
+ postProcessedOutputs: Ai_Cf_Leonardo_Phoenix_1_0_Output;
8104
+ }
8105
+ interface Ai_Cf_Leonardo_Lucid_Origin_Input {
8106
+ /**
8107
+ * A text description of the image you want to generate.
8108
+ */
8109
+ prompt: string;
8110
+ /**
8111
+ * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
8112
+ */
8113
+ guidance?: number;
8114
+ /**
8115
+ * Random seed for reproducibility of the image generation
8116
+ */
8117
+ seed?: number;
8118
+ /**
8119
+ * The height of the generated image in pixels
8120
+ */
8121
+ height?: number;
8122
+ /**
8123
+ * The width of the generated image in pixels
8124
+ */
8125
+ width?: number;
8126
+ /**
8127
+ * The number of diffusion steps; higher values can improve quality but take longer
8128
+ */
8129
+ num_steps?: number;
8130
+ /**
8131
+ * The number of diffusion steps; higher values can improve quality but take longer
8132
+ */
8133
+ steps?: number;
8134
+ }
8135
+ interface Ai_Cf_Leonardo_Lucid_Origin_Output {
8136
+ /**
8137
+ * The generated image in Base64 format.
8138
+ */
8139
+ image?: string;
8140
+ }
8141
+ declare abstract class Base_Ai_Cf_Leonardo_Lucid_Origin {
8142
+ inputs: Ai_Cf_Leonardo_Lucid_Origin_Input;
8143
+ postProcessedOutputs: Ai_Cf_Leonardo_Lucid_Origin_Output;
8144
+ }
8145
+ interface Ai_Cf_Deepgram_Aura_1_Input {
8146
+ /**
8147
+ * Speaker used to produce the audio.
8148
+ */
8149
+ speaker?:
8150
+ | "angus"
8151
+ | "asteria"
8152
+ | "arcas"
8153
+ | "orion"
8154
+ | "orpheus"
8155
+ | "athena"
8156
+ | "luna"
8157
+ | "zeus"
8158
+ | "perseus"
8159
+ | "helios"
8160
+ | "hera"
8161
+ | "stella";
8162
+ /**
8163
+ * Encoding of the output audio.
8164
+ */
8165
+ encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
8166
+ /**
8167
+ * Container specifies the file format wrapper for the output audio. The available options depend on the encoding type.
8168
+ */
8169
+ container?: "none" | "wav" | "ogg";
8170
+ /**
8171
+ * The text content to be converted to speech
8172
+ */
8173
+ text: string;
8174
+ /**
8175
+ * Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable
8176
+ */
8177
+ sample_rate?: number;
8178
+ /**
8179
+ * The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type.
8180
+ */
8181
+ bit_rate?: number;
8182
+ }
8183
+ /**
8184
+ * The generated audio in MP3 format
8185
+ */
8186
+ type Ai_Cf_Deepgram_Aura_1_Output = string;
8187
+ declare abstract class Base_Ai_Cf_Deepgram_Aura_1 {
8188
+ inputs: Ai_Cf_Deepgram_Aura_1_Input;
8189
+ postProcessedOutputs: Ai_Cf_Deepgram_Aura_1_Output;
8190
+ }
8191
+ interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input {
8192
+ /**
8193
+ * Input text to translate. Can be a single string or a list of strings.
8194
+ */
8195
+ text: string | string[];
8196
+ /**
8197
+ * Target language to translate to
8198
+ */
8199
+ target_language:
8200
+ | "asm_Beng"
8201
+ | "awa_Deva"
8202
+ | "ben_Beng"
8203
+ | "bho_Deva"
8204
+ | "brx_Deva"
8205
+ | "doi_Deva"
8206
+ | "eng_Latn"
8207
+ | "gom_Deva"
8208
+ | "gon_Deva"
8209
+ | "guj_Gujr"
8210
+ | "hin_Deva"
8211
+ | "hne_Deva"
8212
+ | "kan_Knda"
8213
+ | "kas_Arab"
8214
+ | "kas_Deva"
8215
+ | "kha_Latn"
8216
+ | "lus_Latn"
8217
+ | "mag_Deva"
8218
+ | "mai_Deva"
8219
+ | "mal_Mlym"
8220
+ | "mar_Deva"
8221
+ | "mni_Beng"
8222
+ | "mni_Mtei"
8223
+ | "npi_Deva"
8224
+ | "ory_Orya"
8225
+ | "pan_Guru"
8226
+ | "san_Deva"
8227
+ | "sat_Olck"
8228
+ | "snd_Arab"
8229
+ | "snd_Deva"
8230
+ | "tam_Taml"
8231
+ | "tel_Telu"
8232
+ | "urd_Arab"
8233
+ | "unr_Deva";
8234
+ }
8235
+ interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output {
8236
+ /**
8237
+ * Translated texts
8238
+ */
8239
+ translations: string[];
8240
+ }
8241
+ declare abstract class Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B {
8242
+ inputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input;
8243
+ postProcessedOutputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output;
8244
+ }
8245
+ type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input =
8246
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt
8247
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages
8248
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch;
8249
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt {
8250
+ /**
8251
+ * The input text prompt for the model to generate a response.
8252
+ */
8253
+ prompt: string;
8254
+ /**
8255
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
8256
+ */
8257
+ lora?: string;
8258
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode;
8259
+ /**
8260
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
8261
+ */
8262
+ raw?: boolean;
8263
+ /**
8264
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
8265
+ */
8266
+ stream?: boolean;
8267
+ /**
8268
+ * The maximum number of tokens to generate in the response.
8269
+ */
8270
+ max_tokens?: number;
8271
+ /**
8272
+ * Controls the randomness of the output; higher values produce more random results.
8273
+ */
8274
+ temperature?: number;
8275
+ /**
8276
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
8277
+ */
8278
+ top_p?: number;
8279
+ /**
8280
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
8281
+ */
8282
+ top_k?: number;
8283
+ /**
8284
+ * Random seed for reproducibility of the generation.
8285
+ */
8286
+ seed?: number;
8287
+ /**
8288
+ * Penalty for repeated tokens; higher values discourage repetition.
8289
+ */
8290
+ repetition_penalty?: number;
8291
+ /**
8292
+ * Decreases the likelihood of the model repeating the same lines verbatim.
8293
+ */
8294
+ frequency_penalty?: number;
8295
+ /**
8296
+ * Increases the likelihood of the model introducing new topics.
8297
+ */
8298
+ presence_penalty?: number;
8299
+ }
8300
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode {
8301
+ type?: "json_object" | "json_schema";
8302
+ json_schema?: unknown;
8303
+ }
8304
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages {
8305
+ /**
8306
+ * An array of message objects representing the conversation history.
8307
+ */
8308
+ messages: {
8309
+ /**
8310
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
8311
+ */
8312
+ role: string;
8313
+ /**
8314
+ * The content of the message as a string.
8315
+ */
8316
+ content: string;
8317
+ }[];
8318
+ functions?: {
8319
+ name: string;
8320
+ code: string;
8321
+ }[];
8322
+ /**
8323
+ * A list of tools available for the assistant to use.
8324
+ */
8325
+ tools?: (
8326
+ | {
8327
+ /**
8328
+ * The name of the tool. More descriptive the better.
8329
+ */
8330
+ name: string;
8331
+ /**
8332
+ * A brief description of what the tool does.
8333
+ */
8334
+ description: string;
8335
+ /**
8336
+ * Schema defining the parameters accepted by the tool.
8337
+ */
8338
+ parameters: {
8339
+ /**
8340
+ * The type of the parameters object (usually 'object').
8341
+ */
8342
+ type: string;
8343
+ /**
8344
+ * List of required parameter names.
8345
+ */
8346
+ required?: string[];
8347
+ /**
8348
+ * Definitions of each parameter.
8349
+ */
8350
+ properties: {
8351
+ [k: string]: {
8352
+ /**
8353
+ * The data type of the parameter.
8354
+ */
8355
+ type: string;
8356
+ /**
8357
+ * A description of the expected parameter.
8358
+ */
8359
+ description: string;
8360
+ };
8361
+ };
8362
+ };
8363
+ }
8364
+ | {
8365
+ /**
8366
+ * Specifies the type of tool (e.g., 'function').
8367
+ */
8368
+ type: string;
8369
+ /**
8370
+ * Details of the function tool.
8371
+ */
8372
+ function: {
8373
+ /**
8374
+ * The name of the function.
8375
+ */
8376
+ name: string;
8377
+ /**
8378
+ * A brief description of what the function does.
8379
+ */
8380
+ description: string;
8381
+ /**
8382
+ * Schema defining the parameters accepted by the function.
8383
+ */
8384
+ parameters: {
8385
+ /**
8386
+ * The type of the parameters object (usually 'object').
8387
+ */
8388
+ type: string;
8389
+ /**
8390
+ * List of required parameter names.
8391
+ */
8392
+ required?: string[];
8393
+ /**
8394
+ * Definitions of each parameter.
8395
+ */
8396
+ properties: {
8397
+ [k: string]: {
8398
+ /**
8399
+ * The data type of the parameter.
8400
+ */
8401
+ type: string;
8402
+ /**
8403
+ * A description of the expected parameter.
8404
+ */
8405
+ description: string;
8406
+ };
8407
+ };
8408
+ };
8409
+ };
8410
+ }
8411
+ )[];
8412
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1;
8413
+ /**
8414
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
8415
+ */
8416
+ raw?: boolean;
8417
+ /**
8418
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
8419
+ */
8420
+ stream?: boolean;
8421
+ /**
8422
+ * The maximum number of tokens to generate in the response.
8423
+ */
8424
+ max_tokens?: number;
8425
+ /**
8426
+ * Controls the randomness of the output; higher values produce more random results.
8427
+ */
8428
+ temperature?: number;
8429
+ /**
8430
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
6840
8431
  */
6841
- punctuate?: boolean;
8432
+ top_p?: number;
6842
8433
  /**
6843
- * Redaction removes sensitive information from your transcripts.
8434
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
6844
8435
  */
6845
- redact?: string;
8436
+ top_k?: number;
6846
8437
  /**
6847
- * Search for terms or phrases in submitted audio and replaces them.
8438
+ * Random seed for reproducibility of the generation.
6848
8439
  */
6849
- replace?: string;
8440
+ seed?: number;
6850
8441
  /**
6851
- * Search for terms or phrases in submitted audio.
8442
+ * Penalty for repeated tokens; higher values discourage repetition.
6852
8443
  */
6853
- search?: string;
8444
+ repetition_penalty?: number;
6854
8445
  /**
6855
- * Recognizes the sentiment throughout a transcript or text.
8446
+ * Decreases the likelihood of the model repeating the same lines verbatim.
6856
8447
  */
6857
- sentiment?: boolean;
8448
+ frequency_penalty?: number;
6858
8449
  /**
6859
- * Apply formatting to transcript output. When set to true, additional formatting will be applied to transcripts to improve readability.
8450
+ * Increases the likelihood of the model introducing new topics.
6860
8451
  */
6861
- smart_format?: boolean;
8452
+ presence_penalty?: number;
8453
+ }
8454
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1 {
8455
+ type?: "json_object" | "json_schema";
8456
+ json_schema?: unknown;
8457
+ }
8458
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch {
8459
+ requests: (
8460
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1
8461
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1
8462
+ )[];
8463
+ }
8464
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1 {
6862
8465
  /**
6863
- * Detect topics throughout a transcript or text.
8466
+ * The input text prompt for the model to generate a response.
6864
8467
  */
6865
- topics?: boolean;
8468
+ prompt: string;
6866
8469
  /**
6867
- * Segments speech into meaningful semantic units.
8470
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
6868
8471
  */
6869
- utterances?: boolean;
8472
+ lora?: string;
8473
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2;
6870
8474
  /**
6871
- * Seconds to wait before detecting a pause between words in submitted audio.
8475
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6872
8476
  */
6873
- utt_split?: number;
8477
+ raw?: boolean;
6874
8478
  /**
6875
- * The number of channels in the submitted audio
8479
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
6876
8480
  */
6877
- channels?: number;
8481
+ stream?: boolean;
6878
8482
  /**
6879
- * Specifies whether the streaming endpoint should provide ongoing transcription updates as more audio is received. When set to true, the endpoint sends continuous updates, meaning transcription results may evolve over time. Note: Supported only for websockets.
8483
+ * The maximum number of tokens to generate in the response.
6880
8484
  */
6881
- interim_results?: boolean;
8485
+ max_tokens?: number;
6882
8486
  /**
6883
- * Indicates how long model will wait to detect whether a speaker has finished speaking or pauses for a significant period of time. When set to a value, the streaming endpoint immediately finalizes the transcription for the processed time range and returns the transcript with a speech_final parameter set to true. Can also be set to false to disable endpointing
8487
+ * Controls the randomness of the output; higher values produce more random results.
6884
8488
  */
6885
- endpointing?: string;
8489
+ temperature?: number;
6886
8490
  /**
6887
- * Indicates that speech has started. You'll begin receiving Speech Started messages upon speech starting. Note: Supported only for websockets.
8491
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
6888
8492
  */
6889
- vad_events?: boolean;
8493
+ top_p?: number;
6890
8494
  /**
6891
- * Indicates how long the model will wait to send an UtteranceEnd message after a word has been transcribed. Use with interim_results. Note: Supported only for websockets.
8495
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
6892
8496
  */
6893
- utterance_end_ms?: boolean;
8497
+ top_k?: number;
8498
+ /**
8499
+ * Random seed for reproducibility of the generation.
8500
+ */
8501
+ seed?: number;
8502
+ /**
8503
+ * Penalty for repeated tokens; higher values discourage repetition.
8504
+ */
8505
+ repetition_penalty?: number;
8506
+ /**
8507
+ * Decreases the likelihood of the model repeating the same lines verbatim.
8508
+ */
8509
+ frequency_penalty?: number;
8510
+ /**
8511
+ * Increases the likelihood of the model introducing new topics.
8512
+ */
8513
+ presence_penalty?: number;
6894
8514
  }
6895
- interface Ai_Cf_Deepgram_Nova_3_Output {
6896
- results?: {
6897
- channels?: {
6898
- alternatives?: {
6899
- confidence?: number;
6900
- transcript?: string;
6901
- words?: {
6902
- confidence?: number;
6903
- end?: number;
6904
- start?: number;
6905
- word?: string;
6906
- }[];
6907
- }[];
6908
- }[];
6909
- summary?: {
6910
- result?: string;
6911
- short?: string;
6912
- };
6913
- sentiments?: {
6914
- segments?: {
6915
- text?: string;
6916
- start_word?: number;
6917
- end_word?: number;
6918
- sentiment?: string;
6919
- sentiment_score?: number;
6920
- }[];
6921
- average?: {
6922
- sentiment?: string;
6923
- sentiment_score?: number;
6924
- };
6925
- };
6926
- };
8515
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2 {
8516
+ type?: "json_object" | "json_schema";
8517
+ json_schema?: unknown;
8518
+ }
8519
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1 {
8520
+ /**
8521
+ * An array of message objects representing the conversation history.
8522
+ */
8523
+ messages: {
8524
+ /**
8525
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
8526
+ */
8527
+ role: string;
8528
+ /**
8529
+ * The content of the message as a string.
8530
+ */
8531
+ content: string;
8532
+ }[];
8533
+ functions?: {
8534
+ name: string;
8535
+ code: string;
8536
+ }[];
8537
+ /**
8538
+ * A list of tools available for the assistant to use.
8539
+ */
8540
+ tools?: (
8541
+ | {
8542
+ /**
8543
+ * The name of the tool. More descriptive the better.
8544
+ */
8545
+ name: string;
8546
+ /**
8547
+ * A brief description of what the tool does.
8548
+ */
8549
+ description: string;
8550
+ /**
8551
+ * Schema defining the parameters accepted by the tool.
8552
+ */
8553
+ parameters: {
8554
+ /**
8555
+ * The type of the parameters object (usually 'object').
8556
+ */
8557
+ type: string;
8558
+ /**
8559
+ * List of required parameter names.
8560
+ */
8561
+ required?: string[];
8562
+ /**
8563
+ * Definitions of each parameter.
8564
+ */
8565
+ properties: {
8566
+ [k: string]: {
8567
+ /**
8568
+ * The data type of the parameter.
8569
+ */
8570
+ type: string;
8571
+ /**
8572
+ * A description of the expected parameter.
8573
+ */
8574
+ description: string;
8575
+ };
8576
+ };
8577
+ };
8578
+ }
8579
+ | {
8580
+ /**
8581
+ * Specifies the type of tool (e.g., 'function').
8582
+ */
8583
+ type: string;
8584
+ /**
8585
+ * Details of the function tool.
8586
+ */
8587
+ function: {
8588
+ /**
8589
+ * The name of the function.
8590
+ */
8591
+ name: string;
8592
+ /**
8593
+ * A brief description of what the function does.
8594
+ */
8595
+ description: string;
8596
+ /**
8597
+ * Schema defining the parameters accepted by the function.
8598
+ */
8599
+ parameters: {
8600
+ /**
8601
+ * The type of the parameters object (usually 'object').
8602
+ */
8603
+ type: string;
8604
+ /**
8605
+ * List of required parameter names.
8606
+ */
8607
+ required?: string[];
8608
+ /**
8609
+ * Definitions of each parameter.
8610
+ */
8611
+ properties: {
8612
+ [k: string]: {
8613
+ /**
8614
+ * The data type of the parameter.
8615
+ */
8616
+ type: string;
8617
+ /**
8618
+ * A description of the expected parameter.
8619
+ */
8620
+ description: string;
8621
+ };
8622
+ };
8623
+ };
8624
+ };
8625
+ }
8626
+ )[];
8627
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3;
8628
+ /**
8629
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
8630
+ */
8631
+ raw?: boolean;
8632
+ /**
8633
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
8634
+ */
8635
+ stream?: boolean;
8636
+ /**
8637
+ * The maximum number of tokens to generate in the response.
8638
+ */
8639
+ max_tokens?: number;
8640
+ /**
8641
+ * Controls the randomness of the output; higher values produce more random results.
8642
+ */
8643
+ temperature?: number;
8644
+ /**
8645
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
8646
+ */
8647
+ top_p?: number;
8648
+ /**
8649
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
8650
+ */
8651
+ top_k?: number;
8652
+ /**
8653
+ * Random seed for reproducibility of the generation.
8654
+ */
8655
+ seed?: number;
8656
+ /**
8657
+ * Penalty for repeated tokens; higher values discourage repetition.
8658
+ */
8659
+ repetition_penalty?: number;
8660
+ /**
8661
+ * Decreases the likelihood of the model repeating the same lines verbatim.
8662
+ */
8663
+ frequency_penalty?: number;
8664
+ /**
8665
+ * Increases the likelihood of the model introducing new topics.
8666
+ */
8667
+ presence_penalty?: number;
6927
8668
  }
6928
- declare abstract class Base_Ai_Cf_Deepgram_Nova_3 {
6929
- inputs: Ai_Cf_Deepgram_Nova_3_Input;
6930
- postProcessedOutputs: Ai_Cf_Deepgram_Nova_3_Output;
8669
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3 {
8670
+ type?: "json_object" | "json_schema";
8671
+ json_schema?: unknown;
6931
8672
  }
6932
- type Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input =
6933
- | {
8673
+ type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output =
8674
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response
8675
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response
8676
+ | string
8677
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse;
8678
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response {
8679
+ /**
8680
+ * Unique identifier for the completion
8681
+ */
8682
+ id?: string;
8683
+ /**
8684
+ * Object type identifier
8685
+ */
8686
+ object?: "chat.completion";
8687
+ /**
8688
+ * Unix timestamp of when the completion was created
8689
+ */
8690
+ created?: number;
8691
+ /**
8692
+ * Model used for the completion
8693
+ */
8694
+ model?: string;
8695
+ /**
8696
+ * List of completion choices
8697
+ */
8698
+ choices?: {
8699
+ /**
8700
+ * Index of the choice in the list
8701
+ */
8702
+ index?: number;
8703
+ /**
8704
+ * The message generated by the model
8705
+ */
8706
+ message?: {
6934
8707
  /**
6935
- * readable stream with audio data and content-type specified for that data
8708
+ * Role of the message author
6936
8709
  */
6937
- audio: {
6938
- body: object;
6939
- contentType: string;
6940
- };
8710
+ role: string;
6941
8711
  /**
6942
- * type of PCM data that's sent to the inference server as a raw array
8712
+ * The content of the message
6943
8713
  */
6944
- dtype?: "uint8" | "float32" | "float64";
6945
- }
6946
- | {
8714
+ content: string;
6947
8715
  /**
6948
- * base64 encoded audio data
8716
+ * Internal reasoning content (if available)
6949
8717
  */
6950
- audio: string;
8718
+ reasoning_content?: string;
6951
8719
  /**
6952
- * type of PCM data that's sent to the inference server as a raw array
8720
+ * Tool calls made by the assistant
6953
8721
  */
6954
- dtype?: "uint8" | "float32" | "float64";
8722
+ tool_calls?: {
8723
+ /**
8724
+ * Unique identifier for the tool call
8725
+ */
8726
+ id: string;
8727
+ /**
8728
+ * Type of tool call
8729
+ */
8730
+ type: "function";
8731
+ function: {
8732
+ /**
8733
+ * Name of the function to call
8734
+ */
8735
+ name: string;
8736
+ /**
8737
+ * JSON string of arguments for the function
8738
+ */
8739
+ arguments: string;
8740
+ };
8741
+ }[];
6955
8742
  };
6956
- interface Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output {
8743
+ /**
8744
+ * Reason why the model stopped generating
8745
+ */
8746
+ finish_reason?: string;
8747
+ /**
8748
+ * Stop reason (may be null)
8749
+ */
8750
+ stop_reason?: string | null;
8751
+ /**
8752
+ * Log probabilities (if requested)
8753
+ */
8754
+ logprobs?: {} | null;
8755
+ }[];
6957
8756
  /**
6958
- * if true, end-of-turn was detected
8757
+ * Usage statistics for the inference request
6959
8758
  */
6960
- is_complete?: boolean;
8759
+ usage?: {
8760
+ /**
8761
+ * Total number of tokens in input
8762
+ */
8763
+ prompt_tokens?: number;
8764
+ /**
8765
+ * Total number of tokens in output
8766
+ */
8767
+ completion_tokens?: number;
8768
+ /**
8769
+ * Total number of input and output tokens
8770
+ */
8771
+ total_tokens?: number;
8772
+ };
6961
8773
  /**
6962
- * probability of the end-of-turn detection
8774
+ * Log probabilities for the prompt (if requested)
6963
8775
  */
6964
- probability?: number;
6965
- }
6966
- declare abstract class Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2 {
6967
- inputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input;
6968
- postProcessedOutputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output;
8776
+ prompt_logprobs?: {} | null;
6969
8777
  }
6970
- type Ai_Cf_Openai_Gpt_Oss_120B_Input =
6971
- | GPT_OSS_120B_Responses
6972
- | GPT_OSS_120B_Responses_Async;
6973
- interface GPT_OSS_120B_Responses {
8778
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response {
8779
+ /**
8780
+ * Unique identifier for the completion
8781
+ */
8782
+ id?: string;
8783
+ /**
8784
+ * Object type identifier
8785
+ */
8786
+ object?: "text_completion";
8787
+ /**
8788
+ * Unix timestamp of when the completion was created
8789
+ */
8790
+ created?: number;
8791
+ /**
8792
+ * Model used for the completion
8793
+ */
8794
+ model?: string;
6974
8795
  /**
6975
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8796
+ * List of completion choices
6976
8797
  */
6977
- input: string | unknown[];
6978
- reasoning?: {
8798
+ choices?: {
6979
8799
  /**
6980
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
8800
+ * Index of the choice in the list
6981
8801
  */
6982
- effort?: "low" | "medium" | "high";
8802
+ index: number;
6983
8803
  /**
6984
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
8804
+ * The generated text completion
6985
8805
  */
6986
- summary?: "auto" | "concise" | "detailed";
6987
- };
6988
- }
6989
- interface GPT_OSS_120B_Responses_Async {
6990
- requests: {
8806
+ text: string;
6991
8807
  /**
6992
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8808
+ * Reason why the model stopped generating
6993
8809
  */
6994
- input: string | unknown[];
6995
- reasoning?: {
6996
- /**
6997
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
6998
- */
6999
- effort?: "low" | "medium" | "high";
7000
- /**
7001
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
7002
- */
7003
- summary?: "auto" | "concise" | "detailed";
7004
- };
8810
+ finish_reason: string;
8811
+ /**
8812
+ * Stop reason (may be null)
8813
+ */
8814
+ stop_reason?: string | null;
8815
+ /**
8816
+ * Log probabilities (if requested)
8817
+ */
8818
+ logprobs?: {} | null;
8819
+ /**
8820
+ * Log probabilities for the prompt (if requested)
8821
+ */
8822
+ prompt_logprobs?: {} | null;
7005
8823
  }[];
7006
- }
7007
- type Ai_Cf_Openai_Gpt_Oss_120B_Output = {} | (string & NonNullable<unknown>);
7008
- declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_120B {
7009
- inputs: Ai_Cf_Openai_Gpt_Oss_120B_Input;
7010
- postProcessedOutputs: Ai_Cf_Openai_Gpt_Oss_120B_Output;
7011
- }
7012
- type Ai_Cf_Openai_Gpt_Oss_20B_Input =
7013
- | GPT_OSS_20B_Responses
7014
- | GPT_OSS_20B_Responses_Async;
7015
- interface GPT_OSS_20B_Responses {
7016
8824
  /**
7017
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8825
+ * Usage statistics for the inference request
7018
8826
  */
7019
- input: string | unknown[];
7020
- reasoning?: {
8827
+ usage?: {
7021
8828
  /**
7022
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
8829
+ * Total number of tokens in input
7023
8830
  */
7024
- effort?: "low" | "medium" | "high";
8831
+ prompt_tokens?: number;
7025
8832
  /**
7026
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
8833
+ * Total number of tokens in output
7027
8834
  */
7028
- summary?: "auto" | "concise" | "detailed";
7029
- };
7030
- }
7031
- interface GPT_OSS_20B_Responses_Async {
7032
- requests: {
8835
+ completion_tokens?: number;
7033
8836
  /**
7034
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8837
+ * Total number of input and output tokens
7035
8838
  */
7036
- input: string | unknown[];
7037
- reasoning?: {
7038
- /**
7039
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
7040
- */
7041
- effort?: "low" | "medium" | "high";
7042
- /**
7043
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
7044
- */
7045
- summary?: "auto" | "concise" | "detailed";
7046
- };
7047
- }[];
8839
+ total_tokens?: number;
8840
+ };
7048
8841
  }
7049
- type Ai_Cf_Openai_Gpt_Oss_20B_Output = {} | (string & NonNullable<unknown>);
7050
- declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_20B {
7051
- inputs: Ai_Cf_Openai_Gpt_Oss_20B_Input;
7052
- postProcessedOutputs: Ai_Cf_Openai_Gpt_Oss_20B_Output;
8842
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse {
8843
+ /**
8844
+ * The async request id that can be used to obtain the results.
8845
+ */
8846
+ request_id?: string;
7053
8847
  }
7054
- interface Ai_Cf_Leonardo_Phoenix_1_0_Input {
8848
+ declare abstract class Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It {
8849
+ inputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input;
8850
+ postProcessedOutputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output;
8851
+ }
8852
+ interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Input {
7055
8853
  /**
7056
- * A text description of the image you want to generate.
8854
+ * Input text to embed. Can be a single string or a list of strings.
7057
8855
  */
7058
- prompt: string;
8856
+ text: string | string[];
8857
+ }
8858
+ interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Output {
7059
8859
  /**
7060
- * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
8860
+ * Embedding vectors, where each vector is a list of floats.
7061
8861
  */
7062
- guidance?: number;
8862
+ data: number[][];
7063
8863
  /**
7064
- * Random seed for reproducibility of the image generation
8864
+ * Shape of the embedding data as [number_of_embeddings, embedding_dimension].
8865
+ *
8866
+ * @minItems 2
8867
+ * @maxItems 2
7065
8868
  */
7066
- seed?: number;
8869
+ shape: [number, number];
8870
+ }
8871
+ declare abstract class Base_Ai_Cf_Pfnet_Plamo_Embedding_1B {
8872
+ inputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Input;
8873
+ postProcessedOutputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Output;
8874
+ }
8875
+ interface Ai_Cf_Deepgram_Flux_Input {
7067
8876
  /**
7068
- * The height of the generated image in pixels
8877
+ * Encoding of the audio stream. Currently only supports raw signed little-endian 16-bit PCM.
7069
8878
  */
7070
- height?: number;
8879
+ encoding: "linear16";
7071
8880
  /**
7072
- * The width of the generated image in pixels
8881
+ * Sample rate of the audio stream in Hz.
7073
8882
  */
7074
- width?: number;
8883
+ sample_rate: string;
7075
8884
  /**
7076
- * The number of diffusion steps; higher values can improve quality but take longer
8885
+ * End-of-turn confidence required to fire an eager end-of-turn event. When set, enables EagerEndOfTurn and TurnResumed events. Valid Values 0.3 - 0.9.
7077
8886
  */
7078
- num_steps?: number;
8887
+ eager_eot_threshold?: string;
7079
8888
  /**
7080
- * Specify what to exclude from the generated images
8889
+ * End-of-turn confidence required to finish a turn. Valid Values 0.5 - 0.9.
7081
8890
  */
7082
- negative_prompt?: string;
8891
+ eot_threshold?: string;
8892
+ /**
8893
+ * A turn will be finished when this much time has passed after speech, regardless of EOT confidence.
8894
+ */
8895
+ eot_timeout_ms?: string;
8896
+ /**
8897
+ * Keyterm prompting can improve recognition of specialized terminology. Pass multiple keyterm query parameters to boost multiple keyterms.
8898
+ */
8899
+ keyterm?: string;
8900
+ /**
8901
+ * Opts out requests from the Deepgram Model Improvement Program. Refer to Deepgram Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip
8902
+ */
8903
+ mip_opt_out?: "true" | "false";
8904
+ /**
8905
+ * Label your requests for the purpose of identification during usage reporting
8906
+ */
8907
+ tag?: string;
7083
8908
  }
7084
8909
  /**
7085
- * The generated image in JPEG format
8910
+ * Output will be returned as websocket messages.
7086
8911
  */
7087
- type Ai_Cf_Leonardo_Phoenix_1_0_Output = string;
7088
- declare abstract class Base_Ai_Cf_Leonardo_Phoenix_1_0 {
7089
- inputs: Ai_Cf_Leonardo_Phoenix_1_0_Input;
7090
- postProcessedOutputs: Ai_Cf_Leonardo_Phoenix_1_0_Output;
7091
- }
7092
- interface Ai_Cf_Leonardo_Lucid_Origin_Input {
8912
+ interface Ai_Cf_Deepgram_Flux_Output {
7093
8913
  /**
7094
- * A text description of the image you want to generate.
8914
+ * The unique identifier of the request (uuid)
7095
8915
  */
7096
- prompt: string;
8916
+ request_id?: string;
7097
8917
  /**
7098
- * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
8918
+ * Starts at 0 and increments for each message the server sends to the client.
7099
8919
  */
7100
- guidance?: number;
8920
+ sequence_id?: number;
7101
8921
  /**
7102
- * Random seed for reproducibility of the image generation
8922
+ * The type of event being reported.
7103
8923
  */
7104
- seed?: number;
8924
+ event?:
8925
+ | "Update"
8926
+ | "StartOfTurn"
8927
+ | "EagerEndOfTurn"
8928
+ | "TurnResumed"
8929
+ | "EndOfTurn";
7105
8930
  /**
7106
- * The height of the generated image in pixels
8931
+ * The index of the current turn
7107
8932
  */
7108
- height?: number;
8933
+ turn_index?: number;
7109
8934
  /**
7110
- * The width of the generated image in pixels
8935
+ * Start time in seconds of the audio range that was transcribed
7111
8936
  */
7112
- width?: number;
8937
+ audio_window_start?: number;
7113
8938
  /**
7114
- * The number of diffusion steps; higher values can improve quality but take longer
8939
+ * End time in seconds of the audio range that was transcribed
7115
8940
  */
7116
- num_steps?: number;
8941
+ audio_window_end?: number;
7117
8942
  /**
7118
- * The number of diffusion steps; higher values can improve quality but take longer
8943
+ * Text that was said over the course of the current turn
7119
8944
  */
7120
- steps?: number;
7121
- }
7122
- interface Ai_Cf_Leonardo_Lucid_Origin_Output {
8945
+ transcript?: string;
7123
8946
  /**
7124
- * The generated image in Base64 format.
8947
+ * The words in the transcript
7125
8948
  */
7126
- image?: string;
8949
+ words?: {
8950
+ /**
8951
+ * The individual punctuated, properly-cased word from the transcript
8952
+ */
8953
+ word: string;
8954
+ /**
8955
+ * Confidence that this word was transcribed correctly
8956
+ */
8957
+ confidence: number;
8958
+ }[];
8959
+ /**
8960
+ * Confidence that no more speech is coming in this turn
8961
+ */
8962
+ end_of_turn_confidence?: number;
7127
8963
  }
7128
- declare abstract class Base_Ai_Cf_Leonardo_Lucid_Origin {
7129
- inputs: Ai_Cf_Leonardo_Lucid_Origin_Input;
7130
- postProcessedOutputs: Ai_Cf_Leonardo_Lucid_Origin_Output;
8964
+ declare abstract class Base_Ai_Cf_Deepgram_Flux {
8965
+ inputs: Ai_Cf_Deepgram_Flux_Input;
8966
+ postProcessedOutputs: Ai_Cf_Deepgram_Flux_Output;
7131
8967
  }
7132
- interface Ai_Cf_Deepgram_Aura_1_Input {
8968
+ interface Ai_Cf_Deepgram_Aura_2_En_Input {
7133
8969
  /**
7134
8970
  * Speaker used to produce the audio.
7135
8971
  */
7136
8972
  speaker?:
7137
- | "angus"
7138
- | "asteria"
8973
+ | "amalthea"
8974
+ | "andromeda"
8975
+ | "apollo"
7139
8976
  | "arcas"
7140
- | "orion"
7141
- | "orpheus"
8977
+ | "aries"
8978
+ | "asteria"
7142
8979
  | "athena"
7143
- | "luna"
7144
- | "zeus"
7145
- | "perseus"
7146
- | "helios"
8980
+ | "atlas"
8981
+ | "aurora"
8982
+ | "callista"
8983
+ | "cora"
8984
+ | "cordelia"
8985
+ | "delia"
8986
+ | "draco"
8987
+ | "electra"
8988
+ | "harmonia"
8989
+ | "helena"
7147
8990
  | "hera"
7148
- | "stella";
8991
+ | "hermes"
8992
+ | "hyperion"
8993
+ | "iris"
8994
+ | "janus"
8995
+ | "juno"
8996
+ | "jupiter"
8997
+ | "luna"
8998
+ | "mars"
8999
+ | "minerva"
9000
+ | "neptune"
9001
+ | "odysseus"
9002
+ | "ophelia"
9003
+ | "orion"
9004
+ | "orpheus"
9005
+ | "pandora"
9006
+ | "phoebe"
9007
+ | "pluto"
9008
+ | "saturn"
9009
+ | "thalia"
9010
+ | "theia"
9011
+ | "vesta"
9012
+ | "zeus";
7149
9013
  /**
7150
9014
  * Encoding of the output audio.
7151
9015
  */
@@ -7170,10 +9034,54 @@ interface Ai_Cf_Deepgram_Aura_1_Input {
7170
9034
  /**
7171
9035
  * The generated audio in MP3 format
7172
9036
  */
7173
- type Ai_Cf_Deepgram_Aura_1_Output = string;
7174
- declare abstract class Base_Ai_Cf_Deepgram_Aura_1 {
7175
- inputs: Ai_Cf_Deepgram_Aura_1_Input;
7176
- postProcessedOutputs: Ai_Cf_Deepgram_Aura_1_Output;
9037
+ type Ai_Cf_Deepgram_Aura_2_En_Output = string;
9038
+ declare abstract class Base_Ai_Cf_Deepgram_Aura_2_En {
9039
+ inputs: Ai_Cf_Deepgram_Aura_2_En_Input;
9040
+ postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_En_Output;
9041
+ }
9042
+ interface Ai_Cf_Deepgram_Aura_2_Es_Input {
9043
+ /**
9044
+ * Speaker used to produce the audio.
9045
+ */
9046
+ speaker?:
9047
+ | "sirio"
9048
+ | "nestor"
9049
+ | "carina"
9050
+ | "celeste"
9051
+ | "alvaro"
9052
+ | "diana"
9053
+ | "aquila"
9054
+ | "selena"
9055
+ | "estrella"
9056
+ | "javier";
9057
+ /**
9058
+ * Encoding of the output audio.
9059
+ */
9060
+ encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
9061
+ /**
9062
+ * Container specifies the file format wrapper for the output audio. The available options depend on the encoding type.
9063
+ */
9064
+ container?: "none" | "wav" | "ogg";
9065
+ /**
9066
+ * The text content to be converted to speech
9067
+ */
9068
+ text: string;
9069
+ /**
9070
+ * Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable
9071
+ */
9072
+ sample_rate?: number;
9073
+ /**
9074
+ * The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type.
9075
+ */
9076
+ bit_rate?: number;
9077
+ }
9078
+ /**
9079
+ * The generated audio in MP3 format
9080
+ */
9081
+ type Ai_Cf_Deepgram_Aura_2_Es_Output = string;
9082
+ declare abstract class Base_Ai_Cf_Deepgram_Aura_2_Es {
9083
+ inputs: Ai_Cf_Deepgram_Aura_2_Es_Input;
9084
+ postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_Es_Output;
7177
9085
  }
7178
9086
  interface AiModels {
7179
9087
  "@cf/huggingface/distilbert-sst-2-int8": BaseAiTextClassification;
@@ -7218,12 +9126,12 @@ interface AiModels {
7218
9126
  "@cf/meta/llama-3-8b-instruct": BaseAiTextGeneration;
7219
9127
  "@cf/fblgit/una-cybertron-7b-v2-bf16": BaseAiTextGeneration;
7220
9128
  "@cf/meta/llama-3-8b-instruct-awq": BaseAiTextGeneration;
7221
- "@hf/meta-llama/meta-llama-3-8b-instruct": BaseAiTextGeneration;
7222
9129
  "@cf/meta/llama-3.1-8b-instruct-fp8": BaseAiTextGeneration;
7223
9130
  "@cf/meta/llama-3.1-8b-instruct-awq": BaseAiTextGeneration;
7224
9131
  "@cf/meta/llama-3.2-3b-instruct": BaseAiTextGeneration;
7225
9132
  "@cf/meta/llama-3.2-1b-instruct": BaseAiTextGeneration;
7226
9133
  "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b": BaseAiTextGeneration;
9134
+ "@cf/ibm-granite/granite-4.0-h-micro": BaseAiTextGeneration;
7227
9135
  "@cf/facebook/bart-large-cnn": BaseAiSummarization;
7228
9136
  "@cf/llava-hf/llava-1.5-7b-hf": BaseAiImageToText;
7229
9137
  "@cf/baai/bge-base-en-v1.5": Base_Ai_Cf_Baai_Bge_Base_En_V1_5;
@@ -7245,13 +9153,21 @@ interface AiModels {
7245
9153
  "@cf/mistralai/mistral-small-3.1-24b-instruct": Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct;
7246
9154
  "@cf/google/gemma-3-12b-it": Base_Ai_Cf_Google_Gemma_3_12B_It;
7247
9155
  "@cf/meta/llama-4-scout-17b-16e-instruct": Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct;
9156
+ "@cf/qwen/qwen3-30b-a3b-fp8": Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8;
7248
9157
  "@cf/deepgram/nova-3": Base_Ai_Cf_Deepgram_Nova_3;
9158
+ "@cf/qwen/qwen3-embedding-0.6b": Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B;
7249
9159
  "@cf/pipecat-ai/smart-turn-v2": Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2;
7250
9160
  "@cf/openai/gpt-oss-120b": Base_Ai_Cf_Openai_Gpt_Oss_120B;
7251
9161
  "@cf/openai/gpt-oss-20b": Base_Ai_Cf_Openai_Gpt_Oss_20B;
7252
9162
  "@cf/leonardo/phoenix-1.0": Base_Ai_Cf_Leonardo_Phoenix_1_0;
7253
9163
  "@cf/leonardo/lucid-origin": Base_Ai_Cf_Leonardo_Lucid_Origin;
7254
9164
  "@cf/deepgram/aura-1": Base_Ai_Cf_Deepgram_Aura_1;
9165
+ "@cf/ai4bharat/indictrans2-en-indic-1B": Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B;
9166
+ "@cf/aisingapore/gemma-sea-lion-v4-27b-it": Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It;
9167
+ "@cf/pfnet/plamo-embedding-1b": Base_Ai_Cf_Pfnet_Plamo_Embedding_1B;
9168
+ "@cf/deepgram/flux": Base_Ai_Cf_Deepgram_Flux;
9169
+ "@cf/deepgram/aura-2-en": Base_Ai_Cf_Deepgram_Aura_2_En;
9170
+ "@cf/deepgram/aura-2-es": Base_Ai_Cf_Deepgram_Aura_2_Es;
7255
9171
  }
7256
9172
  type AiOptions = {
7257
9173
  /**
@@ -7263,6 +9179,16 @@ type AiOptions = {
7263
9179
  * Establish websocket connections, only works for supported models
7264
9180
  */
7265
9181
  websocket?: boolean;
9182
+ /**
9183
+ * Tag your requests to group and view them in Cloudflare dashboard.
9184
+ *
9185
+ * Rules:
9186
+ * Tags must only contain letters, numbers, and the symbols: : - . / @
9187
+ * Each tag can have a maximum of 50 characters.
9188
+ * A maximum of 5 tags is allowed per request.
9189
+ * Duplicate tags will be removed.
9190
+ */
9191
+ tags: string[];
7266
9192
  gateway?: GatewayOptions;
7267
9193
  returnRawResponse?: boolean;
7268
9194
  prefix?: string;
@@ -9350,12 +11276,13 @@ declare namespace Rpc {
9350
11276
  export type Provider<
9351
11277
  T extends object,
9352
11278
  Reserved extends string = never,
9353
- > = MaybeCallableProvider<T> & {
9354
- [K in Exclude<
9355
- keyof T,
9356
- Reserved | symbol | keyof StubBase<never>
9357
- >]: MethodOrProperty<T[K]>;
9358
- };
11279
+ > = MaybeCallableProvider<T> &
11280
+ Pick<
11281
+ {
11282
+ [K in keyof T]: MethodOrProperty<T[K]>;
11283
+ },
11284
+ Exclude<keyof T, Reserved | symbol | keyof StubBase<never>>
11285
+ >;
9359
11286
  }
9360
11287
  declare namespace Cloudflare {
9361
11288
  // Type of `env`.