@workers-community/workers-types 4.20251120.0 → 4.20251125.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (3):
  1. package/index.d.ts +2289 -362
  2. package/index.ts +2289 -367
  3. package/package.json +1 -1
package/index.d.ts CHANGED
@@ -4109,6 +4109,427 @@ declare abstract class BaseAiTranslation {
4109
4109
  inputs: AiTranslationInput;
4110
4110
  postProcessedOutputs: AiTranslationOutput;
4111
4111
  }
4112
+ /**
4113
+ * Workers AI support for OpenAI's Responses API
4114
+ * Reference: https://github.com/openai/openai-node/blob/master/src/resources/responses/responses.ts
4115
+ *
4116
+ * It's a stripped down version from its source.
4117
+ * It currently supports basic function calling, json mode and accepts images as input.
4118
+ *
4119
+ * It does not include types for WebSearch, CodeInterpreter, FileInputs, MCP, CustomTools.
4120
+ * We plan to add those incrementally as model + platform capabilities evolve.
4121
+ */
4122
+ type ResponsesInput = {
4123
+ background?: boolean | null;
4124
+ conversation?: string | ResponseConversationParam | null;
4125
+ include?: Array<ResponseIncludable> | null;
4126
+ input?: string | ResponseInput;
4127
+ instructions?: string | null;
4128
+ max_output_tokens?: number | null;
4129
+ parallel_tool_calls?: boolean | null;
4130
+ previous_response_id?: string | null;
4131
+ prompt_cache_key?: string;
4132
+ reasoning?: Reasoning | null;
4133
+ safety_identifier?: string;
4134
+ service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
4135
+ stream?: boolean | null;
4136
+ stream_options?: StreamOptions | null;
4137
+ temperature?: number | null;
4138
+ text?: ResponseTextConfig;
4139
+ tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
4140
+ tools?: Array<Tool>;
4141
+ top_p?: number | null;
4142
+ truncation?: "auto" | "disabled" | null;
4143
+ };
4144
+ type ResponsesOutput = {
4145
+ id?: string;
4146
+ created_at?: number;
4147
+ output_text?: string;
4148
+ error?: ResponseError | null;
4149
+ incomplete_details?: ResponseIncompleteDetails | null;
4150
+ instructions?: string | Array<ResponseInputItem> | null;
4151
+ object?: "response";
4152
+ output?: Array<ResponseOutputItem>;
4153
+ parallel_tool_calls?: boolean;
4154
+ temperature?: number | null;
4155
+ tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
4156
+ tools?: Array<Tool>;
4157
+ top_p?: number | null;
4158
+ max_output_tokens?: number | null;
4159
+ previous_response_id?: string | null;
4160
+ prompt?: ResponsePrompt | null;
4161
+ reasoning?: Reasoning | null;
4162
+ safety_identifier?: string;
4163
+ service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
4164
+ status?: ResponseStatus;
4165
+ text?: ResponseTextConfig;
4166
+ truncation?: "auto" | "disabled" | null;
4167
+ usage?: ResponseUsage;
4168
+ };
4169
+ type EasyInputMessage = {
4170
+ content: string | ResponseInputMessageContentList;
4171
+ role: "user" | "assistant" | "system" | "developer";
4172
+ type?: "message";
4173
+ };
4174
+ type ResponsesFunctionTool = {
4175
+ name: string;
4176
+ parameters: {
4177
+ [key: string]: unknown;
4178
+ } | null;
4179
+ strict: boolean | null;
4180
+ type: "function";
4181
+ description?: string | null;
4182
+ };
4183
+ type ResponseIncompleteDetails = {
4184
+ reason?: "max_output_tokens" | "content_filter";
4185
+ };
4186
+ type ResponsePrompt = {
4187
+ id: string;
4188
+ variables?: {
4189
+ [key: string]: string | ResponseInputText | ResponseInputImage;
4190
+ } | null;
4191
+ version?: string | null;
4192
+ };
4193
+ type Reasoning = {
4194
+ effort?: ReasoningEffort | null;
4195
+ generate_summary?: "auto" | "concise" | "detailed" | null;
4196
+ summary?: "auto" | "concise" | "detailed" | null;
4197
+ };
4198
+ type ResponseContent =
4199
+ | ResponseInputText
4200
+ | ResponseInputImage
4201
+ | ResponseOutputText
4202
+ | ResponseOutputRefusal
4203
+ | ResponseContentReasoningText;
4204
+ type ResponseContentReasoningText = {
4205
+ text: string;
4206
+ type: "reasoning_text";
4207
+ };
4208
+ type ResponseConversationParam = {
4209
+ id: string;
4210
+ };
4211
+ type ResponseCreatedEvent = {
4212
+ response: Response;
4213
+ sequence_number: number;
4214
+ type: "response.created";
4215
+ };
4216
+ type ResponseCustomToolCallOutput = {
4217
+ call_id: string;
4218
+ output: string | Array<ResponseInputText | ResponseInputImage>;
4219
+ type: "custom_tool_call_output";
4220
+ id?: string;
4221
+ };
4222
+ type ResponseError = {
4223
+ code:
4224
+ | "server_error"
4225
+ | "rate_limit_exceeded"
4226
+ | "invalid_prompt"
4227
+ | "vector_store_timeout"
4228
+ | "invalid_image"
4229
+ | "invalid_image_format"
4230
+ | "invalid_base64_image"
4231
+ | "invalid_image_url"
4232
+ | "image_too_large"
4233
+ | "image_too_small"
4234
+ | "image_parse_error"
4235
+ | "image_content_policy_violation"
4236
+ | "invalid_image_mode"
4237
+ | "image_file_too_large"
4238
+ | "unsupported_image_media_type"
4239
+ | "empty_image_file"
4240
+ | "failed_to_download_image"
4241
+ | "image_file_not_found";
4242
+ message: string;
4243
+ };
4244
+ type ResponseErrorEvent = {
4245
+ code: string | null;
4246
+ message: string;
4247
+ param: string | null;
4248
+ sequence_number: number;
4249
+ type: "error";
4250
+ };
4251
+ type ResponseFailedEvent = {
4252
+ response: Response;
4253
+ sequence_number: number;
4254
+ type: "response.failed";
4255
+ };
4256
+ type ResponseFormatText = {
4257
+ type: "text";
4258
+ };
4259
+ type ResponseFormatJSONObject = {
4260
+ type: "json_object";
4261
+ };
4262
+ type ResponseFormatTextConfig =
4263
+ | ResponseFormatText
4264
+ | ResponseFormatTextJSONSchemaConfig
4265
+ | ResponseFormatJSONObject;
4266
+ type ResponseFormatTextJSONSchemaConfig = {
4267
+ name: string;
4268
+ schema: {
4269
+ [key: string]: unknown;
4270
+ };
4271
+ type: "json_schema";
4272
+ description?: string;
4273
+ strict?: boolean | null;
4274
+ };
4275
+ type ResponseFunctionCallArgumentsDeltaEvent = {
4276
+ delta: string;
4277
+ item_id: string;
4278
+ output_index: number;
4279
+ sequence_number: number;
4280
+ type: "response.function_call_arguments.delta";
4281
+ };
4282
+ type ResponseFunctionCallArgumentsDoneEvent = {
4283
+ arguments: string;
4284
+ item_id: string;
4285
+ name: string;
4286
+ output_index: number;
4287
+ sequence_number: number;
4288
+ type: "response.function_call_arguments.done";
4289
+ };
4290
+ type ResponseFunctionCallOutputItem =
4291
+ | ResponseInputTextContent
4292
+ | ResponseInputImageContent;
4293
+ type ResponseFunctionCallOutputItemList = Array<ResponseFunctionCallOutputItem>;
4294
+ type ResponseFunctionToolCall = {
4295
+ arguments: string;
4296
+ call_id: string;
4297
+ name: string;
4298
+ type: "function_call";
4299
+ id?: string;
4300
+ status?: "in_progress" | "completed" | "incomplete";
4301
+ };
4302
+ interface ResponseFunctionToolCallItem extends ResponseFunctionToolCall {
4303
+ id: string;
4304
+ }
4305
+ type ResponseFunctionToolCallOutputItem = {
4306
+ id: string;
4307
+ call_id: string;
4308
+ output: string | Array<ResponseInputText | ResponseInputImage>;
4309
+ type: "function_call_output";
4310
+ status?: "in_progress" | "completed" | "incomplete";
4311
+ };
4312
+ type ResponseIncludable =
4313
+ | "message.input_image.image_url"
4314
+ | "message.output_text.logprobs";
4315
+ type ResponseIncompleteEvent = {
4316
+ response: Response;
4317
+ sequence_number: number;
4318
+ type: "response.incomplete";
4319
+ };
4320
+ type ResponseInput = Array<ResponseInputItem>;
4321
+ type ResponseInputContent = ResponseInputText | ResponseInputImage;
4322
+ type ResponseInputImage = {
4323
+ detail: "low" | "high" | "auto";
4324
+ type: "input_image";
4325
+ /**
4326
+ * Base64 encoded image
4327
+ */
4328
+ image_url?: string | null;
4329
+ };
4330
+ type ResponseInputImageContent = {
4331
+ type: "input_image";
4332
+ detail?: "low" | "high" | "auto" | null;
4333
+ /**
4334
+ * Base64 encoded image
4335
+ */
4336
+ image_url?: string | null;
4337
+ };
4338
+ type ResponseInputItem =
4339
+ | EasyInputMessage
4340
+ | ResponseInputItemMessage
4341
+ | ResponseOutputMessage
4342
+ | ResponseFunctionToolCall
4343
+ | ResponseInputItemFunctionCallOutput
4344
+ | ResponseReasoningItem;
4345
+ type ResponseInputItemFunctionCallOutput = {
4346
+ call_id: string;
4347
+ output: string | ResponseFunctionCallOutputItemList;
4348
+ type: "function_call_output";
4349
+ id?: string | null;
4350
+ status?: "in_progress" | "completed" | "incomplete" | null;
4351
+ };
4352
+ type ResponseInputItemMessage = {
4353
+ content: ResponseInputMessageContentList;
4354
+ role: "user" | "system" | "developer";
4355
+ status?: "in_progress" | "completed" | "incomplete";
4356
+ type?: "message";
4357
+ };
4358
+ type ResponseInputMessageContentList = Array<ResponseInputContent>;
4359
+ type ResponseInputMessageItem = {
4360
+ id: string;
4361
+ content: ResponseInputMessageContentList;
4362
+ role: "user" | "system" | "developer";
4363
+ status?: "in_progress" | "completed" | "incomplete";
4364
+ type?: "message";
4365
+ };
4366
+ type ResponseInputText = {
4367
+ text: string;
4368
+ type: "input_text";
4369
+ };
4370
+ type ResponseInputTextContent = {
4371
+ text: string;
4372
+ type: "input_text";
4373
+ };
4374
+ type ResponseItem =
4375
+ | ResponseInputMessageItem
4376
+ | ResponseOutputMessage
4377
+ | ResponseFunctionToolCallItem
4378
+ | ResponseFunctionToolCallOutputItem;
4379
+ type ResponseOutputItem =
4380
+ | ResponseOutputMessage
4381
+ | ResponseFunctionToolCall
4382
+ | ResponseReasoningItem;
4383
+ type ResponseOutputItemAddedEvent = {
4384
+ item: ResponseOutputItem;
4385
+ output_index: number;
4386
+ sequence_number: number;
4387
+ type: "response.output_item.added";
4388
+ };
4389
+ type ResponseOutputItemDoneEvent = {
4390
+ item: ResponseOutputItem;
4391
+ output_index: number;
4392
+ sequence_number: number;
4393
+ type: "response.output_item.done";
4394
+ };
4395
+ type ResponseOutputMessage = {
4396
+ id: string;
4397
+ content: Array<ResponseOutputText | ResponseOutputRefusal>;
4398
+ role: "assistant";
4399
+ status: "in_progress" | "completed" | "incomplete";
4400
+ type: "message";
4401
+ };
4402
+ type ResponseOutputRefusal = {
4403
+ refusal: string;
4404
+ type: "refusal";
4405
+ };
4406
+ type ResponseOutputText = {
4407
+ text: string;
4408
+ type: "output_text";
4409
+ logprobs?: Array<Logprob>;
4410
+ };
4411
+ type ResponseReasoningItem = {
4412
+ id: string;
4413
+ summary: Array<ResponseReasoningSummaryItem>;
4414
+ type: "reasoning";
4415
+ content?: Array<ResponseReasoningContentItem>;
4416
+ encrypted_content?: string | null;
4417
+ status?: "in_progress" | "completed" | "incomplete";
4418
+ };
4419
+ type ResponseReasoningSummaryItem = {
4420
+ text: string;
4421
+ type: "summary_text";
4422
+ };
4423
+ type ResponseReasoningContentItem = {
4424
+ text: string;
4425
+ type: "reasoning_text";
4426
+ };
4427
+ type ResponseReasoningTextDeltaEvent = {
4428
+ content_index: number;
4429
+ delta: string;
4430
+ item_id: string;
4431
+ output_index: number;
4432
+ sequence_number: number;
4433
+ type: "response.reasoning_text.delta";
4434
+ };
4435
+ type ResponseReasoningTextDoneEvent = {
4436
+ content_index: number;
4437
+ item_id: string;
4438
+ output_index: number;
4439
+ sequence_number: number;
4440
+ text: string;
4441
+ type: "response.reasoning_text.done";
4442
+ };
4443
+ type ResponseRefusalDeltaEvent = {
4444
+ content_index: number;
4445
+ delta: string;
4446
+ item_id: string;
4447
+ output_index: number;
4448
+ sequence_number: number;
4449
+ type: "response.refusal.delta";
4450
+ };
4451
+ type ResponseRefusalDoneEvent = {
4452
+ content_index: number;
4453
+ item_id: string;
4454
+ output_index: number;
4455
+ refusal: string;
4456
+ sequence_number: number;
4457
+ type: "response.refusal.done";
4458
+ };
4459
+ type ResponseStatus =
4460
+ | "completed"
4461
+ | "failed"
4462
+ | "in_progress"
4463
+ | "cancelled"
4464
+ | "queued"
4465
+ | "incomplete";
4466
+ type ResponseStreamEvent =
4467
+ | ResponseCompletedEvent
4468
+ | ResponseCreatedEvent
4469
+ | ResponseErrorEvent
4470
+ | ResponseFunctionCallArgumentsDeltaEvent
4471
+ | ResponseFunctionCallArgumentsDoneEvent
4472
+ | ResponseFailedEvent
4473
+ | ResponseIncompleteEvent
4474
+ | ResponseOutputItemAddedEvent
4475
+ | ResponseOutputItemDoneEvent
4476
+ | ResponseReasoningTextDeltaEvent
4477
+ | ResponseReasoningTextDoneEvent
4478
+ | ResponseRefusalDeltaEvent
4479
+ | ResponseRefusalDoneEvent
4480
+ | ResponseTextDeltaEvent
4481
+ | ResponseTextDoneEvent;
4482
+ type ResponseCompletedEvent = {
4483
+ response: Response;
4484
+ sequence_number: number;
4485
+ type: "response.completed";
4486
+ };
4487
+ type ResponseTextConfig = {
4488
+ format?: ResponseFormatTextConfig;
4489
+ verbosity?: "low" | "medium" | "high" | null;
4490
+ };
4491
+ type ResponseTextDeltaEvent = {
4492
+ content_index: number;
4493
+ delta: string;
4494
+ item_id: string;
4495
+ logprobs: Array<Logprob>;
4496
+ output_index: number;
4497
+ sequence_number: number;
4498
+ type: "response.output_text.delta";
4499
+ };
4500
+ type ResponseTextDoneEvent = {
4501
+ content_index: number;
4502
+ item_id: string;
4503
+ logprobs: Array<Logprob>;
4504
+ output_index: number;
4505
+ sequence_number: number;
4506
+ text: string;
4507
+ type: "response.output_text.done";
4508
+ };
4509
+ type Logprob = {
4510
+ token: string;
4511
+ logprob: number;
4512
+ top_logprobs?: Array<TopLogprob>;
4513
+ };
4514
+ type TopLogprob = {
4515
+ token?: string;
4516
+ logprob?: number;
4517
+ };
4518
+ type ResponseUsage = {
4519
+ input_tokens: number;
4520
+ output_tokens: number;
4521
+ total_tokens: number;
4522
+ };
4523
+ type Tool = ResponsesFunctionTool;
4524
+ type ToolChoiceFunction = {
4525
+ name: string;
4526
+ type: "function";
4527
+ };
4528
+ type ToolChoiceOptions = "none";
4529
+ type ReasoningEffort = "minimal" | "low" | "medium" | "high" | null;
4530
+ type StreamOptions = {
4531
+ include_obfuscation?: boolean;
4532
+ };
4112
4533
  type Ai_Cf_Baai_Bge_Base_En_V1_5_Input =
4113
4534
  | {
4114
4535
  text: string | string[];
@@ -4141,8 +4562,8 @@ type Ai_Cf_Baai_Bge_Base_En_V1_5_Output =
4141
4562
  */
4142
4563
  pooling?: "mean" | "cls";
4143
4564
  }
4144
- | AsyncResponse;
4145
- interface AsyncResponse {
4565
+ | Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse;
4566
+ interface Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse {
4146
4567
  /**
4147
4568
  * The async request id that can be used to obtain the results.
4148
4569
  */
@@ -4224,7 +4645,13 @@ type Ai_Cf_Meta_M2M100_1_2B_Output =
4224
4645
  */
4225
4646
  translated_text?: string;
4226
4647
  }
4227
- | AsyncResponse;
4648
+ | Ai_Cf_Meta_M2M100_1_2B_AsyncResponse;
4649
+ interface Ai_Cf_Meta_M2M100_1_2B_AsyncResponse {
4650
+ /**
4651
+ * The async request id that can be used to obtain the results.
4652
+ */
4653
+ request_id?: string;
4654
+ }
4228
4655
  declare abstract class Base_Ai_Cf_Meta_M2M100_1_2B {
4229
4656
  inputs: Ai_Cf_Meta_M2M100_1_2B_Input;
4230
4657
  postProcessedOutputs: Ai_Cf_Meta_M2M100_1_2B_Output;
@@ -4261,7 +4688,13 @@ type Ai_Cf_Baai_Bge_Small_En_V1_5_Output =
4261
4688
  */
4262
4689
  pooling?: "mean" | "cls";
4263
4690
  }
4264
- | AsyncResponse;
4691
+ | Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse;
4692
+ interface Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse {
4693
+ /**
4694
+ * The async request id that can be used to obtain the results.
4695
+ */
4696
+ request_id?: string;
4697
+ }
4265
4698
  declare abstract class Base_Ai_Cf_Baai_Bge_Small_En_V1_5 {
4266
4699
  inputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Input;
4267
4700
  postProcessedOutputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Output;
@@ -4298,7 +4731,13 @@ type Ai_Cf_Baai_Bge_Large_En_V1_5_Output =
4298
4731
  */
4299
4732
  pooling?: "mean" | "cls";
4300
4733
  }
4301
- | AsyncResponse;
4734
+ | Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse;
4735
+ interface Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse {
4736
+ /**
4737
+ * The async request id that can be used to obtain the results.
4738
+ */
4739
+ request_id?: string;
4740
+ }
4302
4741
  declare abstract class Base_Ai_Cf_Baai_Bge_Large_En_V1_5 {
4303
4742
  inputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Input;
4304
4743
  postProcessedOutputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Output;
@@ -4489,15 +4928,18 @@ declare abstract class Base_Ai_Cf_Openai_Whisper_Large_V3_Turbo {
4489
4928
  postProcessedOutputs: Ai_Cf_Openai_Whisper_Large_V3_Turbo_Output;
4490
4929
  }
4491
4930
  type Ai_Cf_Baai_Bge_M3_Input =
4492
- | BGEM3InputQueryAndContexts
4493
- | BGEM3InputEmbedding
4931
+ | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts
4932
+ | Ai_Cf_Baai_Bge_M3_Input_Embedding
4494
4933
  | {
4495
4934
  /**
4496
4935
  * Batch of the embeddings requests to run using async-queue
4497
4936
  */
4498
- requests: (BGEM3InputQueryAndContexts1 | BGEM3InputEmbedding1)[];
4937
+ requests: (
4938
+ | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1
4939
+ | Ai_Cf_Baai_Bge_M3_Input_Embedding_1
4940
+ )[];
4499
4941
  };
4500
- interface BGEM3InputQueryAndContexts {
4942
+ interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts {
4501
4943
  /**
4502
4944
  * A query you wish to perform against the provided contexts. If no query is provided the model with respond with embeddings for contexts
4503
4945
  */
@@ -4516,14 +4958,14 @@ interface BGEM3InputQueryAndContexts {
4516
4958
  */
4517
4959
  truncate_inputs?: boolean;
4518
4960
  }
4519
- interface BGEM3InputEmbedding {
4961
+ interface Ai_Cf_Baai_Bge_M3_Input_Embedding {
4520
4962
  text: string | string[];
4521
4963
  /**
4522
4964
  * When provided with too long context should the model error out or truncate the context to fit?
4523
4965
  */
4524
4966
  truncate_inputs?: boolean;
4525
4967
  }
4526
- interface BGEM3InputQueryAndContexts1 {
4968
+ interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1 {
4527
4969
  /**
4528
4970
  * A query you wish to perform against the provided contexts. If no query is provided the model with respond with embeddings for contexts
4529
4971
  */
@@ -4542,7 +4984,7 @@ interface BGEM3InputQueryAndContexts1 {
4542
4984
  */
4543
4985
  truncate_inputs?: boolean;
4544
4986
  }
4545
- interface BGEM3InputEmbedding1 {
4987
+ interface Ai_Cf_Baai_Bge_M3_Input_Embedding_1 {
4546
4988
  text: string | string[];
4547
4989
  /**
4548
4990
  * When provided with too long context should the model error out or truncate the context to fit?
@@ -4550,11 +4992,11 @@ interface BGEM3InputEmbedding1 {
4550
4992
  truncate_inputs?: boolean;
4551
4993
  }
4552
4994
  type Ai_Cf_Baai_Bge_M3_Output =
4553
- | BGEM3OuputQuery
4554
- | BGEM3OutputEmbeddingForContexts
4555
- | BGEM3OuputEmbedding
4556
- | AsyncResponse;
4557
- interface BGEM3OuputQuery {
4995
+ | Ai_Cf_Baai_Bge_M3_Ouput_Query
4996
+ | Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts
4997
+ | Ai_Cf_Baai_Bge_M3_Ouput_Embedding
4998
+ | Ai_Cf_Baai_Bge_M3_AsyncResponse;
4999
+ interface Ai_Cf_Baai_Bge_M3_Ouput_Query {
4558
5000
  response?: {
4559
5001
  /**
4560
5002
  * Index of the context in the request
@@ -4566,7 +5008,7 @@ interface BGEM3OuputQuery {
4566
5008
  score?: number;
4567
5009
  }[];
4568
5010
  }
4569
- interface BGEM3OutputEmbeddingForContexts {
5011
+ interface Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts {
4570
5012
  response?: number[][];
4571
5013
  shape?: number[];
4572
5014
  /**
@@ -4574,7 +5016,7 @@ interface BGEM3OutputEmbeddingForContexts {
4574
5016
  */
4575
5017
  pooling?: "mean" | "cls";
4576
5018
  }
4577
- interface BGEM3OuputEmbedding {
5019
+ interface Ai_Cf_Baai_Bge_M3_Ouput_Embedding {
4578
5020
  shape?: number[];
4579
5021
  /**
4580
5022
  * Embeddings of the requested text values
@@ -4585,6 +5027,12 @@ interface BGEM3OuputEmbedding {
4585
5027
  */
4586
5028
  pooling?: "mean" | "cls";
4587
5029
  }
5030
+ interface Ai_Cf_Baai_Bge_M3_AsyncResponse {
5031
+ /**
5032
+ * The async request id that can be used to obtain the results.
5033
+ */
5034
+ request_id?: string;
5035
+ }
4588
5036
  declare abstract class Base_Ai_Cf_Baai_Bge_M3 {
4589
5037
  inputs: Ai_Cf_Baai_Bge_M3_Input;
4590
5038
  postProcessedOutputs: Ai_Cf_Baai_Bge_M3_Output;
@@ -4609,8 +5057,10 @@ declare abstract class Base_Ai_Cf_Black_Forest_Labs_Flux_1_Schnell {
4609
5057
  inputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Input;
4610
5058
  postProcessedOutputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Output;
4611
5059
  }
4612
- type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input = Prompt | Messages;
4613
- interface Prompt {
5060
+ type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input =
5061
+ | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt
5062
+ | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages;
5063
+ interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt {
4614
5064
  /**
4615
5065
  * The input text prompt for the model to generate a response.
4616
5066
  */
@@ -4661,7 +5111,7 @@ interface Prompt {
4661
5111
  */
4662
5112
  lora?: string;
4663
5113
  }
4664
- interface Messages {
5114
+ interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages {
4665
5115
  /**
4666
5116
  * An array of message objects representing the conversation history.
4667
5117
  */
@@ -4859,10 +5309,10 @@ declare abstract class Base_Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct {
4859
5309
  postProcessedOutputs: Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Output;
4860
5310
  }
4861
5311
  type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input =
4862
- | Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt
4863
- | Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages
4864
- | AsyncBatch;
4865
- interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
5312
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt
5313
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages
5314
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch;
5315
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
4866
5316
  /**
4867
5317
  * The input text prompt for the model to generate a response.
4868
5318
  */
@@ -4871,7 +5321,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
4871
5321
  * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
4872
5322
  */
4873
5323
  lora?: string;
4874
- response_format?: JSONMode;
5324
+ response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode;
4875
5325
  /**
4876
5326
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
4877
5327
  */
@@ -4913,11 +5363,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
4913
5363
  */
4914
5364
  presence_penalty?: number;
4915
5365
  }
4916
- interface JSONMode {
5366
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode {
4917
5367
  type?: "json_object" | "json_schema";
4918
5368
  json_schema?: unknown;
4919
5369
  }
4920
- interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
5370
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
4921
5371
  /**
4922
5372
  * An array of message objects representing the conversation history.
4923
5373
  */
@@ -5025,7 +5475,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
5025
5475
  };
5026
5476
  }
5027
5477
  )[];
5028
- response_format?: JSONMode;
5478
+ response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1;
5029
5479
  /**
5030
5480
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
5031
5481
  */
@@ -5067,7 +5517,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
5067
5517
  */
5068
5518
  presence_penalty?: number;
5069
5519
  }
5070
- interface AsyncBatch {
5520
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1 {
5521
+ type?: "json_object" | "json_schema";
5522
+ json_schema?: unknown;
5523
+ }
5524
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch {
5071
5525
  requests?: {
5072
5526
  /**
5073
5527
  * User-supplied reference. This field will be present in the response as well it can be used to reference the request and response. It's NOT validated to be unique.
@@ -5109,9 +5563,13 @@ interface AsyncBatch {
5109
5563
  * Increases the likelihood of the model introducing new topics.
5110
5564
  */
5111
5565
  presence_penalty?: number;
5112
- response_format?: JSONMode;
5566
+ response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2;
5113
5567
  }[];
5114
5568
  }
5569
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2 {
5570
+ type?: "json_object" | "json_schema";
5571
+ json_schema?: unknown;
5572
+ }
5115
5573
  type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
5116
5574
  | {
5117
5575
  /**
@@ -5150,7 +5608,13 @@ type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
5150
5608
  }[];
5151
5609
  }
5152
5610
  | string
5153
- | AsyncResponse;
5611
+ | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse;
5612
+ interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse {
5613
+ /**
5614
+ * The async request id that can be used to obtain the results.
5615
+ */
5616
+ request_id?: string;
5617
+ }
5154
5618
  declare abstract class Base_Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast {
5155
5619
  inputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input;
5156
5620
  postProcessedOutputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output;
@@ -5257,9 +5721,9 @@ declare abstract class Base_Ai_Cf_Baai_Bge_Reranker_Base {
5257
5721
  postProcessedOutputs: Ai_Cf_Baai_Bge_Reranker_Base_Output;
5258
5722
  }
5259
5723
  type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input =
5260
- | Qwen2_5_Coder_32B_Instruct_Prompt
5261
- | Qwen2_5_Coder_32B_Instruct_Messages;
5262
- interface Qwen2_5_Coder_32B_Instruct_Prompt {
5724
+ | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt
5725
+ | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages;
5726
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt {
5263
5727
  /**
5264
5728
  * The input text prompt for the model to generate a response.
5265
5729
  */
@@ -5268,7 +5732,7 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
5268
5732
  * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
5269
5733
  */
5270
5734
  lora?: string;
5271
- response_format?: JSONMode;
5735
+ response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode;
5272
5736
  /**
5273
5737
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
5274
5738
  */
@@ -5310,7 +5774,11 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
5310
5774
  */
5311
5775
  presence_penalty?: number;
5312
5776
  }
5313
- interface Qwen2_5_Coder_32B_Instruct_Messages {
5777
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode {
5778
+ type?: "json_object" | "json_schema";
5779
+ json_schema?: unknown;
5780
+ }
5781
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages {
5314
5782
  /**
5315
5783
  * An array of message objects representing the conversation history.
5316
5784
  */
@@ -5418,7 +5886,7 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
5418
5886
  };
5419
5887
  }
5420
5888
  )[];
5421
- response_format?: JSONMode;
5889
+ response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1;
5422
5890
  /**
5423
5891
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
5424
5892
  */
@@ -5460,6 +5928,10 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
5460
5928
  */
5461
5929
  presence_penalty?: number;
5462
5930
  }
5931
+ interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1 {
5932
+ type?: "json_object" | "json_schema";
5933
+ json_schema?: unknown;
5934
+ }
5463
5935
  type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output = {
5464
5936
  /**
5465
5937
  * The generated text response from the model
@@ -5500,8 +5972,10 @@ declare abstract class Base_Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct {
5500
5972
  inputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input;
5501
5973
  postProcessedOutputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output;
5502
5974
  }
5503
- type Ai_Cf_Qwen_Qwq_32B_Input = Qwen_Qwq_32B_Prompt | Qwen_Qwq_32B_Messages;
5504
- interface Qwen_Qwq_32B_Prompt {
5975
+ type Ai_Cf_Qwen_Qwq_32B_Input =
5976
+ | Ai_Cf_Qwen_Qwq_32B_Prompt
5977
+ | Ai_Cf_Qwen_Qwq_32B_Messages;
5978
+ interface Ai_Cf_Qwen_Qwq_32B_Prompt {
5505
5979
  /**
5506
5980
  * The input text prompt for the model to generate a response.
5507
5981
  */
@@ -5551,7 +6025,7 @@ interface Qwen_Qwq_32B_Prompt {
5551
6025
  */
5552
6026
  presence_penalty?: number;
5553
6027
  }
5554
- interface Qwen_Qwq_32B_Messages {
6028
+ interface Ai_Cf_Qwen_Qwq_32B_Messages {
5555
6029
  /**
5556
6030
  * An array of message objects representing the conversation history.
5557
6031
  */
@@ -5773,9 +6247,9 @@ declare abstract class Base_Ai_Cf_Qwen_Qwq_32B {
5773
6247
  postProcessedOutputs: Ai_Cf_Qwen_Qwq_32B_Output;
5774
6248
  }
5775
6249
  type Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Input =
5776
- | Mistral_Small_3_1_24B_Instruct_Prompt
5777
- | Mistral_Small_3_1_24B_Instruct_Messages;
5778
- interface Mistral_Small_3_1_24B_Instruct_Prompt {
6250
+ | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt
6251
+ | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages;
6252
+ interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt {
5779
6253
  /**
5780
6254
  * The input text prompt for the model to generate a response.
5781
6255
  */
@@ -5825,7 +6299,7 @@ interface Mistral_Small_3_1_24B_Instruct_Prompt {
5825
6299
  */
5826
6300
  presence_penalty?: number;
5827
6301
  }
5828
- interface Mistral_Small_3_1_24B_Instruct_Messages {
6302
+ interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages {
5829
6303
  /**
5830
6304
  * An array of message objects representing the conversation history.
5831
6305
  */
@@ -6047,9 +6521,9 @@ declare abstract class Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct {
6047
6521
  postProcessedOutputs: Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Output;
6048
6522
  }
6049
6523
  type Ai_Cf_Google_Gemma_3_12B_It_Input =
6050
- | Google_Gemma_3_12B_It_Prompt
6051
- | Google_Gemma_3_12B_It_Messages;
6052
- interface Google_Gemma_3_12B_It_Prompt {
6524
+ | Ai_Cf_Google_Gemma_3_12B_It_Prompt
6525
+ | Ai_Cf_Google_Gemma_3_12B_It_Messages;
6526
+ interface Ai_Cf_Google_Gemma_3_12B_It_Prompt {
6053
6527
  /**
6054
6528
  * The input text prompt for the model to generate a response.
6055
6529
  */
@@ -6099,7 +6573,7 @@ interface Google_Gemma_3_12B_It_Prompt {
6099
6573
  */
6100
6574
  presence_penalty?: number;
6101
6575
  }
6102
- interface Google_Gemma_3_12B_It_Messages {
6576
+ interface Ai_Cf_Google_Gemma_3_12B_It_Messages {
6103
6577
  /**
6104
6578
  * An array of message objects representing the conversation history.
6105
6579
  */
@@ -6122,20 +6596,7 @@ interface Google_Gemma_3_12B_It_Messages {
6122
6596
  */
6123
6597
  url?: string;
6124
6598
  };
6125
- }[]
6126
- | {
6127
- /**
6128
- * Type of the content provided
6129
- */
6130
- type?: string;
6131
- text?: string;
6132
- image_url?: {
6133
- /**
6134
- * image uri with data (e.g. ...). HTTP URL will not be accepted
6135
- */
6136
- url?: string;
6137
- };
6138
- };
6599
+ }[];
6139
6600
  }[];
6140
6601
  functions?: {
6141
6602
  name: string;
@@ -6317,10 +6778,10 @@ declare abstract class Base_Ai_Cf_Google_Gemma_3_12B_It {
6317
6778
  postProcessedOutputs: Ai_Cf_Google_Gemma_3_12B_It_Output;
6318
6779
  }
6319
6780
  type Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input =
6320
- | Ai_Cf_Meta_Llama_4_Prompt
6321
- | Ai_Cf_Meta_Llama_4_Messages
6322
- | Ai_Cf_Meta_Llama_4_Async_Batch;
6323
- interface Ai_Cf_Meta_Llama_4_Prompt {
6781
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt
6782
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages
6783
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch;
6784
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt {
6324
6785
  /**
6325
6786
  * The input text prompt for the model to generate a response.
6326
6787
  */
@@ -6329,7 +6790,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
6329
6790
  * JSON schema that should be fulfilled for the response.
6330
6791
  */
6331
6792
  guided_json?: object;
6332
- response_format?: JSONMode;
6793
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6333
6794
  /**
6334
6795
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6335
6796
  */
@@ -6371,7 +6832,11 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
6371
6832
  */
6372
6833
  presence_penalty?: number;
6373
6834
  }
6374
- interface Ai_Cf_Meta_Llama_4_Messages {
6835
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode {
6836
+ type?: "json_object" | "json_schema";
6837
+ json_schema?: unknown;
6838
+ }
6839
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages {
6375
6840
  /**
6376
6841
  * An array of message objects representing the conversation history.
6377
6842
  */
@@ -6507,7 +6972,7 @@ interface Ai_Cf_Meta_Llama_4_Messages {
6507
6972
  };
6508
6973
  }
6509
6974
  )[];
6510
- response_format?: JSONMode;
6975
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6511
6976
  /**
6512
6977
  * JSON schema that should be fulfilled for the response.
6513
6978
  */
@@ -6553,13 +7018,13 @@ interface Ai_Cf_Meta_Llama_4_Messages {
6553
7018
  */
6554
7019
  presence_penalty?: number;
6555
7020
  }
6556
- interface Ai_Cf_Meta_Llama_4_Async_Batch {
7021
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch {
6557
7022
  requests: (
6558
- | Ai_Cf_Meta_Llama_4_Prompt_Inner
6559
- | Ai_Cf_Meta_Llama_4_Messages_Inner
7023
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner
7024
+ | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner
6560
7025
  )[];
6561
7026
  }
6562
- interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
7027
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner {
6563
7028
  /**
6564
7029
  * The input text prompt for the model to generate a response.
6565
7030
  */
@@ -6568,7 +7033,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
6568
7033
  * JSON schema that should be fulfilled for the response.
6569
7034
  */
6570
7035
  guided_json?: object;
6571
- response_format?: JSONMode;
7036
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6572
7037
  /**
6573
7038
  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6574
7039
  */
@@ -6610,7 +7075,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
6610
7075
  */
6611
7076
  presence_penalty?: number;
6612
7077
  }
6613
- interface Ai_Cf_Meta_Llama_4_Messages_Inner {
7078
+ interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner {
6614
7079
  /**
6615
7080
  * An array of message objects representing the conversation history.
6616
7081
  */
@@ -6746,7 +7211,7 @@ interface Ai_Cf_Meta_Llama_4_Messages_Inner {
6746
7211
  };
6747
7212
  }
6748
7213
  )[];
6749
- response_format?: JSONMode;
7214
+ response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
6750
7215
  /**
6751
7216
  * JSON schema that should be fulfilled for the response.
6752
7217
  */
@@ -6845,414 +7310,1813 @@ declare abstract class Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct {
6845
7310
  inputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input;
6846
7311
  postProcessedOutputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Output;
6847
7312
  }
6848
- interface Ai_Cf_Deepgram_Nova_3_Input {
6849
- audio: {
6850
- body: object;
6851
- contentType: string;
6852
- };
6853
- /**
6854
- * Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param.
6855
- */
6856
- custom_topic_mode?: "extended" | "strict";
6857
- /**
6858
- * Custom topics you want the model to detect within your input audio or text if present Submit up to 100
6859
- */
6860
- custom_topic?: string;
6861
- /**
6862
- * Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition to those submitted using the custom_intent param.
6863
- */
6864
- custom_intent_mode?: "extended" | "strict";
6865
- /**
6866
- * Custom intents you want the model to detect within your input audio if present
6867
- */
6868
- custom_intent?: string;
6869
- /**
6870
- * Identifies and extracts key entities from content in submitted audio
6871
- */
6872
- detect_entities?: boolean;
6873
- /**
6874
- * Identifies the dominant language spoken in submitted audio
6875
- */
6876
- detect_language?: boolean;
6877
- /**
6878
- * Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0
6879
- */
6880
- diarize?: boolean;
7313
+ type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input =
7314
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt
7315
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages
7316
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch;
7317
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt {
6881
7318
  /**
6882
- * Identify and extract key entities from content in submitted audio
7319
+ * The input text prompt for the model to generate a response.
6883
7320
  */
6884
- dictation?: boolean;
7321
+ prompt: string;
6885
7322
  /**
6886
- * Specify the expected encoding of your submitted audio
7323
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
6887
7324
  */
6888
- encoding?:
6889
- | "linear16"
6890
- | "flac"
6891
- | "mulaw"
6892
- | "amr-nb"
6893
- | "amr-wb"
6894
- | "opus"
6895
- | "speex"
6896
- | "g729";
7325
+ lora?: string;
7326
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode;
6897
7327
  /**
6898
- * Arbitrary key-value pairs that are attached to the API response for usage in downstream processing
7328
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6899
7329
  */
6900
- extra?: string;
7330
+ raw?: boolean;
6901
7331
  /**
6902
- * Filler Words can help transcribe interruptions in your audio, like 'uh' and 'um'
7332
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
6903
7333
  */
6904
- filler_words?: boolean;
7334
+ stream?: boolean;
6905
7335
  /**
6906
- * Key term prompting can boost or suppress specialized terminology and brands.
7336
+ * The maximum number of tokens to generate in the response.
6907
7337
  */
6908
- keyterm?: string;
7338
+ max_tokens?: number;
6909
7339
  /**
6910
- * Keywords can boost or suppress specialized terminology and brands.
7340
+ * Controls the randomness of the output; higher values produce more random results.
6911
7341
  */
6912
- keywords?: string;
7342
+ temperature?: number;
6913
7343
  /**
6914
- * The BCP-47 language tag that hints at the primary spoken language. Depending on the Model and API endpoint you choose only certain languages are available.
7344
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
6915
7345
  */
6916
- language?: string;
7346
+ top_p?: number;
6917
7347
  /**
6918
- * Spoken measurements will be converted to their corresponding abbreviations.
7348
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
6919
7349
  */
6920
- measurements?: boolean;
7350
+ top_k?: number;
6921
7351
  /**
6922
- * Opts out requests from the Deepgram Model Improvement Program. Refer to our Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip.
7352
+ * Random seed for reproducibility of the generation.
6923
7353
  */
6924
- mip_opt_out?: boolean;
7354
+ seed?: number;
6925
7355
  /**
6926
- * Mode of operation for the model representing broad area of topic that will be talked about in the supplied audio
7356
+ * Penalty for repeated tokens; higher values discourage repetition.
6927
7357
  */
6928
- mode?: "general" | "medical" | "finance";
7358
+ repetition_penalty?: number;
6929
7359
  /**
6930
- * Transcribe each audio channel independently.
7360
+ * Decreases the likelihood of the model repeating the same lines verbatim.
6931
7361
  */
6932
- multichannel?: boolean;
7362
+ frequency_penalty?: number;
6933
7363
  /**
6934
- * Numerals converts numbers from written format to numerical format.
7364
+ * Increases the likelihood of the model introducing new topics.
6935
7365
  */
6936
- numerals?: boolean;
7366
+ presence_penalty?: number;
7367
+ }
7368
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode {
7369
+ type?: "json_object" | "json_schema";
7370
+ json_schema?: unknown;
7371
+ }
7372
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages {
6937
7373
  /**
6938
- * Splits audio into paragraphs to improve transcript readability.
7374
+ * An array of message objects representing the conversation history.
6939
7375
  */
6940
- paragraphs?: boolean;
7376
+ messages: {
7377
+ /**
7378
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
7379
+ */
7380
+ role: string;
7381
+ /**
7382
+ * The content of the message as a string.
7383
+ */
7384
+ content: string;
7385
+ }[];
7386
+ functions?: {
7387
+ name: string;
7388
+ code: string;
7389
+ }[];
6941
7390
  /**
6942
- * Profanity Filter looks for recognized profanity and converts it to the nearest recognized non-profane word or removes it from the transcript completely.
7391
+ * A list of tools available for the assistant to use.
7392
+ */
7393
+ tools?: (
7394
+ | {
7395
+ /**
7396
+ * The name of the tool. More descriptive the better.
7397
+ */
7398
+ name: string;
7399
+ /**
7400
+ * A brief description of what the tool does.
7401
+ */
7402
+ description: string;
7403
+ /**
7404
+ * Schema defining the parameters accepted by the tool.
7405
+ */
7406
+ parameters: {
7407
+ /**
7408
+ * The type of the parameters object (usually 'object').
7409
+ */
7410
+ type: string;
7411
+ /**
7412
+ * List of required parameter names.
7413
+ */
7414
+ required?: string[];
7415
+ /**
7416
+ * Definitions of each parameter.
7417
+ */
7418
+ properties: {
7419
+ [k: string]: {
7420
+ /**
7421
+ * The data type of the parameter.
7422
+ */
7423
+ type: string;
7424
+ /**
7425
+ * A description of the expected parameter.
7426
+ */
7427
+ description: string;
7428
+ };
7429
+ };
7430
+ };
7431
+ }
7432
+ | {
7433
+ /**
7434
+ * Specifies the type of tool (e.g., 'function').
7435
+ */
7436
+ type: string;
7437
+ /**
7438
+ * Details of the function tool.
7439
+ */
7440
+ function: {
7441
+ /**
7442
+ * The name of the function.
7443
+ */
7444
+ name: string;
7445
+ /**
7446
+ * A brief description of what the function does.
7447
+ */
7448
+ description: string;
7449
+ /**
7450
+ * Schema defining the parameters accepted by the function.
7451
+ */
7452
+ parameters: {
7453
+ /**
7454
+ * The type of the parameters object (usually 'object').
7455
+ */
7456
+ type: string;
7457
+ /**
7458
+ * List of required parameter names.
7459
+ */
7460
+ required?: string[];
7461
+ /**
7462
+ * Definitions of each parameter.
7463
+ */
7464
+ properties: {
7465
+ [k: string]: {
7466
+ /**
7467
+ * The data type of the parameter.
7468
+ */
7469
+ type: string;
7470
+ /**
7471
+ * A description of the expected parameter.
7472
+ */
7473
+ description: string;
7474
+ };
7475
+ };
7476
+ };
7477
+ };
7478
+ }
7479
+ )[];
7480
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1;
7481
+ /**
7482
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
7483
+ */
7484
+ raw?: boolean;
7485
+ /**
7486
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
7487
+ */
7488
+ stream?: boolean;
7489
+ /**
7490
+ * The maximum number of tokens to generate in the response.
7491
+ */
7492
+ max_tokens?: number;
7493
+ /**
7494
+ * Controls the randomness of the output; higher values produce more random results.
7495
+ */
7496
+ temperature?: number;
7497
+ /**
7498
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
7499
+ */
7500
+ top_p?: number;
7501
+ /**
7502
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
7503
+ */
7504
+ top_k?: number;
7505
+ /**
7506
+ * Random seed for reproducibility of the generation.
7507
+ */
7508
+ seed?: number;
7509
+ /**
7510
+ * Penalty for repeated tokens; higher values discourage repetition.
7511
+ */
7512
+ repetition_penalty?: number;
7513
+ /**
7514
+ * Decreases the likelihood of the model repeating the same lines verbatim.
7515
+ */
7516
+ frequency_penalty?: number;
7517
+ /**
7518
+ * Increases the likelihood of the model introducing new topics.
7519
+ */
7520
+ presence_penalty?: number;
7521
+ }
7522
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1 {
7523
+ type?: "json_object" | "json_schema";
7524
+ json_schema?: unknown;
7525
+ }
7526
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch {
7527
+ requests: (
7528
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1
7529
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1
7530
+ )[];
7531
+ }
7532
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1 {
7533
+ /**
7534
+ * The input text prompt for the model to generate a response.
7535
+ */
7536
+ prompt: string;
7537
+ /**
7538
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
7539
+ */
7540
+ lora?: string;
7541
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2;
7542
+ /**
7543
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
7544
+ */
7545
+ raw?: boolean;
7546
+ /**
7547
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
7548
+ */
7549
+ stream?: boolean;
7550
+ /**
7551
+ * The maximum number of tokens to generate in the response.
7552
+ */
7553
+ max_tokens?: number;
7554
+ /**
7555
+ * Controls the randomness of the output; higher values produce more random results.
7556
+ */
7557
+ temperature?: number;
7558
+ /**
7559
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
7560
+ */
7561
+ top_p?: number;
7562
+ /**
7563
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
7564
+ */
7565
+ top_k?: number;
7566
+ /**
7567
+ * Random seed for reproducibility of the generation.
7568
+ */
7569
+ seed?: number;
7570
+ /**
7571
+ * Penalty for repeated tokens; higher values discourage repetition.
7572
+ */
7573
+ repetition_penalty?: number;
7574
+ /**
7575
+ * Decreases the likelihood of the model repeating the same lines verbatim.
7576
+ */
7577
+ frequency_penalty?: number;
7578
+ /**
7579
+ * Increases the likelihood of the model introducing new topics.
7580
+ */
7581
+ presence_penalty?: number;
7582
+ }
7583
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2 {
7584
+ type?: "json_object" | "json_schema";
7585
+ json_schema?: unknown;
7586
+ }
7587
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1 {
7588
+ /**
7589
+ * An array of message objects representing the conversation history.
7590
+ */
7591
+ messages: {
7592
+ /**
7593
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
7594
+ */
7595
+ role: string;
7596
+ /**
7597
+ * The content of the message as a string.
7598
+ */
7599
+ content: string;
7600
+ }[];
7601
+ functions?: {
7602
+ name: string;
7603
+ code: string;
7604
+ }[];
7605
+ /**
7606
+ * A list of tools available for the assistant to use.
7607
+ */
7608
+ tools?: (
7609
+ | {
7610
+ /**
7611
+ * The name of the tool. More descriptive the better.
7612
+ */
7613
+ name: string;
7614
+ /**
7615
+ * A brief description of what the tool does.
7616
+ */
7617
+ description: string;
7618
+ /**
7619
+ * Schema defining the parameters accepted by the tool.
7620
+ */
7621
+ parameters: {
7622
+ /**
7623
+ * The type of the parameters object (usually 'object').
7624
+ */
7625
+ type: string;
7626
+ /**
7627
+ * List of required parameter names.
7628
+ */
7629
+ required?: string[];
7630
+ /**
7631
+ * Definitions of each parameter.
7632
+ */
7633
+ properties: {
7634
+ [k: string]: {
7635
+ /**
7636
+ * The data type of the parameter.
7637
+ */
7638
+ type: string;
7639
+ /**
7640
+ * A description of the expected parameter.
7641
+ */
7642
+ description: string;
7643
+ };
7644
+ };
7645
+ };
7646
+ }
7647
+ | {
7648
+ /**
7649
+ * Specifies the type of tool (e.g., 'function').
7650
+ */
7651
+ type: string;
7652
+ /**
7653
+ * Details of the function tool.
7654
+ */
7655
+ function: {
7656
+ /**
7657
+ * The name of the function.
7658
+ */
7659
+ name: string;
7660
+ /**
7661
+ * A brief description of what the function does.
7662
+ */
7663
+ description: string;
7664
+ /**
7665
+ * Schema defining the parameters accepted by the function.
7666
+ */
7667
+ parameters: {
7668
+ /**
7669
+ * The type of the parameters object (usually 'object').
7670
+ */
7671
+ type: string;
7672
+ /**
7673
+ * List of required parameter names.
7674
+ */
7675
+ required?: string[];
7676
+ /**
7677
+ * Definitions of each parameter.
7678
+ */
7679
+ properties: {
7680
+ [k: string]: {
7681
+ /**
7682
+ * The data type of the parameter.
7683
+ */
7684
+ type: string;
7685
+ /**
7686
+ * A description of the expected parameter.
7687
+ */
7688
+ description: string;
7689
+ };
7690
+ };
7691
+ };
7692
+ };
7693
+ }
7694
+ )[];
7695
+ response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3;
7696
+ /**
7697
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
7698
+ */
7699
+ raw?: boolean;
7700
+ /**
7701
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
7702
+ */
7703
+ stream?: boolean;
7704
+ /**
7705
+ * The maximum number of tokens to generate in the response.
7706
+ */
7707
+ max_tokens?: number;
7708
+ /**
7709
+ * Controls the randomness of the output; higher values produce more random results.
7710
+ */
7711
+ temperature?: number;
7712
+ /**
7713
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
7714
+ */
7715
+ top_p?: number;
7716
+ /**
7717
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
7718
+ */
7719
+ top_k?: number;
7720
+ /**
7721
+ * Random seed for reproducibility of the generation.
7722
+ */
7723
+ seed?: number;
7724
+ /**
7725
+ * Penalty for repeated tokens; higher values discourage repetition.
7726
+ */
7727
+ repetition_penalty?: number;
7728
+ /**
7729
+ * Decreases the likelihood of the model repeating the same lines verbatim.
7730
+ */
7731
+ frequency_penalty?: number;
7732
+ /**
7733
+ * Increases the likelihood of the model introducing new topics.
7734
+ */
7735
+ presence_penalty?: number;
7736
+ }
7737
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3 {
7738
+ type?: "json_object" | "json_schema";
7739
+ json_schema?: unknown;
7740
+ }
7741
+ type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output =
7742
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response
7743
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response
7744
+ | string
7745
+ | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse;
7746
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response {
7747
+ /**
7748
+ * Unique identifier for the completion
7749
+ */
7750
+ id?: string;
7751
+ /**
7752
+ * Object type identifier
7753
+ */
7754
+ object?: "chat.completion";
7755
+ /**
7756
+ * Unix timestamp of when the completion was created
7757
+ */
7758
+ created?: number;
7759
+ /**
7760
+ * Model used for the completion
7761
+ */
7762
+ model?: string;
7763
+ /**
7764
+ * List of completion choices
7765
+ */
7766
+ choices?: {
7767
+ /**
7768
+ * Index of the choice in the list
7769
+ */
7770
+ index?: number;
7771
+ /**
7772
+ * The message generated by the model
7773
+ */
7774
+ message?: {
7775
+ /**
7776
+ * Role of the message author
7777
+ */
7778
+ role: string;
7779
+ /**
7780
+ * The content of the message
7781
+ */
7782
+ content: string;
7783
+ /**
7784
+ * Internal reasoning content (if available)
7785
+ */
7786
+ reasoning_content?: string;
7787
+ /**
7788
+ * Tool calls made by the assistant
7789
+ */
7790
+ tool_calls?: {
7791
+ /**
7792
+ * Unique identifier for the tool call
7793
+ */
7794
+ id: string;
7795
+ /**
7796
+ * Type of tool call
7797
+ */
7798
+ type: "function";
7799
+ function: {
7800
+ /**
7801
+ * Name of the function to call
7802
+ */
7803
+ name: string;
7804
+ /**
7805
+ * JSON string of arguments for the function
7806
+ */
7807
+ arguments: string;
7808
+ };
7809
+ }[];
7810
+ };
7811
+ /**
7812
+ * Reason why the model stopped generating
7813
+ */
7814
+ finish_reason?: string;
7815
+ /**
7816
+ * Stop reason (may be null)
7817
+ */
7818
+ stop_reason?: string | null;
7819
+ /**
7820
+ * Log probabilities (if requested)
7821
+ */
7822
+ logprobs?: {} | null;
7823
+ }[];
7824
+ /**
7825
+ * Usage statistics for the inference request
7826
+ */
7827
+ usage?: {
7828
+ /**
7829
+ * Total number of tokens in input
7830
+ */
7831
+ prompt_tokens?: number;
7832
+ /**
7833
+ * Total number of tokens in output
7834
+ */
7835
+ completion_tokens?: number;
7836
+ /**
7837
+ * Total number of input and output tokens
7838
+ */
7839
+ total_tokens?: number;
7840
+ };
7841
+ /**
7842
+ * Log probabilities for the prompt (if requested)
7843
+ */
7844
+ prompt_logprobs?: {} | null;
7845
+ }
7846
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response {
7847
+ /**
7848
+ * Unique identifier for the completion
7849
+ */
7850
+ id?: string;
7851
+ /**
7852
+ * Object type identifier
7853
+ */
7854
+ object?: "text_completion";
7855
+ /**
7856
+ * Unix timestamp of when the completion was created
7857
+ */
7858
+ created?: number;
7859
+ /**
7860
+ * Model used for the completion
7861
+ */
7862
+ model?: string;
7863
+ /**
7864
+ * List of completion choices
7865
+ */
7866
+ choices?: {
7867
+ /**
7868
+ * Index of the choice in the list
7869
+ */
7870
+ index: number;
7871
+ /**
7872
+ * The generated text completion
7873
+ */
7874
+ text: string;
7875
+ /**
7876
+ * Reason why the model stopped generating
7877
+ */
7878
+ finish_reason: string;
7879
+ /**
7880
+ * Stop reason (may be null)
7881
+ */
7882
+ stop_reason?: string | null;
7883
+ /**
7884
+ * Log probabilities (if requested)
7885
+ */
7886
+ logprobs?: {} | null;
7887
+ /**
7888
+ * Log probabilities for the prompt (if requested)
7889
+ */
7890
+ prompt_logprobs?: {} | null;
7891
+ }[];
7892
+ /**
7893
+ * Usage statistics for the inference request
7894
+ */
7895
+ usage?: {
7896
+ /**
7897
+ * Total number of tokens in input
7898
+ */
7899
+ prompt_tokens?: number;
7900
+ /**
7901
+ * Total number of tokens in output
7902
+ */
7903
+ completion_tokens?: number;
7904
+ /**
7905
+ * Total number of input and output tokens
7906
+ */
7907
+ total_tokens?: number;
7908
+ };
7909
+ }
7910
+ interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse {
7911
+ /**
7912
+ * The async request id that can be used to obtain the results.
7913
+ */
7914
+ request_id?: string;
7915
+ }
7916
+ declare abstract class Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8 {
7917
+ inputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input;
7918
+ postProcessedOutputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output;
7919
+ }
7920
+ interface Ai_Cf_Deepgram_Nova_3_Input {
7921
+ audio: {
7922
+ body: object;
7923
+ contentType: string;
7924
+ };
7925
+ /**
7926
+ * Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param.
7927
+ */
7928
+ custom_topic_mode?: "extended" | "strict";
7929
+ /**
7930
+ * Custom topics you want the model to detect within your input audio or text if present Submit up to 100
7931
+ */
7932
+ custom_topic?: string;
7933
+ /**
7934
+ * Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition to those submitted using the custom_intent param.
7935
+ */
7936
+ custom_intent_mode?: "extended" | "strict";
7937
+ /**
7938
+ * Custom intents you want the model to detect within your input audio if present
7939
+ */
7940
+ custom_intent?: string;
7941
+ /**
7942
+ * Identifies and extracts key entities from content in submitted audio
7943
+ */
7944
+ detect_entities?: boolean;
7945
+ /**
7946
+ * Identifies the dominant language spoken in submitted audio
7947
+ */
7948
+ detect_language?: boolean;
7949
+ /**
7950
+ * Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0
7951
+ */
7952
+ diarize?: boolean;
7953
+ /**
7954
+ * Identify and extract key entities from content in submitted audio
7955
+ */
7956
+ dictation?: boolean;
7957
+ /**
7958
+ * Specify the expected encoding of your submitted audio
7959
+ */
7960
+ encoding?:
7961
+ | "linear16"
7962
+ | "flac"
7963
+ | "mulaw"
7964
+ | "amr-nb"
7965
+ | "amr-wb"
7966
+ | "opus"
7967
+ | "speex"
7968
+ | "g729";
7969
+ /**
7970
+ * Arbitrary key-value pairs that are attached to the API response for usage in downstream processing
7971
+ */
7972
+ extra?: string;
7973
+ /**
7974
+ * Filler Words can help transcribe interruptions in your audio, like 'uh' and 'um'
7975
+ */
7976
+ filler_words?: boolean;
7977
+ /**
7978
+ * Key term prompting can boost or suppress specialized terminology and brands.
7979
+ */
7980
+ keyterm?: string;
7981
+ /**
7982
+ * Keywords can boost or suppress specialized terminology and brands.
7983
+ */
7984
+ keywords?: string;
7985
+ /**
7986
+ * The BCP-47 language tag that hints at the primary spoken language. Depending on the Model and API endpoint you choose only certain languages are available.
7987
+ */
7988
+ language?: string;
7989
+ /**
7990
+ * Spoken measurements will be converted to their corresponding abbreviations.
7991
+ */
7992
+ measurements?: boolean;
7993
+ /**
7994
+ * Opts out requests from the Deepgram Model Improvement Program. Refer to our Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip.
7995
+ */
7996
+ mip_opt_out?: boolean;
7997
+ /**
7998
+ * Mode of operation for the model representing broad area of topic that will be talked about in the supplied audio
7999
+ */
8000
+ mode?: "general" | "medical" | "finance";
8001
+ /**
8002
+ * Transcribe each audio channel independently.
8003
+ */
8004
+ multichannel?: boolean;
8005
+ /**
8006
+ * Numerals converts numbers from written format to numerical format.
8007
+ */
8008
+ numerals?: boolean;
8009
+ /**
8010
+ * Splits audio into paragraphs to improve transcript readability.
8011
+ */
8012
+ paragraphs?: boolean;
8013
+ /**
8014
+ * Profanity Filter looks for recognized profanity and converts it to the nearest recognized non-profane word or removes it from the transcript completely.
6943
8015
  */
6944
8016
  profanity_filter?: boolean;
6945
8017
  /**
6946
- * Add punctuation and capitalization to the transcript.
8018
+ * Add punctuation and capitalization to the transcript.
8019
+ */
8020
+ punctuate?: boolean;
8021
+ /**
8022
+ * Redaction removes sensitive information from your transcripts.
8023
+ */
8024
+ redact?: string;
8025
+ /**
8026
+ * Search for terms or phrases in submitted audio and replaces them.
8027
+ */
8028
+ replace?: string;
8029
+ /**
8030
+ * Search for terms or phrases in submitted audio.
8031
+ */
8032
+ search?: string;
8033
+ /**
8034
+ * Recognizes the sentiment throughout a transcript or text.
8035
+ */
8036
+ sentiment?: boolean;
8037
+ /**
8038
+ * Apply formatting to transcript output. When set to true, additional formatting will be applied to transcripts to improve readability.
8039
+ */
8040
+ smart_format?: boolean;
8041
+ /**
8042
+ * Detect topics throughout a transcript or text.
8043
+ */
8044
+ topics?: boolean;
8045
+ /**
8046
+ * Segments speech into meaningful semantic units.
8047
+ */
8048
+ utterances?: boolean;
8049
+ /**
8050
+ * Seconds to wait before detecting a pause between words in submitted audio.
8051
+ */
8052
+ utt_split?: number;
8053
+ /**
8054
+ * The number of channels in the submitted audio
8055
+ */
8056
+ channels?: number;
8057
+ /**
8058
+ * Specifies whether the streaming endpoint should provide ongoing transcription updates as more audio is received. When set to true, the endpoint sends continuous updates, meaning transcription results may evolve over time. Note: Supported only for websockets.
8059
+ */
8060
+ interim_results?: boolean;
8061
+ /**
8062
+ * Indicates how long model will wait to detect whether a speaker has finished speaking or pauses for a significant period of time. When set to a value, the streaming endpoint immediately finalizes the transcription for the processed time range and returns the transcript with a speech_final parameter set to true. Can also be set to false to disable endpointing
8063
+ */
8064
+ endpointing?: string;
8065
+ /**
8066
+ * Indicates that speech has started. You'll begin receiving Speech Started messages upon speech starting. Note: Supported only for websockets.
8067
+ */
8068
+ vad_events?: boolean;
8069
+ /**
8070
+ * Indicates how long the model will wait to send an UtteranceEnd message after a word has been transcribed. Use with interim_results. Note: Supported only for websockets.
8071
+ */
8072
+ utterance_end_ms?: boolean;
8073
+ }
8074
+ interface Ai_Cf_Deepgram_Nova_3_Output {
8075
+ results?: {
8076
+ channels?: {
8077
+ alternatives?: {
8078
+ confidence?: number;
8079
+ transcript?: string;
8080
+ words?: {
8081
+ confidence?: number;
8082
+ end?: number;
8083
+ start?: number;
8084
+ word?: string;
8085
+ }[];
8086
+ }[];
8087
+ }[];
8088
+ summary?: {
8089
+ result?: string;
8090
+ short?: string;
8091
+ };
8092
+ sentiments?: {
8093
+ segments?: {
8094
+ text?: string;
8095
+ start_word?: number;
8096
+ end_word?: number;
8097
+ sentiment?: string;
8098
+ sentiment_score?: number;
8099
+ }[];
8100
+ average?: {
8101
+ sentiment?: string;
8102
+ sentiment_score?: number;
8103
+ };
8104
+ };
8105
+ };
8106
+ }
8107
+ declare abstract class Base_Ai_Cf_Deepgram_Nova_3 {
8108
+ inputs: Ai_Cf_Deepgram_Nova_3_Input;
8109
+ postProcessedOutputs: Ai_Cf_Deepgram_Nova_3_Output;
8110
+ }
8111
+ interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input {
8112
+ queries?: string | string[];
8113
+ /**
8114
+ * Optional instruction for the task
8115
+ */
8116
+ instruction?: string;
8117
+ documents?: string | string[];
8118
+ text?: string | string[];
8119
+ }
8120
+ interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output {
8121
+ data?: number[][];
8122
+ shape?: number[];
8123
+ }
8124
+ declare abstract class Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B {
8125
+ inputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input;
8126
+ postProcessedOutputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output;
8127
+ }
8128
+ type Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input =
8129
+ | {
8130
+ /**
8131
+ * readable stream with audio data and content-type specified for that data
8132
+ */
8133
+ audio: {
8134
+ body: object;
8135
+ contentType: string;
8136
+ };
8137
+ /**
8138
+ * data type of the PCM data that's sent to the inference server as a raw array
8139
+ */
8140
+ dtype?: "uint8" | "float32" | "float64";
8141
+ }
8142
+ | {
8143
+ /**
8144
+ * base64 encoded audio data
8145
+ */
8146
+ audio: string;
8147
+ /**
8148
+ * data type of the PCM data that's sent to the inference server as a raw array
8149
+ */
8150
+ dtype?: "uint8" | "float32" | "float64";
8151
+ };
8152
+ interface Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output {
8153
+ /**
8154
+ * if true, end-of-turn was detected
8155
+ */
8156
+ is_complete?: boolean;
8157
+ /**
8158
+ * probability of the end-of-turn detection
8159
+ */
8160
+ probability?: number;
8161
+ }
8162
+ declare abstract class Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2 {
8163
+ inputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input;
8164
+ postProcessedOutputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output;
8165
+ }
8166
+ declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_120B {
8167
+ inputs: ResponsesInput;
8168
+ postProcessedOutputs: ResponsesOutput;
8169
+ }
8170
+ declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_20B {
8171
+ inputs: ResponsesInput;
8172
+ postProcessedOutputs: ResponsesOutput;
8173
+ }
8174
+ interface Ai_Cf_Leonardo_Phoenix_1_0_Input {
8175
+ /**
8176
+ * A text description of the image you want to generate.
8177
+ */
8178
+ prompt: string;
8179
+ /**
8180
+ * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
8181
+ */
8182
+ guidance?: number;
8183
+ /**
8184
+ * Random seed for reproducibility of the image generation
8185
+ */
8186
+ seed?: number;
8187
+ /**
8188
+ * The height of the generated image in pixels
8189
+ */
8190
+ height?: number;
8191
+ /**
8192
+ * The width of the generated image in pixels
8193
+ */
8194
+ width?: number;
8195
+ /**
8196
+ * The number of diffusion steps; higher values can improve quality but take longer
8197
+ */
8198
+ num_steps?: number;
8199
+ /**
8200
+ * Specify what to exclude from the generated images
8201
+ */
8202
+ negative_prompt?: string;
8203
+ }
8204
+ /**
8205
+ * The generated image in JPEG format
8206
+ */
8207
+ type Ai_Cf_Leonardo_Phoenix_1_0_Output = string;
8208
+ declare abstract class Base_Ai_Cf_Leonardo_Phoenix_1_0 {
8209
+ inputs: Ai_Cf_Leonardo_Phoenix_1_0_Input;
8210
+ postProcessedOutputs: Ai_Cf_Leonardo_Phoenix_1_0_Output;
8211
+ }
8212
+ interface Ai_Cf_Leonardo_Lucid_Origin_Input {
8213
+ /**
8214
+ * A text description of the image you want to generate.
8215
+ */
8216
+ prompt: string;
8217
+ /**
8218
+ * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
8219
+ */
8220
+ guidance?: number;
8221
+ /**
8222
+ * Random seed for reproducibility of the image generation
8223
+ */
8224
+ seed?: number;
8225
+ /**
8226
+ * The height of the generated image in pixels
8227
+ */
8228
+ height?: number;
8229
+ /**
8230
+ * The width of the generated image in pixels
8231
+ */
8232
+ width?: number;
8233
+ /**
8234
+ * The number of diffusion steps; higher values can improve quality but take longer
8235
+ */
8236
+ num_steps?: number;
8237
+ /**
8238
+ * The number of diffusion steps; higher values can improve quality but take longer
8239
+ */
8240
+ steps?: number;
8241
+ }
8242
+ interface Ai_Cf_Leonardo_Lucid_Origin_Output {
8243
+ /**
8244
+ * The generated image in Base64 format.
8245
+ */
8246
+ image?: string;
8247
+ }
8248
+ declare abstract class Base_Ai_Cf_Leonardo_Lucid_Origin {
8249
+ inputs: Ai_Cf_Leonardo_Lucid_Origin_Input;
8250
+ postProcessedOutputs: Ai_Cf_Leonardo_Lucid_Origin_Output;
8251
+ }
8252
+ interface Ai_Cf_Deepgram_Aura_1_Input {
8253
+ /**
8254
+ * Speaker used to produce the audio.
8255
+ */
8256
+ speaker?:
8257
+ | "angus"
8258
+ | "asteria"
8259
+ | "arcas"
8260
+ | "orion"
8261
+ | "orpheus"
8262
+ | "athena"
8263
+ | "luna"
8264
+ | "zeus"
8265
+ | "perseus"
8266
+ | "helios"
8267
+ | "hera"
8268
+ | "stella";
8269
+ /**
8270
+ * Encoding of the output audio.
8271
+ */
8272
+ encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
8273
+ /**
8274
+ * Container specifies the file format wrapper for the output audio. The available options depend on the encoding type.
8275
+ */
8276
+ container?: "none" | "wav" | "ogg";
8277
+ /**
8278
+ * The text content to be converted to speech
8279
+ */
8280
+ text: string;
8281
+ /**
8282
+ * Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable
8283
+ */
8284
+ sample_rate?: number;
8285
+ /**
8286
+ * The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type.
8287
+ */
8288
+ bit_rate?: number;
8289
+ }
8290
+ /**
8291
+ * The generated audio in MP3 format
8292
+ */
8293
+ type Ai_Cf_Deepgram_Aura_1_Output = string;
8294
+ declare abstract class Base_Ai_Cf_Deepgram_Aura_1 {
8295
+ inputs: Ai_Cf_Deepgram_Aura_1_Input;
8296
+ postProcessedOutputs: Ai_Cf_Deepgram_Aura_1_Output;
8297
+ }
8298
+ interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input {
8299
+ /**
8300
+ * Input text to translate. Can be a single string or a list of strings.
8301
+ */
8302
+ text: string | string[];
8303
+ /**
8304
+ * Target language to translate to
8305
+ */
8306
+ target_language:
8307
+ | "asm_Beng"
8308
+ | "awa_Deva"
8309
+ | "ben_Beng"
8310
+ | "bho_Deva"
8311
+ | "brx_Deva"
8312
+ | "doi_Deva"
8313
+ | "eng_Latn"
8314
+ | "gom_Deva"
8315
+ | "gon_Deva"
8316
+ | "guj_Gujr"
8317
+ | "hin_Deva"
8318
+ | "hne_Deva"
8319
+ | "kan_Knda"
8320
+ | "kas_Arab"
8321
+ | "kas_Deva"
8322
+ | "kha_Latn"
8323
+ | "lus_Latn"
8324
+ | "mag_Deva"
8325
+ | "mai_Deva"
8326
+ | "mal_Mlym"
8327
+ | "mar_Deva"
8328
+ | "mni_Beng"
8329
+ | "mni_Mtei"
8330
+ | "npi_Deva"
8331
+ | "ory_Orya"
8332
+ | "pan_Guru"
8333
+ | "san_Deva"
8334
+ | "sat_Olck"
8335
+ | "snd_Arab"
8336
+ | "snd_Deva"
8337
+ | "tam_Taml"
8338
+ | "tel_Telu"
8339
+ | "urd_Arab"
8340
+ | "unr_Deva";
8341
+ }
8342
+ interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output {
8343
+ /**
8344
+ * Translated texts
8345
+ */
8346
+ translations: string[];
8347
+ }
8348
+ declare abstract class Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B {
8349
+ inputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input;
8350
+ postProcessedOutputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output;
8351
+ }
8352
+ type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input =
8353
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt
8354
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages
8355
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch;
8356
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt {
8357
+ /**
8358
+ * The input text prompt for the model to generate a response.
8359
+ */
8360
+ prompt: string;
8361
+ /**
8362
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
8363
+ */
8364
+ lora?: string;
8365
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode;
8366
+ /**
8367
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
8368
+ */
8369
+ raw?: boolean;
8370
+ /**
8371
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
8372
+ */
8373
+ stream?: boolean;
8374
+ /**
8375
+ * The maximum number of tokens to generate in the response.
8376
+ */
8377
+ max_tokens?: number;
8378
+ /**
8379
+ * Controls the randomness of the output; higher values produce more random results.
8380
+ */
8381
+ temperature?: number;
8382
+ /**
8383
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
8384
+ */
8385
+ top_p?: number;
8386
+ /**
8387
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
8388
+ */
8389
+ top_k?: number;
8390
+ /**
8391
+ * Random seed for reproducibility of the generation.
8392
+ */
8393
+ seed?: number;
8394
+ /**
8395
+ * Penalty for repeated tokens; higher values discourage repetition.
8396
+ */
8397
+ repetition_penalty?: number;
8398
+ /**
8399
+ * Decreases the likelihood of the model repeating the same lines verbatim.
8400
+ */
8401
+ frequency_penalty?: number;
8402
+ /**
8403
+ * Increases the likelihood of the model introducing new topics.
8404
+ */
8405
+ presence_penalty?: number;
8406
+ }
8407
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode {
8408
+ type?: "json_object" | "json_schema";
8409
+ json_schema?: unknown;
8410
+ }
8411
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages {
8412
+ /**
8413
+ * An array of message objects representing the conversation history.
8414
+ */
8415
+ messages: {
8416
+ /**
8417
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
8418
+ */
8419
+ role: string;
8420
+ /**
8421
+ * The content of the message as a string.
8422
+ */
8423
+ content: string;
8424
+ }[];
8425
+ functions?: {
8426
+ name: string;
8427
+ code: string;
8428
+ }[];
8429
+ /**
8430
+ * A list of tools available for the assistant to use.
8431
+ */
8432
+ tools?: (
8433
+ | {
8434
+ /**
8435
+ * The name of the tool. More descriptive the better.
8436
+ */
8437
+ name: string;
8438
+ /**
8439
+ * A brief description of what the tool does.
8440
+ */
8441
+ description: string;
8442
+ /**
8443
+ * Schema defining the parameters accepted by the tool.
8444
+ */
8445
+ parameters: {
8446
+ /**
8447
+ * The type of the parameters object (usually 'object').
8448
+ */
8449
+ type: string;
8450
+ /**
8451
+ * List of required parameter names.
8452
+ */
8453
+ required?: string[];
8454
+ /**
8455
+ * Definitions of each parameter.
8456
+ */
8457
+ properties: {
8458
+ [k: string]: {
8459
+ /**
8460
+ * The data type of the parameter.
8461
+ */
8462
+ type: string;
8463
+ /**
8464
+ * A description of the expected parameter.
8465
+ */
8466
+ description: string;
8467
+ };
8468
+ };
8469
+ };
8470
+ }
8471
+ | {
8472
+ /**
8473
+ * Specifies the type of tool (e.g., 'function').
8474
+ */
8475
+ type: string;
8476
+ /**
8477
+ * Details of the function tool.
8478
+ */
8479
+ function: {
8480
+ /**
8481
+ * The name of the function.
8482
+ */
8483
+ name: string;
8484
+ /**
8485
+ * A brief description of what the function does.
8486
+ */
8487
+ description: string;
8488
+ /**
8489
+ * Schema defining the parameters accepted by the function.
8490
+ */
8491
+ parameters: {
8492
+ /**
8493
+ * The type of the parameters object (usually 'object').
8494
+ */
8495
+ type: string;
8496
+ /**
8497
+ * List of required parameter names.
8498
+ */
8499
+ required?: string[];
8500
+ /**
8501
+ * Definitions of each parameter.
8502
+ */
8503
+ properties: {
8504
+ [k: string]: {
8505
+ /**
8506
+ * The data type of the parameter.
8507
+ */
8508
+ type: string;
8509
+ /**
8510
+ * A description of the expected parameter.
8511
+ */
8512
+ description: string;
8513
+ };
8514
+ };
8515
+ };
8516
+ };
8517
+ }
8518
+ )[];
8519
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1;
8520
+ /**
8521
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
8522
+ */
8523
+ raw?: boolean;
8524
+ /**
8525
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
8526
+ */
8527
+ stream?: boolean;
8528
+ /**
8529
+ * The maximum number of tokens to generate in the response.
8530
+ */
8531
+ max_tokens?: number;
8532
+ /**
8533
+ * Controls the randomness of the output; higher values produce more random results.
8534
+ */
8535
+ temperature?: number;
8536
+ /**
8537
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
6947
8538
  */
6948
- punctuate?: boolean;
8539
+ top_p?: number;
6949
8540
  /**
6950
- * Redaction removes sensitive information from your transcripts.
8541
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
6951
8542
  */
6952
- redact?: string;
8543
+ top_k?: number;
6953
8544
  /**
6954
- * Search for terms or phrases in submitted audio and replaces them.
8545
+ * Random seed for reproducibility of the generation.
6955
8546
  */
6956
- replace?: string;
8547
+ seed?: number;
6957
8548
  /**
6958
- * Search for terms or phrases in submitted audio.
8549
+ * Penalty for repeated tokens; higher values discourage repetition.
6959
8550
  */
6960
- search?: string;
8551
+ repetition_penalty?: number;
6961
8552
  /**
6962
- * Recognizes the sentiment throughout a transcript or text.
8553
+ * Decreases the likelihood of the model repeating the same lines verbatim.
6963
8554
  */
6964
- sentiment?: boolean;
8555
+ frequency_penalty?: number;
6965
8556
  /**
6966
- * Apply formatting to transcript output. When set to true, additional formatting will be applied to transcripts to improve readability.
8557
+ * Increases the likelihood of the model introducing new topics.
6967
8558
  */
6968
- smart_format?: boolean;
8559
+ presence_penalty?: number;
8560
+ }
8561
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1 {
8562
+ type?: "json_object" | "json_schema";
8563
+ json_schema?: unknown;
8564
+ }
8565
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch {
8566
+ requests: (
8567
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1
8568
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1
8569
+ )[];
8570
+ }
8571
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1 {
6969
8572
  /**
6970
- * Detect topics throughout a transcript or text.
8573
+ * The input text prompt for the model to generate a response.
6971
8574
  */
6972
- topics?: boolean;
8575
+ prompt: string;
6973
8576
  /**
6974
- * Segments speech into meaningful semantic units.
8577
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
6975
8578
  */
6976
- utterances?: boolean;
8579
+ lora?: string;
8580
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2;
6977
8581
  /**
6978
- * Seconds to wait before detecting a pause between words in submitted audio.
8582
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
6979
8583
  */
6980
- utt_split?: number;
8584
+ raw?: boolean;
6981
8585
  /**
6982
- * The number of channels in the submitted audio
8586
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
6983
8587
  */
6984
- channels?: number;
8588
+ stream?: boolean;
6985
8589
  /**
6986
- * Specifies whether the streaming endpoint should provide ongoing transcription updates as more audio is received. When set to true, the endpoint sends continuous updates, meaning transcription results may evolve over time. Note: Supported only for webosockets.
8590
+ * The maximum number of tokens to generate in the response.
6987
8591
  */
6988
- interim_results?: boolean;
8592
+ max_tokens?: number;
6989
8593
  /**
6990
- * Indicates how long model will wait to detect whether a speaker has finished speaking or pauses for a significant period of time. When set to a value, the streaming endpoint immediately finalizes the transcription for the processed time range and returns the transcript with a speech_final parameter set to true. Can also be set to false to disable endpointing
8594
+ * Controls the randomness of the output; higher values produce more random results.
6991
8595
  */
6992
- endpointing?: string;
8596
+ temperature?: number;
6993
8597
  /**
6994
- * Indicates that speech has started. You'll begin receiving Speech Started messages upon speech starting. Note: Supported only for webosockets.
8598
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
6995
8599
  */
6996
- vad_events?: boolean;
8600
+ top_p?: number;
6997
8601
  /**
6998
- * Indicates how long model will wait to send an UtteranceEnd message after a word has been transcribed. Use with interim_results. Note: Supported only for webosockets.
8602
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
6999
8603
  */
7000
- utterance_end_ms?: boolean;
8604
+ top_k?: number;
8605
+ /**
8606
+ * Random seed for reproducibility of the generation.
8607
+ */
8608
+ seed?: number;
8609
+ /**
8610
+ * Penalty for repeated tokens; higher values discourage repetition.
8611
+ */
8612
+ repetition_penalty?: number;
8613
+ /**
8614
+ * Decreases the likelihood of the model repeating the same lines verbatim.
8615
+ */
8616
+ frequency_penalty?: number;
8617
+ /**
8618
+ * Increases the likelihood of the model introducing new topics.
8619
+ */
8620
+ presence_penalty?: number;
7001
8621
  }
7002
- interface Ai_Cf_Deepgram_Nova_3_Output {
7003
- results?: {
7004
- channels?: {
7005
- alternatives?: {
7006
- confidence?: number;
7007
- transcript?: string;
7008
- words?: {
7009
- confidence?: number;
7010
- end?: number;
7011
- start?: number;
7012
- word?: string;
7013
- }[];
7014
- }[];
7015
- }[];
7016
- summary?: {
7017
- result?: string;
7018
- short?: string;
7019
- };
7020
- sentiments?: {
7021
- segments?: {
7022
- text?: string;
7023
- start_word?: number;
7024
- end_word?: number;
7025
- sentiment?: string;
7026
- sentiment_score?: number;
7027
- }[];
7028
- average?: {
7029
- sentiment?: string;
7030
- sentiment_score?: number;
7031
- };
7032
- };
7033
- };
8622
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2 {
8623
+ type?: "json_object" | "json_schema";
8624
+ json_schema?: unknown;
8625
+ }
8626
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1 {
8627
+ /**
8628
+ * An array of message objects representing the conversation history.
8629
+ */
8630
+ messages: {
8631
+ /**
8632
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
8633
+ */
8634
+ role: string;
8635
+ /**
8636
+ * The content of the message as a string.
8637
+ */
8638
+ content: string;
8639
+ }[];
8640
+ functions?: {
8641
+ name: string;
8642
+ code: string;
8643
+ }[];
8644
+ /**
8645
+ * A list of tools available for the assistant to use.
8646
+ */
8647
+ tools?: (
8648
+ | {
8649
+ /**
8650
+ * The name of the tool. More descriptive the better.
8651
+ */
8652
+ name: string;
8653
+ /**
8654
+ * A brief description of what the tool does.
8655
+ */
8656
+ description: string;
8657
+ /**
8658
+ * Schema defining the parameters accepted by the tool.
8659
+ */
8660
+ parameters: {
8661
+ /**
8662
+ * The type of the parameters object (usually 'object').
8663
+ */
8664
+ type: string;
8665
+ /**
8666
+ * List of required parameter names.
8667
+ */
8668
+ required?: string[];
8669
+ /**
8670
+ * Definitions of each parameter.
8671
+ */
8672
+ properties: {
8673
+ [k: string]: {
8674
+ /**
8675
+ * The data type of the parameter.
8676
+ */
8677
+ type: string;
8678
+ /**
8679
+ * A description of the expected parameter.
8680
+ */
8681
+ description: string;
8682
+ };
8683
+ };
8684
+ };
8685
+ }
8686
+ | {
8687
+ /**
8688
+ * Specifies the type of tool (e.g., 'function').
8689
+ */
8690
+ type: string;
8691
+ /**
8692
+ * Details of the function tool.
8693
+ */
8694
+ function: {
8695
+ /**
8696
+ * The name of the function.
8697
+ */
8698
+ name: string;
8699
+ /**
8700
+ * A brief description of what the function does.
8701
+ */
8702
+ description: string;
8703
+ /**
8704
+ * Schema defining the parameters accepted by the function.
8705
+ */
8706
+ parameters: {
8707
+ /**
8708
+ * The type of the parameters object (usually 'object').
8709
+ */
8710
+ type: string;
8711
+ /**
8712
+ * List of required parameter names.
8713
+ */
8714
+ required?: string[];
8715
+ /**
8716
+ * Definitions of each parameter.
8717
+ */
8718
+ properties: {
8719
+ [k: string]: {
8720
+ /**
8721
+ * The data type of the parameter.
8722
+ */
8723
+ type: string;
8724
+ /**
8725
+ * A description of the expected parameter.
8726
+ */
8727
+ description: string;
8728
+ };
8729
+ };
8730
+ };
8731
+ };
8732
+ }
8733
+ )[];
8734
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3;
8735
+ /**
8736
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
8737
+ */
8738
+ raw?: boolean;
8739
+ /**
8740
+ * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
8741
+ */
8742
+ stream?: boolean;
8743
+ /**
8744
+ * The maximum number of tokens to generate in the response.
8745
+ */
8746
+ max_tokens?: number;
8747
+ /**
8748
+ * Controls the randomness of the output; higher values produce more random results.
8749
+ */
8750
+ temperature?: number;
8751
+ /**
8752
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
8753
+ */
8754
+ top_p?: number;
8755
+ /**
8756
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
8757
+ */
8758
+ top_k?: number;
8759
+ /**
8760
+ * Random seed for reproducibility of the generation.
8761
+ */
8762
+ seed?: number;
8763
+ /**
8764
+ * Penalty for repeated tokens; higher values discourage repetition.
8765
+ */
8766
+ repetition_penalty?: number;
8767
+ /**
8768
+ * Decreases the likelihood of the model repeating the same lines verbatim.
8769
+ */
8770
+ frequency_penalty?: number;
8771
+ /**
8772
+ * Increases the likelihood of the model introducing new topics.
8773
+ */
8774
+ presence_penalty?: number;
7034
8775
  }
7035
- declare abstract class Base_Ai_Cf_Deepgram_Nova_3 {
7036
- inputs: Ai_Cf_Deepgram_Nova_3_Input;
7037
- postProcessedOutputs: Ai_Cf_Deepgram_Nova_3_Output;
8776
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3 {
8777
+ type?: "json_object" | "json_schema";
8778
+ json_schema?: unknown;
7038
8779
  }
7039
- type Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input =
7040
- | {
8780
+ type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output =
8781
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response
8782
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response
8783
+ | string
8784
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse;
8785
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response {
8786
+ /**
8787
+ * Unique identifier for the completion
8788
+ */
8789
+ id?: string;
8790
+ /**
8791
+ * Object type identifier
8792
+ */
8793
+ object?: "chat.completion";
8794
+ /**
8795
+ * Unix timestamp of when the completion was created
8796
+ */
8797
+ created?: number;
8798
+ /**
8799
+ * Model used for the completion
8800
+ */
8801
+ model?: string;
8802
+ /**
8803
+ * List of completion choices
8804
+ */
8805
+ choices?: {
8806
+ /**
8807
+ * Index of the choice in the list
8808
+ */
8809
+ index?: number;
8810
+ /**
8811
+ * The message generated by the model
8812
+ */
8813
+ message?: {
7041
8814
  /**
7042
- * readable stream with audio data and content-type specified for that data
8815
+ * Role of the message author
7043
8816
  */
7044
- audio: {
7045
- body: object;
7046
- contentType: string;
7047
- };
8817
+ role: string;
7048
8818
  /**
7049
- * type of data PCM data that's sent to the inference server as raw array
8819
+ * The content of the message
7050
8820
  */
7051
- dtype?: "uint8" | "float32" | "float64";
7052
- }
7053
- | {
8821
+ content: string;
7054
8822
  /**
7055
- * base64 encoded audio data
8823
+ * Internal reasoning content (if available)
7056
8824
  */
7057
- audio: string;
8825
+ reasoning_content?: string;
7058
8826
  /**
7059
- * type of data PCM data that's sent to the inference server as raw array
8827
+ * Tool calls made by the assistant
7060
8828
  */
7061
- dtype?: "uint8" | "float32" | "float64";
8829
+ tool_calls?: {
8830
+ /**
8831
+ * Unique identifier for the tool call
8832
+ */
8833
+ id: string;
8834
+ /**
8835
+ * Type of tool call
8836
+ */
8837
+ type: "function";
8838
+ function: {
8839
+ /**
8840
+ * Name of the function to call
8841
+ */
8842
+ name: string;
8843
+ /**
8844
+ * JSON string of arguments for the function
8845
+ */
8846
+ arguments: string;
8847
+ };
8848
+ }[];
7062
8849
  };
7063
- interface Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output {
8850
+ /**
8851
+ * Reason why the model stopped generating
8852
+ */
8853
+ finish_reason?: string;
8854
+ /**
8855
+ * Stop reason (may be null)
8856
+ */
8857
+ stop_reason?: string | null;
8858
+ /**
8859
+ * Log probabilities (if requested)
8860
+ */
8861
+ logprobs?: {} | null;
8862
+ }[];
7064
8863
  /**
7065
- * if true, end-of-turn was detected
8864
+ * Usage statistics for the inference request
7066
8865
  */
7067
- is_complete?: boolean;
8866
+ usage?: {
8867
+ /**
8868
+ * Total number of tokens in input
8869
+ */
8870
+ prompt_tokens?: number;
8871
+ /**
8872
+ * Total number of tokens in output
8873
+ */
8874
+ completion_tokens?: number;
8875
+ /**
8876
+ * Total number of input and output tokens
8877
+ */
8878
+ total_tokens?: number;
8879
+ };
7068
8880
  /**
7069
- * probability of the end-of-turn detection
8881
+ * Log probabilities for the prompt (if requested)
7070
8882
  */
7071
- probability?: number;
7072
- }
7073
- declare abstract class Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2 {
7074
- inputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input;
7075
- postProcessedOutputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output;
8883
+ prompt_logprobs?: {} | null;
7076
8884
  }
7077
- type Ai_Cf_Openai_Gpt_Oss_120B_Input =
7078
- | GPT_OSS_120B_Responses
7079
- | GPT_OSS_120B_Responses_Async;
7080
- interface GPT_OSS_120B_Responses {
8885
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response {
8886
+ /**
8887
+ * Unique identifier for the completion
8888
+ */
8889
+ id?: string;
8890
+ /**
8891
+ * Object type identifier
8892
+ */
8893
+ object?: "text_completion";
8894
+ /**
8895
+ * Unix timestamp of when the completion was created
8896
+ */
8897
+ created?: number;
8898
+ /**
8899
+ * Model used for the completion
8900
+ */
8901
+ model?: string;
7081
8902
  /**
7082
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8903
+ * List of completion choices
7083
8904
  */
7084
- input: string | unknown[];
7085
- reasoning?: {
8905
+ choices?: {
7086
8906
  /**
7087
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
8907
+ * Index of the choice in the list
7088
8908
  */
7089
- effort?: "low" | "medium" | "high";
8909
+ index: number;
7090
8910
  /**
7091
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
8911
+ * The generated text completion
7092
8912
  */
7093
- summary?: "auto" | "concise" | "detailed";
7094
- };
7095
- }
7096
- interface GPT_OSS_120B_Responses_Async {
7097
- requests: {
8913
+ text: string;
7098
8914
  /**
7099
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8915
+ * Reason why the model stopped generating
7100
8916
  */
7101
- input: string | unknown[];
7102
- reasoning?: {
7103
- /**
7104
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
7105
- */
7106
- effort?: "low" | "medium" | "high";
7107
- /**
7108
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
7109
- */
7110
- summary?: "auto" | "concise" | "detailed";
7111
- };
8917
+ finish_reason: string;
8918
+ /**
8919
+ * Stop reason (may be null)
8920
+ */
8921
+ stop_reason?: string | null;
8922
+ /**
8923
+ * Log probabilities (if requested)
8924
+ */
8925
+ logprobs?: {} | null;
8926
+ /**
8927
+ * Log probabilities for the prompt (if requested)
8928
+ */
8929
+ prompt_logprobs?: {} | null;
7112
8930
  }[];
7113
- }
7114
- type Ai_Cf_Openai_Gpt_Oss_120B_Output = {} | (string & NonNullable<unknown>);
7115
- declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_120B {
7116
- inputs: Ai_Cf_Openai_Gpt_Oss_120B_Input;
7117
- postProcessedOutputs: Ai_Cf_Openai_Gpt_Oss_120B_Output;
7118
- }
7119
- type Ai_Cf_Openai_Gpt_Oss_20B_Input =
7120
- | GPT_OSS_20B_Responses
7121
- | GPT_OSS_20B_Responses_Async;
7122
- interface GPT_OSS_20B_Responses {
7123
8931
  /**
7124
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8932
+ * Usage statistics for the inference request
7125
8933
  */
7126
- input: string | unknown[];
7127
- reasoning?: {
8934
+ usage?: {
7128
8935
  /**
7129
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
8936
+ * Total number of tokens in input
7130
8937
  */
7131
- effort?: "low" | "medium" | "high";
8938
+ prompt_tokens?: number;
7132
8939
  /**
7133
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
8940
+ * Total number of tokens in output
7134
8941
  */
7135
- summary?: "auto" | "concise" | "detailed";
7136
- };
7137
- }
7138
- interface GPT_OSS_20B_Responses_Async {
7139
- requests: {
8942
+ completion_tokens?: number;
7140
8943
  /**
7141
- * Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types
8944
+ * Total number of input and output tokens
7142
8945
  */
7143
- input: string | unknown[];
7144
- reasoning?: {
7145
- /**
7146
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
7147
- */
7148
- effort?: "low" | "medium" | "high";
7149
- /**
7150
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
7151
- */
7152
- summary?: "auto" | "concise" | "detailed";
7153
- };
7154
- }[];
8946
+ total_tokens?: number;
8947
+ };
7155
8948
  }
7156
- type Ai_Cf_Openai_Gpt_Oss_20B_Output = {} | (string & NonNullable<unknown>);
7157
- declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_20B {
7158
- inputs: Ai_Cf_Openai_Gpt_Oss_20B_Input;
7159
- postProcessedOutputs: Ai_Cf_Openai_Gpt_Oss_20B_Output;
8949
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse {
8950
+ /**
8951
+ * The async request id that can be used to obtain the results.
8952
+ */
8953
+ request_id?: string;
7160
8954
  }
7161
- interface Ai_Cf_Leonardo_Phoenix_1_0_Input {
8955
+ declare abstract class Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It {
8956
+ inputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input;
8957
+ postProcessedOutputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output;
8958
+ }
8959
+ interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Input {
7162
8960
  /**
7163
- * A text description of the image you want to generate.
8961
+ * Input text to embed. Can be a single string or a list of strings.
7164
8962
  */
7165
- prompt: string;
8963
+ text: string | string[];
8964
+ }
8965
+ interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Output {
7166
8966
  /**
7167
- * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
8967
+ * Embedding vectors, where each vector is a list of floats.
7168
8968
  */
7169
- guidance?: number;
8969
+ data: number[][];
7170
8970
  /**
7171
- * Random seed for reproducibility of the image generation
8971
+ * Shape of the embedding data as [number_of_embeddings, embedding_dimension].
8972
+ *
8973
+ * @minItems 2
8974
+ * @maxItems 2
7172
8975
  */
7173
- seed?: number;
8976
+ shape: [number, number];
8977
+ }
8978
+ declare abstract class Base_Ai_Cf_Pfnet_Plamo_Embedding_1B {
8979
+ inputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Input;
8980
+ postProcessedOutputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Output;
8981
+ }
8982
+ interface Ai_Cf_Deepgram_Flux_Input {
7174
8983
  /**
7175
- * The height of the generated image in pixels
8984
+ * Encoding of the audio stream. Currently only supports raw signed little-endian 16-bit PCM.
7176
8985
  */
7177
- height?: number;
8986
+ encoding: "linear16";
7178
8987
  /**
7179
- * The width of the generated image in pixels
8988
+ * Sample rate of the audio stream in Hz.
7180
8989
  */
7181
- width?: number;
8990
+ sample_rate: string;
7182
8991
  /**
7183
- * The number of diffusion steps; higher values can improve quality but take longer
8992
+ * End-of-turn confidence required to fire an eager end-of-turn event. When set, enables EagerEndOfTurn and TurnResumed events. Valid Values 0.3 - 0.9.
7184
8993
  */
7185
- num_steps?: number;
8994
+ eager_eot_threshold?: string;
7186
8995
  /**
7187
- * Specify what to exclude from the generated images
8996
+ * End-of-turn confidence required to finish a turn. Valid Values 0.5 - 0.9.
7188
8997
  */
7189
- negative_prompt?: string;
8998
+ eot_threshold?: string;
8999
+ /**
9000
+ * A turn will be finished when this much time has passed after speech, regardless of EOT confidence.
9001
+ */
9002
+ eot_timeout_ms?: string;
9003
+ /**
9004
+ * Keyterm prompting can improve recognition of specialized terminology. Pass multiple keyterm query parameters to boost multiple keyterms.
9005
+ */
9006
+ keyterm?: string;
9007
+ /**
9008
+ * Opts out requests from the Deepgram Model Improvement Program. Refer to Deepgram Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip
9009
+ */
9010
+ mip_opt_out?: "true" | "false";
9011
+ /**
9012
+ * Label your requests for the purpose of identification during usage reporting
9013
+ */
9014
+ tag?: string;
7190
9015
  }
7191
9016
  /**
7192
- * The generated image in JPEG format
9017
+ * Output will be returned as websocket messages.
7193
9018
  */
7194
- type Ai_Cf_Leonardo_Phoenix_1_0_Output = string;
7195
- declare abstract class Base_Ai_Cf_Leonardo_Phoenix_1_0 {
7196
- inputs: Ai_Cf_Leonardo_Phoenix_1_0_Input;
7197
- postProcessedOutputs: Ai_Cf_Leonardo_Phoenix_1_0_Output;
7198
- }
7199
- interface Ai_Cf_Leonardo_Lucid_Origin_Input {
9019
+ interface Ai_Cf_Deepgram_Flux_Output {
7200
9020
  /**
7201
- * A text description of the image you want to generate.
9021
+ * The unique identifier of the request (uuid)
7202
9022
  */
7203
- prompt: string;
9023
+ request_id?: string;
7204
9024
  /**
7205
- * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
9025
+ * Starts at 0 and increments for each message the server sends to the client.
7206
9026
  */
7207
- guidance?: number;
9027
+ sequence_id?: number;
7208
9028
  /**
7209
- * Random seed for reproducibility of the image generation
9029
+ * The type of event being reported.
7210
9030
  */
7211
- seed?: number;
9031
+ event?:
9032
+ | "Update"
9033
+ | "StartOfTurn"
9034
+ | "EagerEndOfTurn"
9035
+ | "TurnResumed"
9036
+ | "EndOfTurn";
7212
9037
  /**
7213
- * The height of the generated image in pixels
9038
+ * The index of the current turn
7214
9039
  */
7215
- height?: number;
9040
+ turn_index?: number;
7216
9041
  /**
7217
- * The width of the generated image in pixels
9042
+ * Start time in seconds of the audio range that was transcribed
7218
9043
  */
7219
- width?: number;
9044
+ audio_window_start?: number;
7220
9045
  /**
7221
- * The number of diffusion steps; higher values can improve quality but take longer
9046
+ * End time in seconds of the audio range that was transcribed
7222
9047
  */
7223
- num_steps?: number;
9048
+ audio_window_end?: number;
7224
9049
  /**
7225
- * The number of diffusion steps; higher values can improve quality but take longer
9050
+ * Text that was said over the course of the current turn
7226
9051
  */
7227
- steps?: number;
7228
- }
7229
- interface Ai_Cf_Leonardo_Lucid_Origin_Output {
9052
+ transcript?: string;
7230
9053
  /**
7231
- * The generated image in Base64 format.
9054
+ * The words in the transcript
7232
9055
  */
7233
- image?: string;
9056
+ words?: {
9057
+ /**
9058
+ * The individual punctuated, properly-cased word from the transcript
9059
+ */
9060
+ word: string;
9061
+ /**
9062
+ * Confidence that this word was transcribed correctly
9063
+ */
9064
+ confidence: number;
9065
+ }[];
9066
+ /**
9067
+ * Confidence that no more speech is coming in this turn
9068
+ */
9069
+ end_of_turn_confidence?: number;
7234
9070
  }
7235
- declare abstract class Base_Ai_Cf_Leonardo_Lucid_Origin {
7236
- inputs: Ai_Cf_Leonardo_Lucid_Origin_Input;
7237
- postProcessedOutputs: Ai_Cf_Leonardo_Lucid_Origin_Output;
9071
+ declare abstract class Base_Ai_Cf_Deepgram_Flux {
9072
+ inputs: Ai_Cf_Deepgram_Flux_Input;
9073
+ postProcessedOutputs: Ai_Cf_Deepgram_Flux_Output;
7238
9074
  }
7239
- interface Ai_Cf_Deepgram_Aura_1_Input {
9075
+ interface Ai_Cf_Deepgram_Aura_2_En_Input {
7240
9076
  /**
7241
9077
  * Speaker used to produce the audio.
7242
9078
  */
7243
9079
  speaker?:
7244
- | "angus"
7245
- | "asteria"
9080
+ | "amalthea"
9081
+ | "andromeda"
9082
+ | "apollo"
7246
9083
  | "arcas"
7247
- | "orion"
7248
- | "orpheus"
9084
+ | "aries"
9085
+ | "asteria"
7249
9086
  | "athena"
7250
- | "luna"
7251
- | "zeus"
7252
- | "perseus"
7253
- | "helios"
9087
+ | "atlas"
9088
+ | "aurora"
9089
+ | "callista"
9090
+ | "cora"
9091
+ | "cordelia"
9092
+ | "delia"
9093
+ | "draco"
9094
+ | "electra"
9095
+ | "harmonia"
9096
+ | "helena"
7254
9097
  | "hera"
7255
- | "stella";
9098
+ | "hermes"
9099
+ | "hyperion"
9100
+ | "iris"
9101
+ | "janus"
9102
+ | "juno"
9103
+ | "jupiter"
9104
+ | "luna"
9105
+ | "mars"
9106
+ | "minerva"
9107
+ | "neptune"
9108
+ | "odysseus"
9109
+ | "ophelia"
9110
+ | "orion"
9111
+ | "orpheus"
9112
+ | "pandora"
9113
+ | "phoebe"
9114
+ | "pluto"
9115
+ | "saturn"
9116
+ | "thalia"
9117
+ | "theia"
9118
+ | "vesta"
9119
+ | "zeus";
7256
9120
  /**
7257
9121
  * Encoding of the output audio.
7258
9122
  */
@@ -7277,10 +9141,54 @@ interface Ai_Cf_Deepgram_Aura_1_Input {
7277
9141
  /**
7278
9142
  * The generated audio in MP3 format
7279
9143
  */
7280
- type Ai_Cf_Deepgram_Aura_1_Output = string;
7281
- declare abstract class Base_Ai_Cf_Deepgram_Aura_1 {
7282
- inputs: Ai_Cf_Deepgram_Aura_1_Input;
7283
- postProcessedOutputs: Ai_Cf_Deepgram_Aura_1_Output;
9144
+ type Ai_Cf_Deepgram_Aura_2_En_Output = string;
9145
+ declare abstract class Base_Ai_Cf_Deepgram_Aura_2_En {
9146
+ inputs: Ai_Cf_Deepgram_Aura_2_En_Input;
9147
+ postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_En_Output;
9148
+ }
9149
+ interface Ai_Cf_Deepgram_Aura_2_Es_Input {
9150
+ /**
9151
+ * Speaker used to produce the audio.
9152
+ */
9153
+ speaker?:
9154
+ | "sirio"
9155
+ | "nestor"
9156
+ | "carina"
9157
+ | "celeste"
9158
+ | "alvaro"
9159
+ | "diana"
9160
+ | "aquila"
9161
+ | "selena"
9162
+ | "estrella"
9163
+ | "javier";
9164
+ /**
9165
+ * Encoding of the output audio.
9166
+ */
9167
+ encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
9168
+ /**
9169
+ * Container specifies the file format wrapper for the output audio. The available options depend on the encoding type.
9170
+ */
9171
+ container?: "none" | "wav" | "ogg";
9172
+ /**
9173
+ * The text content to be converted to speech
9174
+ */
9175
+ text: string;
9176
+ /**
9177
+ * Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable
9178
+ */
9179
+ sample_rate?: number;
9180
+ /**
9181
+ * The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type.
9182
+ */
9183
+ bit_rate?: number;
9184
+ }
9185
+ /**
9186
+ * The generated audio in MP3 format
9187
+ */
9188
+ type Ai_Cf_Deepgram_Aura_2_Es_Output = string;
9189
+ declare abstract class Base_Ai_Cf_Deepgram_Aura_2_Es {
9190
+ inputs: Ai_Cf_Deepgram_Aura_2_Es_Input;
9191
+ postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_Es_Output;
7284
9192
  }
7285
9193
  interface AiModels {
7286
9194
  "@cf/huggingface/distilbert-sst-2-int8": BaseAiTextClassification;
@@ -7325,12 +9233,12 @@ interface AiModels {
7325
9233
  "@cf/meta/llama-3-8b-instruct": BaseAiTextGeneration;
7326
9234
  "@cf/fblgit/una-cybertron-7b-v2-bf16": BaseAiTextGeneration;
7327
9235
  "@cf/meta/llama-3-8b-instruct-awq": BaseAiTextGeneration;
7328
- "@hf/meta-llama/meta-llama-3-8b-instruct": BaseAiTextGeneration;
7329
9236
  "@cf/meta/llama-3.1-8b-instruct-fp8": BaseAiTextGeneration;
7330
9237
  "@cf/meta/llama-3.1-8b-instruct-awq": BaseAiTextGeneration;
7331
9238
  "@cf/meta/llama-3.2-3b-instruct": BaseAiTextGeneration;
7332
9239
  "@cf/meta/llama-3.2-1b-instruct": BaseAiTextGeneration;
7333
9240
  "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b": BaseAiTextGeneration;
9241
+ "@cf/ibm-granite/granite-4.0-h-micro": BaseAiTextGeneration;
7334
9242
  "@cf/facebook/bart-large-cnn": BaseAiSummarization;
7335
9243
  "@cf/llava-hf/llava-1.5-7b-hf": BaseAiImageToText;
7336
9244
  "@cf/baai/bge-base-en-v1.5": Base_Ai_Cf_Baai_Bge_Base_En_V1_5;
@@ -7352,13 +9260,21 @@ interface AiModels {
7352
9260
  "@cf/mistralai/mistral-small-3.1-24b-instruct": Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct;
7353
9261
  "@cf/google/gemma-3-12b-it": Base_Ai_Cf_Google_Gemma_3_12B_It;
7354
9262
  "@cf/meta/llama-4-scout-17b-16e-instruct": Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct;
9263
+ "@cf/qwen/qwen3-30b-a3b-fp8": Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8;
7355
9264
  "@cf/deepgram/nova-3": Base_Ai_Cf_Deepgram_Nova_3;
9265
+ "@cf/qwen/qwen3-embedding-0.6b": Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B;
7356
9266
  "@cf/pipecat-ai/smart-turn-v2": Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2;
7357
9267
  "@cf/openai/gpt-oss-120b": Base_Ai_Cf_Openai_Gpt_Oss_120B;
7358
9268
  "@cf/openai/gpt-oss-20b": Base_Ai_Cf_Openai_Gpt_Oss_20B;
7359
9269
  "@cf/leonardo/phoenix-1.0": Base_Ai_Cf_Leonardo_Phoenix_1_0;
7360
9270
  "@cf/leonardo/lucid-origin": Base_Ai_Cf_Leonardo_Lucid_Origin;
7361
9271
  "@cf/deepgram/aura-1": Base_Ai_Cf_Deepgram_Aura_1;
9272
+ "@cf/ai4bharat/indictrans2-en-indic-1B": Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B;
9273
+ "@cf/aisingapore/gemma-sea-lion-v4-27b-it": Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It;
9274
+ "@cf/pfnet/plamo-embedding-1b": Base_Ai_Cf_Pfnet_Plamo_Embedding_1B;
9275
+ "@cf/deepgram/flux": Base_Ai_Cf_Deepgram_Flux;
9276
+ "@cf/deepgram/aura-2-en": Base_Ai_Cf_Deepgram_Aura_2_En;
9277
+ "@cf/deepgram/aura-2-es": Base_Ai_Cf_Deepgram_Aura_2_Es;
7362
9278
  }
7363
9279
  type AiOptions = {
7364
9280
  /**
@@ -7370,6 +9286,16 @@ type AiOptions = {
7370
9286
  * Establish websocket connections, only works for supported models
7371
9287
  */
7372
9288
  websocket?: boolean;
9289
+ /**
9290
+ * Tag your requests to group and view them in Cloudflare dashboard.
9291
+ *
9292
+ * Rules:
9293
+ * Tags must only contain letters, numbers, and the symbols: : - . / @
9294
+ * Each tag can have a maximum of 50 characters.
9295
+ * A maximum of 5 tags is allowed per request.
9296
+ * Duplicate tags will be removed.
9297
+ */
9298
+ tags: string[];
7373
9299
  gateway?: GatewayOptions;
7374
9300
  returnRawResponse?: boolean;
7375
9301
  prefix?: string;
@@ -9457,12 +11383,13 @@ declare namespace Rpc {
9457
11383
  export type Provider<
9458
11384
  T extends object,
9459
11385
  Reserved extends string = never,
9460
- > = MaybeCallableProvider<T> & {
9461
- [K in Exclude<
9462
- keyof T,
9463
- Reserved | symbol | keyof StubBase<never>
9464
- >]: MethodOrProperty<T[K]>;
9465
- };
11386
+ > = MaybeCallableProvider<T> &
11387
+ Pick<
11388
+ {
11389
+ [K in keyof T]: MethodOrProperty<T[K]>;
11390
+ },
11391
+ Exclude<keyof T, Reserved | symbol | keyof StubBase<never>>
11392
+ >;
9466
11393
  }
9467
11394
  declare namespace Cloudflare {
9468
11395
  // Type of `env`.