@cloudflare/workers-types 4.20251121.0 → 4.20251126.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/2021-11-03/index.d.ts +2289 -362
- package/2021-11-03/index.ts +2289 -367
- package/2022-01-31/index.d.ts +2289 -362
- package/2022-01-31/index.ts +2289 -367
- package/2022-03-21/index.d.ts +2289 -362
- package/2022-03-21/index.ts +2289 -367
- package/2022-08-04/index.d.ts +2289 -362
- package/2022-08-04/index.ts +2289 -367
- package/2022-10-31/index.d.ts +2289 -362
- package/2022-10-31/index.ts +2289 -367
- package/2022-11-30/index.d.ts +2289 -362
- package/2022-11-30/index.ts +2289 -367
- package/2023-03-01/index.d.ts +2289 -362
- package/2023-03-01/index.ts +2289 -367
- package/2023-07-01/index.d.ts +2289 -362
- package/2023-07-01/index.ts +2289 -367
- package/experimental/index.d.ts +2289 -362
- package/experimental/index.ts +2289 -367
- package/index.d.ts +2289 -362
- package/index.ts +2289 -367
- package/latest/index.d.ts +2289 -362
- package/latest/index.ts +2289 -367
- package/oldest/index.d.ts +2289 -362
- package/oldest/index.ts +2289 -367
- package/package.json +1 -1
package/2021-11-03/index.d.ts
CHANGED
@@ -4002,6 +4002,427 @@ declare abstract class BaseAiTranslation {
   inputs: AiTranslationInput;
   postProcessedOutputs: AiTranslationOutput;
 }
+/**
+ * Workers AI support for OpenAI's Responses API
+ * Reference: https://github.com/openai/openai-node/blob/master/src/resources/responses/responses.ts
+ *
+ * It's a stripped down version from its source.
+ * It currently supports basic function calling, json mode and accepts images as input.
+ *
+ * It does not include types for WebSearch, CodeInterpreter, FileInputs, MCP, CustomTools.
+ * We plan to add those incrementally as model + platform capabilities evolve.
+ */
+type ResponsesInput = {
+  background?: boolean | null;
+  conversation?: string | ResponseConversationParam | null;
+  include?: Array<ResponseIncludable> | null;
+  input?: string | ResponseInput;
+  instructions?: string | null;
+  max_output_tokens?: number | null;
+  parallel_tool_calls?: boolean | null;
+  previous_response_id?: string | null;
+  prompt_cache_key?: string;
+  reasoning?: Reasoning | null;
+  safety_identifier?: string;
+  service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
+  stream?: boolean | null;
+  stream_options?: StreamOptions | null;
+  temperature?: number | null;
+  text?: ResponseTextConfig;
+  tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
+  tools?: Array<Tool>;
+  top_p?: number | null;
+  truncation?: "auto" | "disabled" | null;
+};
+type ResponsesOutput = {
+  id?: string;
+  created_at?: number;
+  output_text?: string;
+  error?: ResponseError | null;
+  incomplete_details?: ResponseIncompleteDetails | null;
+  instructions?: string | Array<ResponseInputItem> | null;
+  object?: "response";
+  output?: Array<ResponseOutputItem>;
+  parallel_tool_calls?: boolean;
+  temperature?: number | null;
+  tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
+  tools?: Array<Tool>;
+  top_p?: number | null;
+  max_output_tokens?: number | null;
+  previous_response_id?: string | null;
+  prompt?: ResponsePrompt | null;
+  reasoning?: Reasoning | null;
+  safety_identifier?: string;
+  service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
+  status?: ResponseStatus;
+  text?: ResponseTextConfig;
+  truncation?: "auto" | "disabled" | null;
+  usage?: ResponseUsage;
+};
+type EasyInputMessage = {
+  content: string | ResponseInputMessageContentList;
+  role: "user" | "assistant" | "system" | "developer";
+  type?: "message";
+};
+type ResponsesFunctionTool = {
+  name: string;
+  parameters: {
+    [key: string]: unknown;
+  } | null;
+  strict: boolean | null;
+  type: "function";
+  description?: string | null;
+};
+type ResponseIncompleteDetails = {
+  reason?: "max_output_tokens" | "content_filter";
+};
+type ResponsePrompt = {
+  id: string;
+  variables?: {
+    [key: string]: string | ResponseInputText | ResponseInputImage;
+  } | null;
+  version?: string | null;
+};
+type Reasoning = {
+  effort?: ReasoningEffort | null;
+  generate_summary?: "auto" | "concise" | "detailed" | null;
+  summary?: "auto" | "concise" | "detailed" | null;
+};
+type ResponseContent =
+  | ResponseInputText
+  | ResponseInputImage
+  | ResponseOutputText
+  | ResponseOutputRefusal
+  | ResponseContentReasoningText;
+type ResponseContentReasoningText = {
+  text: string;
+  type: "reasoning_text";
+};
+type ResponseConversationParam = {
+  id: string;
+};
+type ResponseCreatedEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.created";
+};
+type ResponseCustomToolCallOutput = {
+  call_id: string;
+  output: string | Array<ResponseInputText | ResponseInputImage>;
+  type: "custom_tool_call_output";
+  id?: string;
+};
+type ResponseError = {
+  code:
+    | "server_error"
+    | "rate_limit_exceeded"
+    | "invalid_prompt"
+    | "vector_store_timeout"
+    | "invalid_image"
+    | "invalid_image_format"
+    | "invalid_base64_image"
+    | "invalid_image_url"
+    | "image_too_large"
+    | "image_too_small"
+    | "image_parse_error"
+    | "image_content_policy_violation"
+    | "invalid_image_mode"
+    | "image_file_too_large"
+    | "unsupported_image_media_type"
+    | "empty_image_file"
+    | "failed_to_download_image"
+    | "image_file_not_found";
+  message: string;
+};
+type ResponseErrorEvent = {
+  code: string | null;
+  message: string;
+  param: string | null;
+  sequence_number: number;
+  type: "error";
+};
+type ResponseFailedEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.failed";
+};
+type ResponseFormatText = {
+  type: "text";
+};
+type ResponseFormatJSONObject = {
+  type: "json_object";
+};
+type ResponseFormatTextConfig =
+  | ResponseFormatText
+  | ResponseFormatTextJSONSchemaConfig
+  | ResponseFormatJSONObject;
+type ResponseFormatTextJSONSchemaConfig = {
+  name: string;
+  schema: {
+    [key: string]: unknown;
+  };
+  type: "json_schema";
+  description?: string;
+  strict?: boolean | null;
+};
+type ResponseFunctionCallArgumentsDeltaEvent = {
+  delta: string;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.function_call_arguments.delta";
+};
+type ResponseFunctionCallArgumentsDoneEvent = {
+  arguments: string;
+  item_id: string;
+  name: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.function_call_arguments.done";
+};
+type ResponseFunctionCallOutputItem =
+  | ResponseInputTextContent
+  | ResponseInputImageContent;
+type ResponseFunctionCallOutputItemList = Array<ResponseFunctionCallOutputItem>;
+type ResponseFunctionToolCall = {
+  arguments: string;
+  call_id: string;
+  name: string;
+  type: "function_call";
+  id?: string;
+  status?: "in_progress" | "completed" | "incomplete";
+};
+interface ResponseFunctionToolCallItem extends ResponseFunctionToolCall {
+  id: string;
+}
+type ResponseFunctionToolCallOutputItem = {
+  id: string;
+  call_id: string;
+  output: string | Array<ResponseInputText | ResponseInputImage>;
+  type: "function_call_output";
+  status?: "in_progress" | "completed" | "incomplete";
+};
+type ResponseIncludable =
+  | "message.input_image.image_url"
+  | "message.output_text.logprobs";
+type ResponseIncompleteEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.incomplete";
+};
+type ResponseInput = Array<ResponseInputItem>;
+type ResponseInputContent = ResponseInputText | ResponseInputImage;
+type ResponseInputImage = {
+  detail: "low" | "high" | "auto";
+  type: "input_image";
+  /**
+   * Base64 encoded image
+   */
+  image_url?: string | null;
+};
+type ResponseInputImageContent = {
+  type: "input_image";
+  detail?: "low" | "high" | "auto" | null;
+  /**
+   * Base64 encoded image
+   */
+  image_url?: string | null;
+};
+type ResponseInputItem =
+  | EasyInputMessage
+  | ResponseInputItemMessage
+  | ResponseOutputMessage
+  | ResponseFunctionToolCall
+  | ResponseInputItemFunctionCallOutput
+  | ResponseReasoningItem;
+type ResponseInputItemFunctionCallOutput = {
+  call_id: string;
+  output: string | ResponseFunctionCallOutputItemList;
+  type: "function_call_output";
+  id?: string | null;
+  status?: "in_progress" | "completed" | "incomplete" | null;
+};
+type ResponseInputItemMessage = {
+  content: ResponseInputMessageContentList;
+  role: "user" | "system" | "developer";
+  status?: "in_progress" | "completed" | "incomplete";
+  type?: "message";
+};
+type ResponseInputMessageContentList = Array<ResponseInputContent>;
+type ResponseInputMessageItem = {
+  id: string;
+  content: ResponseInputMessageContentList;
+  role: "user" | "system" | "developer";
+  status?: "in_progress" | "completed" | "incomplete";
+  type?: "message";
+};
+type ResponseInputText = {
+  text: string;
+  type: "input_text";
+};
+type ResponseInputTextContent = {
+  text: string;
+  type: "input_text";
+};
+type ResponseItem =
+  | ResponseInputMessageItem
+  | ResponseOutputMessage
+  | ResponseFunctionToolCallItem
+  | ResponseFunctionToolCallOutputItem;
+type ResponseOutputItem =
+  | ResponseOutputMessage
+  | ResponseFunctionToolCall
+  | ResponseReasoningItem;
+type ResponseOutputItemAddedEvent = {
+  item: ResponseOutputItem;
+  output_index: number;
+  sequence_number: number;
+  type: "response.output_item.added";
+};
+type ResponseOutputItemDoneEvent = {
+  item: ResponseOutputItem;
+  output_index: number;
+  sequence_number: number;
+  type: "response.output_item.done";
+};
+type ResponseOutputMessage = {
+  id: string;
+  content: Array<ResponseOutputText | ResponseOutputRefusal>;
+  role: "assistant";
+  status: "in_progress" | "completed" | "incomplete";
+  type: "message";
+};
+type ResponseOutputRefusal = {
+  refusal: string;
+  type: "refusal";
+};
+type ResponseOutputText = {
+  text: string;
+  type: "output_text";
+  logprobs?: Array<Logprob>;
+};
+type ResponseReasoningItem = {
+  id: string;
+  summary: Array<ResponseReasoningSummaryItem>;
+  type: "reasoning";
+  content?: Array<ResponseReasoningContentItem>;
+  encrypted_content?: string | null;
+  status?: "in_progress" | "completed" | "incomplete";
+};
+type ResponseReasoningSummaryItem = {
+  text: string;
+  type: "summary_text";
+};
+type ResponseReasoningContentItem = {
+  text: string;
+  type: "reasoning_text";
+};
+type ResponseReasoningTextDeltaEvent = {
+  content_index: number;
+  delta: string;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.reasoning_text.delta";
+};
+type ResponseReasoningTextDoneEvent = {
+  content_index: number;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  text: string;
+  type: "response.reasoning_text.done";
+};
+type ResponseRefusalDeltaEvent = {
+  content_index: number;
+  delta: string;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.refusal.delta";
+};
+type ResponseRefusalDoneEvent = {
+  content_index: number;
+  item_id: string;
+  output_index: number;
+  refusal: string;
+  sequence_number: number;
+  type: "response.refusal.done";
+};
+type ResponseStatus =
+  | "completed"
+  | "failed"
+  | "in_progress"
+  | "cancelled"
+  | "queued"
+  | "incomplete";
+type ResponseStreamEvent =
+  | ResponseCompletedEvent
+  | ResponseCreatedEvent
+  | ResponseErrorEvent
+  | ResponseFunctionCallArgumentsDeltaEvent
+  | ResponseFunctionCallArgumentsDoneEvent
+  | ResponseFailedEvent
+  | ResponseIncompleteEvent
+  | ResponseOutputItemAddedEvent
+  | ResponseOutputItemDoneEvent
+  | ResponseReasoningTextDeltaEvent
+  | ResponseReasoningTextDoneEvent
+  | ResponseRefusalDeltaEvent
+  | ResponseRefusalDoneEvent
+  | ResponseTextDeltaEvent
+  | ResponseTextDoneEvent;
+type ResponseCompletedEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.completed";
+};
+type ResponseTextConfig = {
+  format?: ResponseFormatTextConfig;
+  verbosity?: "low" | "medium" | "high" | null;
+};
+type ResponseTextDeltaEvent = {
+  content_index: number;
+  delta: string;
+  item_id: string;
+  logprobs: Array<Logprob>;
+  output_index: number;
+  sequence_number: number;
+  type: "response.output_text.delta";
+};
+type ResponseTextDoneEvent = {
+  content_index: number;
+  item_id: string;
+  logprobs: Array<Logprob>;
+  output_index: number;
+  sequence_number: number;
+  text: string;
+  type: "response.output_text.done";
+};
+type Logprob = {
+  token: string;
+  logprob: number;
+  top_logprobs?: Array<TopLogprob>;
+};
+type TopLogprob = {
+  token?: string;
+  logprob?: number;
+};
+type ResponseUsage = {
+  input_tokens: number;
+  output_tokens: number;
+  total_tokens: number;
+};
+type Tool = ResponsesFunctionTool;
+type ToolChoiceFunction = {
+  name: string;
+  type: "function";
+};
+type ToolChoiceOptions = "none";
+type ReasoningEffort = "minimal" | "low" | "medium" | "high" | null;
+type StreamOptions = {
+  include_obfuscation?: boolean;
+};
 type Ai_Cf_Baai_Bge_Base_En_V1_5_Input =
   | {
       text: string | string[];
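
Note: the Responses additions above are type surface only. A minimal sketch of how they compose, using nothing beyond the declarations in this hunk — the tool name is hypothetical, and no Workers AI binding call is shown because this diff does not define one:

// A minimal sketch, assuming only the ambient types added above.
const req: ResponsesInput = {
  instructions: "Answer tersely.",
  input: [
    {
      role: "user",
      content: [{ type: "input_text", text: "What is the capital of France?" }],
    },
  ],
  tools: [
    {
      type: "function",
      name: "lookup_city", // hypothetical tool name, for illustration only
      description: "Look up facts about a city",
      parameters: { type: "object", properties: { city: { type: "string" } } },
      strict: null,
    },
  ],
};

// `output` is a discriminated union; narrow on the `type` literal.
function firstToolCall(res: ResponsesOutput): ResponseFunctionToolCall | undefined {
  return res.output?.find(
    (item): item is ResponseFunctionToolCall => item.type === "function_call",
  );
}

// Stream events narrow the same way on ResponseStreamEvent["type"].
function deltaText(ev: ResponseStreamEvent): string {
  return ev.type === "response.output_text.delta" ? ev.delta : "";
}
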
@@ -4034,8 +4455,8 @@ type Ai_Cf_Baai_Bge_Base_En_V1_5_Output =
        */
       pooling?: "mean" | "cls";
     }
-
-interface
+  | Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse;
+interface Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse {
   /**
    * The async request id that can be used to obtain the results.
    */
@@ -4117,7 +4538,13 @@ type Ai_Cf_Meta_M2M100_1_2B_Output =
        */
       translated_text?: string;
     }
-
+  | Ai_Cf_Meta_M2M100_1_2B_AsyncResponse;
+interface Ai_Cf_Meta_M2M100_1_2B_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Meta_M2M100_1_2B {
   inputs: Ai_Cf_Meta_M2M100_1_2B_Input;
   postProcessedOutputs: Ai_Cf_Meta_M2M100_1_2B_Output;
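
Note: several model outputs in this release become unions that may also be an `*_AsyncResponse` carrying only a `request_id`. A minimal narrowing sketch against the M2M100 shapes above; how the id is later redeemed is not described by this diff:

// `request_id` is optional, so this runtime probe is a heuristic narrowing
// aid, not a guarantee about the payload.
function isAsync(
  out: Ai_Cf_Meta_M2M100_1_2B_Output,
): out is Ai_Cf_Meta_M2M100_1_2B_AsyncResponse {
  return typeof out === "object" && out !== null && "request_id" in out;
}

declare const result: Ai_Cf_Meta_M2M100_1_2B_Output;
if (isAsync(result)) {
  // Queued for async processing; redemption mechanism is out of scope here.
  console.log("queued:", result.request_id);
}
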
@@ -4154,7 +4581,13 @@ type Ai_Cf_Baai_Bge_Small_En_V1_5_Output =
        */
       pooling?: "mean" | "cls";
     }
-
+  | Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse;
+interface Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Baai_Bge_Small_En_V1_5 {
   inputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Input;
   postProcessedOutputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Output;
@@ -4191,7 +4624,13 @@ type Ai_Cf_Baai_Bge_Large_En_V1_5_Output =
        */
       pooling?: "mean" | "cls";
     }
-
+  | Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse;
+interface Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Baai_Bge_Large_En_V1_5 {
   inputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Input;
   postProcessedOutputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Output;
@@ -4382,15 +4821,18 @@ declare abstract class Base_Ai_Cf_Openai_Whisper_Large_V3_Turbo {
   postProcessedOutputs: Ai_Cf_Openai_Whisper_Large_V3_Turbo_Output;
 }
 type Ai_Cf_Baai_Bge_M3_Input =
-  | BGEM3InputQueryAndContexts
-  | BGEM3InputEmbedding
+  | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts
+  | Ai_Cf_Baai_Bge_M3_Input_Embedding
   | {
       /**
        * Batch of the embeddings requests to run using async-queue
        */
-      requests: (BGEM3InputQueryAndContexts1 | BGEM3InputEmbedding1)[];
+      requests: (
+        | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1
+        | Ai_Cf_Baai_Bge_M3_Input_Embedding_1
+      )[];
     };
-interface BGEM3InputQueryAndContexts {
+interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts {
   /**
    * A query you wish to perform against the provided contexts. If no query is provided the model with respond with embeddings for contexts
    */
@@ -4409,14 +4851,14 @@ interface BGEM3InputQueryAndContexts {
    */
   truncate_inputs?: boolean;
 }
-interface BGEM3InputEmbedding {
+interface Ai_Cf_Baai_Bge_M3_Input_Embedding {
   text: string | string[];
   /**
    * When provided with too long context should the model error out or truncate the context to fit?
    */
   truncate_inputs?: boolean;
 }
-interface BGEM3InputQueryAndContexts1 {
+interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1 {
   /**
    * A query you wish to perform against the provided contexts. If no query is provided the model with respond with embeddings for contexts
    */
@@ -4435,7 +4877,7 @@ interface BGEM3InputQueryAndContexts1 {
    */
   truncate_inputs?: boolean;
 }
-interface BGEM3InputEmbedding1 {
+interface Ai_Cf_Baai_Bge_M3_Input_Embedding_1 {
   text: string | string[];
   /**
    * When provided with too long context should the model error out or truncate the context to fit?
@@ -4443,11 +4885,11 @@ interface BGEM3InputEmbedding1 {
   truncate_inputs?: boolean;
 }
 type Ai_Cf_Baai_Bge_M3_Output =
-  | BGEM3OuputQuery
-  | BGEM3OutputEmbeddingForContexts
-  | BGEM3OuputEmbedding
-
-interface BGEM3OuputQuery {
+  | Ai_Cf_Baai_Bge_M3_Ouput_Query
+  | Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts
+  | Ai_Cf_Baai_Bge_M3_Ouput_Embedding
+  | Ai_Cf_Baai_Bge_M3_AsyncResponse;
+interface Ai_Cf_Baai_Bge_M3_Ouput_Query {
   response?: {
     /**
      * Index of the context in the request
@@ -4459,7 +4901,7 @@ interface BGEM3OuputQuery {
     score?: number;
   }[];
 }
-interface BGEM3OutputEmbeddingForContexts {
+interface Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts {
   response?: number[][];
   shape?: number[];
   /**
@@ -4467,7 +4909,7 @@ interface BGEM3OutputEmbeddingForContexts {
    */
   pooling?: "mean" | "cls";
 }
-interface BGEM3OuputEmbedding {
+interface Ai_Cf_Baai_Bge_M3_Ouput_Embedding {
   shape?: number[];
   /**
    * Embeddings of the requested text values
@@ -4478,6 +4920,12 @@ interface BGEM3OuputEmbedding {
    */
   pooling?: "mean" | "cls";
 }
+interface Ai_Cf_Baai_Bge_M3_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Baai_Bge_M3 {
   inputs: Ai_Cf_Baai_Bge_M3_Input;
   postProcessedOutputs: Ai_Cf_Baai_Bge_M3_Output;
@@ -4502,8 +4950,10 @@ declare abstract class Base_Ai_Cf_Black_Forest_Labs_Flux_1_Schnell {
   inputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Input;
   postProcessedOutputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Output;
 }
-type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input =
-
+type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input =
+  | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt
+  | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages;
+interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -4554,7 +5004,7 @@ interface Prompt {
    */
   lora?: string;
 }
-interface
+interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -4752,10 +5202,10 @@ declare abstract class Base_Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct {
   postProcessedOutputs: Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Output;
 }
 type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input =
-  | Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt
-  | Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages
-  | AsyncBatch;
-interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch;
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -4764,7 +5214,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
    * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
    */
   lora?: string;
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode;
   /**
    * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
    */
@@ -4806,11 +5256,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
    */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode {
   type?: "json_object" | "json_schema";
   json_schema?: unknown;
 }
-interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -4918,7 +5368,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
       };
     }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1;
   /**
    * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
    */
@@ -4960,7 +5410,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
    */
   presence_penalty?: number;
 }
-interface AsyncBatch {
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch {
   requests?: {
     /**
      * User-supplied reference. This field will be present in the response as well it can be used to reference the request and response. It's NOT validated to be unique.
@@ -5002,9 +5456,13 @@ interface AsyncBatch {
      * Increases the likelihood of the model introducing new topics.
      */
     presence_penalty?: number;
-    response_format?:
+    response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2;
   }[];
 }
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
 type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
   | {
       /**
@@ -5043,7 +5501,13 @@ type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
       }[];
     }
   | string
-
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse;
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast {
   inputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input;
   postProcessedOutputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output;
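
Note: the Llama 3.3 hunks above add per-model `*_JSON_Mode` interfaces and an `*_AsyncResponse` output member. A minimal sketch assuming `prompt: string` is the required field of the `_Prompt` interface (these hunks show that interface only in part), with the output guarded for the `string` union member:

// A prompt-style request asking for JSON output; `prompt: string` is an
// assumption, as the hunks above omit the unchanged part of the interface.
const jsonReq: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt = {
  prompt: 'Reply with {"ok": true} as JSON.',
  response_format: { type: "json_object" },
};

// The output union includes `string`, so guard on typeof before probing
// for `request_id`.
function requestId(
  out: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output,
): string | undefined {
  return typeof out === "object" && "request_id" in out
    ? out.request_id
    : undefined;
}
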
@@ -5150,9 +5614,9 @@ declare abstract class Base_Ai_Cf_Baai_Bge_Reranker_Base {
   postProcessedOutputs: Ai_Cf_Baai_Bge_Reranker_Base_Output;
 }
 type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input =
-  | Qwen2_5_Coder_32B_Instruct_Prompt
-  | Qwen2_5_Coder_32B_Instruct_Messages;
-interface Qwen2_5_Coder_32B_Instruct_Prompt {
+  | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt
+  | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages;
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -5161,7 +5625,7 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
    * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
    */
   lora?: string;
-  response_format?:
+  response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode;
   /**
    * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
    */
@@ -5203,7 +5667,11 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
    */
   presence_penalty?: number;
 }
-interface Qwen2_5_Coder_32B_Instruct_Messages {
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -5311,7 +5779,7 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
       };
     }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1;
   /**
    * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
    */
@@ -5353,6 +5821,10 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
    */
   presence_penalty?: number;
 }
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
 type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output = {
   /**
    * The generated text response from the model
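
Note: the same two-field `JSON_Mode` shape recurs for Qwen2.5 Coder. Both variants as plain literals; the schema payload is illustrative only, since the field is typed `unknown`:

// Plain JSON output vs. output constrained by a JSON Schema (assumed payload).
const plainJson: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1 = {
  type: "json_object",
};
const schemaJson: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1 = {
  type: "json_schema",
  json_schema: {
    type: "object",
    properties: { answer: { type: "string" } },
    required: ["answer"],
  },
};
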
@@ -5393,8 +5865,10 @@ declare abstract class Base_Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct {
   inputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input;
   postProcessedOutputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output;
 }
-type Ai_Cf_Qwen_Qwq_32B_Input =
-
+type Ai_Cf_Qwen_Qwq_32B_Input =
+  | Ai_Cf_Qwen_Qwq_32B_Prompt
+  | Ai_Cf_Qwen_Qwq_32B_Messages;
+interface Ai_Cf_Qwen_Qwq_32B_Prompt {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -5444,7 +5918,7 @@ interface Qwen_Qwq_32B_Prompt {
    */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Qwen_Qwq_32B_Messages {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -5666,9 +6140,9 @@ declare abstract class Base_Ai_Cf_Qwen_Qwq_32B {
   postProcessedOutputs: Ai_Cf_Qwen_Qwq_32B_Output;
 }
 type Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Input =
-  | Mistral_Small_3_1_24B_Instruct_Prompt
-  | Mistral_Small_3_1_24B_Instruct_Messages;
-interface Mistral_Small_3_1_24B_Instruct_Prompt {
+  | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt
+  | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages;
+interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -5718,7 +6192,7 @@ interface Mistral_Small_3_1_24B_Instruct_Prompt {
    */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -5940,9 +6414,9 @@ declare abstract class Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct {
   postProcessedOutputs: Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Output;
 }
 type Ai_Cf_Google_Gemma_3_12B_It_Input =
-  | Google_Gemma_3_12B_It_Prompt
-  | Google_Gemma_3_12B_It_Messages;
-interface Google_Gemma_3_12B_It_Prompt {
+  | Ai_Cf_Google_Gemma_3_12B_It_Prompt
+  | Ai_Cf_Google_Gemma_3_12B_It_Messages;
+interface Ai_Cf_Google_Gemma_3_12B_It_Prompt {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -5992,7 +6466,7 @@ interface Google_Gemma_3_12B_It_Prompt {
    */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Google_Gemma_3_12B_It_Messages {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -6015,20 +6489,7 @@ interface Google_Gemma_3_12B_It_Messages {
            */
           url?: string;
         };
-      }[]
-      | {
-          /**
-           * Type of the content provided
-           */
-          type?: string;
-          text?: string;
-          image_url?: {
-            /**
-             * image uri with data (e.g. data:image/jpeg;base64,/9j/...). HTTP URL will not be accepted
-             */
-            url?: string;
-          };
-        };
+      }[];
   }[];
   functions?: {
     name: string;
@@ -6210,10 +6671,10 @@ declare abstract class Base_Ai_Cf_Google_Gemma_3_12B_It {
   postProcessedOutputs: Ai_Cf_Google_Gemma_3_12B_It_Output;
 }
 type Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input =
-  | Ai_Cf_Meta_Llama_4_Prompt
-  | Ai_Cf_Meta_Llama_4_Messages
-
-interface Ai_Cf_Meta_Llama_4_Prompt {
+  | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt
+  | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages
+  | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch;
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -6222,7 +6683,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
    * JSON schema that should be fulfilled for the response.
    */
   guided_json?: object;
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
    * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
    */
@@ -6264,7 +6725,11 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
    */
   presence_penalty?: number;
 }
-interface Ai_Cf_Meta_Llama_4_Messages {
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -6400,7 +6865,7 @@ interface Ai_Cf_Meta_Llama_4_Messages {
       };
     }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
    * JSON schema that should be fufilled for the response.
    */
@@ -6446,13 +6911,13 @@ interface Ai_Cf_Meta_Llama_4_Messages {
    */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch {
   requests: (
-    | Ai_Cf_Meta_Llama_4_Prompt_Inner
-    | Ai_Cf_Meta_Llama_4_Messages_Inner
+    | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner
+    | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner
   )[];
 }
-interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner {
   /**
    * The input text prompt for the model to generate a response.
    */
@@ -6461,7 +6926,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
    * JSON schema that should be fulfilled for the response.
    */
   guided_json?: object;
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
    * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
    */
@@ -6503,7 +6968,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
    */
   presence_penalty?: number;
 }
-interface Ai_Cf_Meta_Llama_4_Messages_Inner {
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner {
   /**
    * An array of message objects representing the conversation history.
    */
@@ -6639,7 +7104,7 @@ interface Ai_Cf_Meta_Llama_4_Messages_Inner {
       };
     }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
    * JSON schema that should be fufilled for the response.
    */
@@ -6738,414 +7203,1813 @@ declare abstract class Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct {
   inputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input;
   postProcessedOutputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Output;
 }
-
-
-
-
-
-  /**
-   * Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param.
-   */
-  custom_topic_mode?: "extended" | "strict";
-  /**
-   * Custom topics you want the model to detect within your input audio or text if present Submit up to 100
-   */
-  custom_topic?: string;
-  /**
-   * Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition those submitted using the custom_intents param
-   */
-  custom_intent_mode?: "extended" | "strict";
-  /**
-   * Custom intents you want the model to detect within your input audio if present
-   */
-  custom_intent?: string;
-  /**
-   * Identifies and extracts key entities from content in submitted audio
-   */
-  detect_entities?: boolean;
-  /**
-   * Identifies the dominant language spoken in submitted audio
-   */
-  detect_language?: boolean;
-  /**
-   * Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0
-   */
-  diarize?: boolean;
+type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input =
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch;
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt {
   /**
-   *
+   * The input text prompt for the model to generate a response.
    */
-
+  prompt: string;
   /**
-   *
+   * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
    */
-
-
-    | "flac"
-    | "mulaw"
-    | "amr-nb"
-    | "amr-wb"
-    | "opus"
-    | "speex"
-    | "g729";
+  lora?: string;
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode;
   /**
-   *
+   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
    */
-
+  raw?: boolean;
   /**
-   *
+   * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
   */
-
+  stream?: boolean;
   /**
-   *
+   * The maximum number of tokens to generate in the response.
   */
-
+  max_tokens?: number;
   /**
-   *
+   * Controls the randomness of the output; higher values produce more random results.
   */
-
+  temperature?: number;
   /**
-   *
+   * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
   */
-
+  top_p?: number;
   /**
-   *
+   * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
   */
-
+  top_k?: number;
   /**
-   *
+   * Random seed for reproducibility of the generation.
   */
-
+  seed?: number;
   /**
-   *
+   * Penalty for repeated tokens; higher values discourage repetition.
   */
-
+  repetition_penalty?: number;
   /**
-   *
+   * Decreases the likelihood of the model repeating the same lines verbatim.
   */
-
+  frequency_penalty?: number;
   /**
-   *
+   * Increases the likelihood of the model introducing new topics.
   */
-
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages {
   /**
-   *
+   * An array of message objects representing the conversation history.
   */
-
+  messages: {
+    /**
+     * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
+     */
+    role: string;
+    /**
+     * The content of the message as a string.
+     */
+    content: string;
+  }[];
+  functions?: {
+    name: string;
+    code: string;
+  }[];
   /**
-   *
+   * A list of tools available for the assistant to use.
+   */
+  tools?: (
+    | {
+        /**
+         * The name of the tool. More descriptive the better.
+         */
+        name: string;
+        /**
+         * A brief description of what the tool does.
+         */
+        description: string;
+        /**
+         * Schema defining the parameters accepted by the tool.
+         */
+        parameters: {
+          /**
+           * The type of the parameters object (usually 'object').
+           */
+          type: string;
+          /**
+           * List of required parameter names.
+           */
+          required?: string[];
+          /**
+           * Definitions of each parameter.
+           */
+          properties: {
+            [k: string]: {
+              /**
+               * The data type of the parameter.
+               */
+              type: string;
+              /**
+               * A description of the expected parameter.
+               */
+              description: string;
+            };
+          };
+        };
+      }
+    | {
+        /**
+         * Specifies the type of tool (e.g., 'function').
+         */
+        type: string;
+        /**
+         * Details of the function tool.
+         */
+        function: {
+          /**
+           * The name of the function.
+           */
+          name: string;
+          /**
+           * A brief description of what the function does.
+           */
+          description: string;
+          /**
+           * Schema defining the parameters accepted by the function.
+           */
+          parameters: {
+            /**
+             * The type of the parameters object (usually 'object').
+             */
+            type: string;
+            /**
+             * List of required parameter names.
+             */
+            required?: string[];
+            /**
+             * Definitions of each parameter.
+             */
+            properties: {
+              [k: string]: {
+                /**
+                 * The data type of the parameter.
+                 */
+                type: string;
+                /**
+                 * A description of the expected parameter.
+                 */
+                description: string;
+              };
+            };
+          };
+        };
+      }
+  )[];
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1;
+  /**
+   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+   */
+  raw?: boolean;
+  /**
+   * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
+   */
+  stream?: boolean;
+  /**
+   * The maximum number of tokens to generate in the response.
+   */
+  max_tokens?: number;
+  /**
+   * Controls the randomness of the output; higher values produce more random results.
+   */
+  temperature?: number;
+  /**
+   * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+   */
+  top_p?: number;
+  /**
+   * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+   */
+  top_k?: number;
+  /**
+   * Random seed for reproducibility of the generation.
+   */
+  seed?: number;
+  /**
+   * Penalty for repeated tokens; higher values discourage repetition.
+   */
+  repetition_penalty?: number;
+  /**
+   * Decreases the likelihood of the model repeating the same lines verbatim.
+   */
+  frequency_penalty?: number;
+  /**
+   * Increases the likelihood of the model introducing new topics.
+   */
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch {
+  requests: (
+    | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1
+    | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1
+  )[];
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1 {
+  /**
+   * The input text prompt for the model to generate a response.
+   */
+  prompt: string;
+  /**
+   * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
+   */
+  lora?: string;
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2;
+  /**
+   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+   */
+  raw?: boolean;
+  /**
+   * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
+   */
+  stream?: boolean;
+  /**
+   * The maximum number of tokens to generate in the response.
+   */
+  max_tokens?: number;
+  /**
+   * Controls the randomness of the output; higher values produce more random results.
+   */
+  temperature?: number;
+  /**
+   * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+   */
+  top_p?: number;
+  /**
+   * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+   */
+  top_k?: number;
+  /**
+   * Random seed for reproducibility of the generation.
+   */
+  seed?: number;
+  /**
+   * Penalty for repeated tokens; higher values discourage repetition.
+   */
+  repetition_penalty?: number;
+  /**
+   * Decreases the likelihood of the model repeating the same lines verbatim.
+   */
+  frequency_penalty?: number;
+  /**
+   * Increases the likelihood of the model introducing new topics.
+   */
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1 {
+  /**
+   * An array of message objects representing the conversation history.
+   */
+  messages: {
+    /**
+     * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
+     */
+    role: string;
+    /**
+     * The content of the message as a string.
+     */
+    content: string;
+  }[];
+  functions?: {
+    name: string;
+    code: string;
+  }[];
+  /**
+   * A list of tools available for the assistant to use.
+   */
+  tools?: (
+    | {
+        /**
+         * The name of the tool. More descriptive the better.
+         */
+        name: string;
+        /**
+         * A brief description of what the tool does.
+         */
+        description: string;
+        /**
+         * Schema defining the parameters accepted by the tool.
+         */
+        parameters: {
+          /**
+           * The type of the parameters object (usually 'object').
+           */
+          type: string;
+          /**
+           * List of required parameter names.
+           */
+          required?: string[];
+          /**
+           * Definitions of each parameter.
+           */
+          properties: {
+            [k: string]: {
+              /**
+               * The data type of the parameter.
+               */
+              type: string;
+              /**
+               * A description of the expected parameter.
+               */
+              description: string;
+            };
+          };
+        };
+      }
+    | {
+        /**
+         * Specifies the type of tool (e.g., 'function').
+         */
+        type: string;
+        /**
+         * Details of the function tool.
+         */
+        function: {
+          /**
+           * The name of the function.
+           */
+          name: string;
+          /**
+           * A brief description of what the function does.
+           */
+          description: string;
+          /**
+           * Schema defining the parameters accepted by the function.
+           */
+          parameters: {
+            /**
+             * The type of the parameters object (usually 'object').
+             */
+            type: string;
+            /**
+             * List of required parameter names.
+             */
+            required?: string[];
+            /**
+             * Definitions of each parameter.
+             */
+            properties: {
+              [k: string]: {
+                /**
+                 * The data type of the parameter.
+                 */
+                type: string;
+                /**
+                 * A description of the expected parameter.
+                 */
+                description: string;
+              };
+            };
+          };
+        };
+      }
+  )[];
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3;
+  /**
+   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+   */
+  raw?: boolean;
+  /**
+   * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
+   */
+  stream?: boolean;
+  /**
+   * The maximum number of tokens to generate in the response.
+   */
+  max_tokens?: number;
+  /**
+   * Controls the randomness of the output; higher values produce more random results.
+   */
+  temperature?: number;
+  /**
+   * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+   */
+  top_p?: number;
+  /**
+   * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+   */
+  top_k?: number;
+  /**
+   * Random seed for reproducibility of the generation.
+   */
+  seed?: number;
+  /**
+   * Penalty for repeated tokens; higher values discourage repetition.
+   */
+  repetition_penalty?: number;
+  /**
+   * Decreases the likelihood of the model repeating the same lines verbatim.
+   */
+  frequency_penalty?: number;
+  /**
+   * Increases the likelihood of the model introducing new topics.
+   */
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output =
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response
+  | string
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse;
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response {
+  /**
+   * Unique identifier for the completion
+   */
+  id?: string;
+  /**
+   * Object type identifier
+   */
+  object?: "chat.completion";
+  /**
+   * Unix timestamp of when the completion was created
+   */
+  created?: number;
+  /**
+   * Model used for the completion
+   */
+  model?: string;
+  /**
+   * List of completion choices
+   */
+  choices?: {
+    /**
+     * Index of the choice in the list
+     */
+    index?: number;
+    /**
+     * The message generated by the model
+     */
+    message?: {
+      /**
+       * Role of the message author
+       */
+      role: string;
+      /**
+       * The content of the message
+       */
+      content: string;
+      /**
+       * Internal reasoning content (if available)
+       */
+      reasoning_content?: string;
+      /**
+       * Tool calls made by the assistant
+       */
+      tool_calls?: {
+        /**
+         * Unique identifier for the tool call
+         */
+        id: string;
+        /**
+         * Type of tool call
+         */
+        type: "function";
+        function: {
+          /**
+           * Name of the function to call
+           */
+          name: string;
+          /**
+           * JSON string of arguments for the function
+           */
+          arguments: string;
+        };
+      }[];
+    };
+    /**
+     * Reason why the model stopped generating
+     */
+    finish_reason?: string;
+    /**
+     * Stop reason (may be null)
+     */
+    stop_reason?: string | null;
+    /**
+     * Log probabilities (if requested)
+     */
+    logprobs?: {} | null;
+  }[];
+  /**
+   * Usage statistics for the inference request
+   */
+  usage?: {
+    /**
+     * Total number of tokens in input
+     */
+    prompt_tokens?: number;
+    /**
+     * Total number of tokens in output
|
|
7727
|
+
*/
|
|
7728
|
+
completion_tokens?: number;
|
|
7729
|
+
/**
|
|
7730
|
+
* Total number of input and output tokens
|
|
7731
|
+
*/
|
|
7732
|
+
total_tokens?: number;
|
|
7733
|
+
};
|
|
7734
|
+
/**
|
|
7735
|
+
* Log probabilities for the prompt (if requested)
|
|
7736
|
+
*/
|
|
7737
|
+
prompt_logprobs?: {} | null;
|
|
7738
|
+
}
|
|
7739
|
+
interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response {
|
|
7740
|
+
/**
|
|
7741
|
+
* Unique identifier for the completion
|
|
7742
|
+
*/
|
|
7743
|
+
id?: string;
|
|
7744
|
+
/**
|
|
7745
|
+
* Object type identifier
|
|
7746
|
+
*/
|
|
7747
|
+
object?: "text_completion";
|
|
7748
|
+
/**
|
|
7749
|
+
* Unix timestamp of when the completion was created
|
|
7750
|
+
*/
|
|
7751
|
+
created?: number;
|
|
7752
|
+
/**
|
|
7753
|
+
* Model used for the completion
|
|
7754
|
+
*/
|
|
7755
|
+
model?: string;
|
|
7756
|
+
/**
|
|
7757
|
+
* List of completion choices
|
|
7758
|
+
*/
|
|
7759
|
+
choices?: {
|
|
7760
|
+
/**
|
|
7761
|
+
* Index of the choice in the list
|
|
7762
|
+
*/
|
|
7763
|
+
index: number;
|
|
7764
|
+
/**
|
|
7765
|
+
* The generated text completion
|
|
7766
|
+
*/
|
|
7767
|
+
text: string;
|
|
7768
|
+
/**
|
|
7769
|
+
* Reason why the model stopped generating
|
|
7770
|
+
*/
|
|
7771
|
+
finish_reason: string;
|
|
7772
|
+
/**
|
|
7773
|
+
* Stop reason (may be null)
|
|
7774
|
+
*/
|
|
7775
|
+
stop_reason?: string | null;
|
|
7776
|
+
/**
|
|
7777
|
+
* Log probabilities (if requested)
|
|
7778
|
+
*/
|
|
7779
|
+
logprobs?: {} | null;
|
|
7780
|
+
/**
|
|
7781
|
+
* Log probabilities for the prompt (if requested)
|
|
7782
|
+
*/
|
|
7783
|
+
prompt_logprobs?: {} | null;
|
|
7784
|
+
}[];
|
|
7785
|
+
/**
|
|
7786
|
+
* Usage statistics for the inference request
|
|
7787
|
+
*/
|
|
7788
|
+
usage?: {
|
|
7789
|
+
/**
|
|
7790
|
+
* Total number of tokens in input
|
|
7791
|
+
*/
|
|
7792
|
+
prompt_tokens?: number;
|
|
7793
|
+
/**
|
|
7794
|
+
* Total number of tokens in output
|
|
7795
|
+
*/
|
|
7796
|
+
completion_tokens?: number;
|
|
7797
|
+
/**
|
|
7798
|
+
* Total number of input and output tokens
|
|
7799
|
+
*/
|
|
7800
|
+
total_tokens?: number;
|
|
7801
|
+
};
|
|
7802
|
+
}
|
|
7803
|
+
interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse {
|
|
7804
|
+
/**
|
|
7805
|
+
* The async request id that can be used to obtain the results.
|
|
7806
|
+
*/
|
|
7807
|
+
request_id?: string;
|
|
7808
|
+
}
|
|
7809
|
+
declare abstract class Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8 {
|
|
7810
|
+
inputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input;
|
|
7811
|
+
postProcessedOutputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output;
|
|
7812
|
+
}
|
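A minimal sketch of how these Qwen3 types are exercised from a Worker, assuming a Workers AI binding named `AI` (the binding name is project-specific) and the `env.AI.run()` call shape this package declares; the model key `"@cf/qwen/qwen3-30b-a3b-fp8"` is added to `AiModels` further down in this diff:

export default {
  async fetch(_req: Request, env: { AI: Ai }): Promise<Response> {
    // Messages-variant input; the output is a union that includes the
    // Chat_Completion_Response shape declared above.
    const out = await env.AI.run("@cf/qwen/qwen3-30b-a3b-fp8", {
      messages: [{ role: "user", content: "Say hello in one word." }],
      max_tokens: 64,
    });
    return Response.json(out);
  },
};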
+ interface Ai_Cf_Deepgram_Nova_3_Input {
+ audio: {
+ body: object;
+ contentType: string;
+ };
+ /**
+ * Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param.
+ */
+ custom_topic_mode?: "extended" | "strict";
+ /**
+ * Custom topics you want the model to detect within your input audio or text if present. Submit up to 100.
+ */
+ custom_topic?: string;
+ /**
+ * Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition to those submitted using the custom_intent param.
+ */
+ custom_intent_mode?: "extended" | "strict";
+ /**
+ * Custom intents you want the model to detect within your input audio if present
+ */
+ custom_intent?: string;
+ /**
+ * Identifies and extracts key entities from content in submitted audio
+ */
+ detect_entities?: boolean;
+ /**
+ * Identifies the dominant language spoken in submitted audio
+ */
+ detect_language?: boolean;
+ /**
+ * Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0
+ */
+ diarize?: boolean;
+ /**
+ * Converts spoken dictation commands into their corresponding punctuation marks
+ */
+ dictation?: boolean;
+ /**
+ * Specify the expected encoding of your submitted audio
+ */
+ encoding?:
+ | "linear16"
+ | "flac"
+ | "mulaw"
+ | "amr-nb"
+ | "amr-wb"
+ | "opus"
+ | "speex"
+ | "g729";
+ /**
+ * Arbitrary key-value pairs that are attached to the API response for usage in downstream processing
+ */
+ extra?: string;
+ /**
+ * Filler Words can help transcribe interruptions in your audio, like 'uh' and 'um'
+ */
+ filler_words?: boolean;
+ /**
+ * Key term prompting can boost or suppress specialized terminology and brands.
+ */
+ keyterm?: string;
+ /**
+ * Keywords can boost or suppress specialized terminology and brands.
+ */
+ keywords?: string;
+ /**
+ * The BCP-47 language tag that hints at the primary spoken language. Depending on the Model and API endpoint you choose only certain languages are available.
+ */
+ language?: string;
+ /**
+ * Spoken measurements will be converted to their corresponding abbreviations.
+ */
+ measurements?: boolean;
+ /**
+ * Opts out requests from the Deepgram Model Improvement Program. Refer to our Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip.
+ */
+ mip_opt_out?: boolean;
+ /**
+ * Mode of operation for the model representing the broad topic area that will be talked about in the supplied audio
+ */
+ mode?: "general" | "medical" | "finance";
+ /**
+ * Transcribe each audio channel independently.
+ */
+ multichannel?: boolean;
+ /**
+ * Numerals converts numbers from written format to numerical format.
+ */
+ numerals?: boolean;
+ /**
+ * Splits audio into paragraphs to improve transcript readability.
+ */
+ paragraphs?: boolean;
+ /**
+ * Profanity Filter looks for recognized profanity and converts it to the nearest recognized non-profane word or removes it from the transcript completely.
*/
profanity_filter?: boolean;
/**
- * Add punctuation and capitalization to the transcript.
+ * Add punctuation and capitalization to the transcript.
+ */
+ punctuate?: boolean;
+ /**
+ * Redaction removes sensitive information from your transcripts.
+ */
+ redact?: string;
+ /**
+ * Search for terms or phrases in submitted audio and replaces them.
+ */
+ replace?: string;
+ /**
+ * Search for terms or phrases in submitted audio.
+ */
+ search?: string;
+ /**
+ * Recognizes the sentiment throughout a transcript or text.
+ */
+ sentiment?: boolean;
+ /**
+ * Apply formatting to transcript output. When set to true, additional formatting will be applied to transcripts to improve readability.
+ */
+ smart_format?: boolean;
+ /**
+ * Detect topics throughout a transcript or text.
+ */
+ topics?: boolean;
+ /**
+ * Segments speech into meaningful semantic units.
+ */
+ utterances?: boolean;
+ /**
+ * Seconds to wait before detecting a pause between words in submitted audio.
+ */
+ utt_split?: number;
+ /**
+ * The number of channels in the submitted audio
+ */
+ channels?: number;
+ /**
+ * Specifies whether the streaming endpoint should provide ongoing transcription updates as more audio is received. When set to true, the endpoint sends continuous updates, meaning transcription results may evolve over time. Note: Supported only for websockets.
+ */
+ interim_results?: boolean;
+ /**
+ * Indicates how long the model will wait to detect whether a speaker has finished speaking or pauses for a significant period of time. When set to a value, the streaming endpoint immediately finalizes the transcription for the processed time range and returns the transcript with a speech_final parameter set to true. Can also be set to false to disable endpointing
+ */
+ endpointing?: string;
+ /**
+ * Indicates that speech has started. You'll begin receiving Speech Started messages upon speech starting. Note: Supported only for websockets.
+ */
+ vad_events?: boolean;
+ /**
+ * Indicates how long the model will wait to send an UtteranceEnd message after a word has been transcribed. Use with interim_results. Note: Supported only for websockets.
+ */
+ utterance_end_ms?: boolean;
+ }
+ interface Ai_Cf_Deepgram_Nova_3_Output {
+ results?: {
+ channels?: {
+ alternatives?: {
+ confidence?: number;
+ transcript?: string;
+ words?: {
+ confidence?: number;
+ end?: number;
+ start?: number;
+ word?: string;
+ }[];
+ }[];
+ }[];
+ summary?: {
+ result?: string;
+ short?: string;
+ };
+ sentiments?: {
+ segments?: {
+ text?: string;
+ start_word?: number;
+ end_word?: number;
+ sentiment?: string;
+ sentiment_score?: number;
+ }[];
+ average?: {
+ sentiment?: string;
+ sentiment_score?: number;
+ };
+ };
+ };
+ }
+ declare abstract class Base_Ai_Cf_Deepgram_Nova_3 {
+ inputs: Ai_Cf_Deepgram_Nova_3_Input;
+ postProcessedOutputs: Ai_Cf_Deepgram_Nova_3_Output;
+ }
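A minimal transcription sketch against the Nova 3 shapes above, assuming an `AI` binding; `audio.body` is typed as `object`, so an ArrayBuffer (or a ReadableStream) is accepted:

const bytes = await request.arrayBuffer();
const result = await env.AI.run("@cf/deepgram/nova-3", {
  audio: { body: bytes, contentType: "audio/mpeg" },
  punctuate: true,
  smart_format: true,
});
// Every field in the output is optional, hence the defensive chaining.
const transcript = result.results?.channels?.[0]?.alternatives?.[0]?.transcript;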
+ interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input {
+ queries?: string | string[];
+ /**
+ * Optional instruction for the task
+ */
+ instruction?: string;
+ documents?: string | string[];
+ text?: string | string[];
+ }
+ interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output {
+ data?: number[][];
+ shape?: number[];
+ }
+ declare abstract class Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B {
+ inputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input;
+ postProcessedOutputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output;
+ }
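The embedding input accepts `text` as a single string or a list (or a `queries`/`documents` pair); a sketch assuming an `AI` binding:

const { data, shape } = await env.AI.run("@cf/qwen/qwen3-embedding-0.6b", {
  text: ["first passage", "second passage"],
});
// data is number[][] (one vector per input string); shape is [count, dimension].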
+ type Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input =
+ | {
+ /**
+ * readable stream with audio data and content-type specified for that data
+ */
+ audio: {
+ body: object;
+ contentType: string;
+ };
+ /**
+ * type of the PCM data that's sent to the inference server as a raw array
+ */
+ dtype?: "uint8" | "float32" | "float64";
+ }
+ | {
+ /**
+ * base64 encoded audio data
+ */
+ audio: string;
+ /**
+ * type of the PCM data that's sent to the inference server as a raw array
+ */
+ dtype?: "uint8" | "float32" | "float64";
+ };
+ interface Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output {
+ /**
+ * if true, end-of-turn was detected
+ */
+ is_complete?: boolean;
+ /**
+ * probability of the end-of-turn detection
+ */
+ probability?: number;
+ }
+ declare abstract class Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2 {
+ inputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input;
+ postProcessedOutputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output;
+ }
+ declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_120B {
+ inputs: ResponsesInput;
+ postProcessedOutputs: ResponsesOutput;
+ }
+ declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_20B {
+ inputs: ResponsesInput;
+ postProcessedOutputs: ResponsesOutput;
+ }
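Both gpt-oss bindings now reuse the shared `ResponsesInput`/`ResponsesOutput` pair declared earlier in this file; the old GPT_OSS_* shapes are deleted further down in this diff. A sketch assuming an `AI` binding, using only fields that `ResponsesInput` declares:

const res = await env.AI.run("@cf/openai/gpt-oss-120b", {
  instructions: "Answer in one sentence.",
  input: "What is the Responses API?",
});
// ResponsesOutput carries the convenience field output_text when present.
console.log(res.output_text);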
+ interface Ai_Cf_Leonardo_Phoenix_1_0_Input {
+ /**
+ * A text description of the image you want to generate.
+ */
+ prompt: string;
+ /**
+ * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
+ */
+ guidance?: number;
+ /**
+ * Random seed for reproducibility of the image generation
+ */
+ seed?: number;
+ /**
+ * The height of the generated image in pixels
+ */
+ height?: number;
+ /**
+ * The width of the generated image in pixels
+ */
+ width?: number;
+ /**
+ * The number of diffusion steps; higher values can improve quality but take longer
+ */
+ num_steps?: number;
+ /**
+ * Specify what to exclude from the generated images
+ */
+ negative_prompt?: string;
+ }
+ /**
+ * The generated image in JPEG format
+ */
+ type Ai_Cf_Leonardo_Phoenix_1_0_Output = string;
+ declare abstract class Base_Ai_Cf_Leonardo_Phoenix_1_0 {
+ inputs: Ai_Cf_Leonardo_Phoenix_1_0_Input;
+ postProcessedOutputs: Ai_Cf_Leonardo_Phoenix_1_0_Output;
+ }
+ interface Ai_Cf_Leonardo_Lucid_Origin_Input {
+ /**
+ * A text description of the image you want to generate.
+ */
+ prompt: string;
+ /**
+ * Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt
+ */
+ guidance?: number;
+ /**
+ * Random seed for reproducibility of the image generation
+ */
+ seed?: number;
+ /**
+ * The height of the generated image in pixels
+ */
+ height?: number;
+ /**
+ * The width of the generated image in pixels
+ */
+ width?: number;
+ /**
+ * The number of diffusion steps; higher values can improve quality but take longer
+ */
+ num_steps?: number;
+ /**
+ * The number of diffusion steps; higher values can improve quality but take longer
+ */
+ steps?: number;
+ }
+ interface Ai_Cf_Leonardo_Lucid_Origin_Output {
+ /**
+ * The generated image in Base64 format.
+ */
+ image?: string;
+ }
+ declare abstract class Base_Ai_Cf_Leonardo_Lucid_Origin {
+ inputs: Ai_Cf_Leonardo_Lucid_Origin_Input;
+ postProcessedOutputs: Ai_Cf_Leonardo_Lucid_Origin_Output;
+ }
+ interface Ai_Cf_Deepgram_Aura_1_Input {
+ /**
+ * Speaker used to produce the audio.
+ */
+ speaker?:
+ | "angus"
+ | "asteria"
+ | "arcas"
+ | "orion"
+ | "orpheus"
+ | "athena"
+ | "luna"
+ | "zeus"
+ | "perseus"
+ | "helios"
+ | "hera"
+ | "stella";
+ /**
+ * Encoding of the output audio.
+ */
+ encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
+ /**
+ * Container specifies the file format wrapper for the output audio. The available options depend on the encoding type.
+ */
+ container?: "none" | "wav" | "ogg";
+ /**
+ * The text content to be converted to speech
+ */
+ text: string;
+ /**
+ * Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable
+ */
+ sample_rate?: number;
+ /**
+ * The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type.
+ */
+ bit_rate?: number;
+ }
+ /**
+ * The generated audio in MP3 format
+ */
+ type Ai_Cf_Deepgram_Aura_1_Output = string;
+ declare abstract class Base_Ai_Cf_Deepgram_Aura_1 {
+ inputs: Ai_Cf_Deepgram_Aura_1_Input;
+ postProcessedOutputs: Ai_Cf_Deepgram_Aura_1_Output;
+ }
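A text-to-speech sketch for the Aura 1 shapes above, assuming an `AI` binding; the output type is a plain string that, per the comment above, carries the generated MP3 audio:

const audio = await env.AI.run("@cf/deepgram/aura-1", {
  text: "Deploy complete.",
  speaker: "asteria",
  encoding: "mp3",
});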
+ interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input {
+ /**
+ * Input text to translate. Can be a single string or a list of strings.
+ */
+ text: string | string[];
+ /**
+ * Target language to translate to
+ */
+ target_language:
+ | "asm_Beng"
+ | "awa_Deva"
+ | "ben_Beng"
+ | "bho_Deva"
+ | "brx_Deva"
+ | "doi_Deva"
+ | "eng_Latn"
+ | "gom_Deva"
+ | "gon_Deva"
+ | "guj_Gujr"
+ | "hin_Deva"
+ | "hne_Deva"
+ | "kan_Knda"
+ | "kas_Arab"
+ | "kas_Deva"
+ | "kha_Latn"
+ | "lus_Latn"
+ | "mag_Deva"
+ | "mai_Deva"
+ | "mal_Mlym"
+ | "mar_Deva"
+ | "mni_Beng"
+ | "mni_Mtei"
+ | "npi_Deva"
+ | "ory_Orya"
+ | "pan_Guru"
+ | "san_Deva"
+ | "sat_Olck"
+ | "snd_Arab"
+ | "snd_Deva"
+ | "tam_Taml"
+ | "tel_Telu"
+ | "urd_Arab"
+ | "unr_Deva";
+ }
+ interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output {
+ /**
+ * Translated texts
+ */
+ translations: string[];
+ }
+ declare abstract class Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B {
+ inputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input;
+ postProcessedOutputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output;
+ }
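A translation sketch for the IndicTrans2 shapes above, assuming an `AI` binding; `target_language` must be one of the script-qualified codes in the union:

const { translations } = await env.AI.run("@cf/ai4bharat/indictrans2-en-indic-1B", {
  text: ["How are you?"],
  target_language: "hin_Deva",
});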
+ type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input =
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch;
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt {
+ /**
+ * The input text prompt for the model to generate a response.
+ */
+ prompt: string;
+ /**
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
+ */
+ lora?: string;
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode;
+ /**
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+ */
+ raw?: boolean;
+ /**
+ * If true, the response will be streamed back incrementally using SSE (Server-Sent Events).
+ */
+ stream?: boolean;
+ /**
+ * The maximum number of tokens to generate in the response.
+ */
+ max_tokens?: number;
+ /**
+ * Controls the randomness of the output; higher values produce more random results.
+ */
+ temperature?: number;
+ /**
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+ */
+ top_p?: number;
+ /**
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+ */
+ top_k?: number;
+ /**
+ * Random seed for reproducibility of the generation.
+ */
+ seed?: number;
+ /**
+ * Penalty for repeated tokens; higher values discourage repetition.
+ */
+ repetition_penalty?: number;
+ /**
+ * Decreases the likelihood of the model repeating the same lines verbatim.
+ */
+ frequency_penalty?: number;
+ /**
+ * Increases the likelihood of the model introducing new topics.
+ */
+ presence_penalty?: number;
+ }
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode {
+ type?: "json_object" | "json_schema";
+ json_schema?: unknown;
+ }
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages {
+ /**
+ * An array of message objects representing the conversation history.
+ */
+ messages: {
+ /**
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
+ */
+ role: string;
+ /**
+ * The content of the message as a string.
+ */
+ content: string;
+ }[];
+ functions?: {
+ name: string;
+ code: string;
+ }[];
+ /**
+ * A list of tools available for the assistant to use.
+ */
+ tools?: (
+ | {
+ /**
+ * The name of the tool. The more descriptive, the better.
+ */
+ name: string;
+ /**
+ * A brief description of what the tool does.
+ */
+ description: string;
+ /**
+ * Schema defining the parameters accepted by the tool.
+ */
+ parameters: {
+ /**
+ * The type of the parameters object (usually 'object').
+ */
+ type: string;
+ /**
+ * List of required parameter names.
+ */
+ required?: string[];
+ /**
+ * Definitions of each parameter.
+ */
+ properties: {
+ [k: string]: {
+ /**
+ * The data type of the parameter.
+ */
+ type: string;
+ /**
+ * A description of the expected parameter.
+ */
+ description: string;
+ };
+ };
+ };
+ }
+ | {
+ /**
+ * Specifies the type of tool (e.g., 'function').
+ */
+ type: string;
+ /**
+ * Details of the function tool.
+ */
+ function: {
+ /**
+ * The name of the function.
+ */
+ name: string;
+ /**
+ * A brief description of what the function does.
+ */
+ description: string;
+ /**
+ * Schema defining the parameters accepted by the function.
+ */
+ parameters: {
+ /**
+ * The type of the parameters object (usually 'object').
+ */
+ type: string;
+ /**
+ * List of required parameter names.
+ */
+ required?: string[];
+ /**
+ * Definitions of each parameter.
+ */
+ properties: {
+ [k: string]: {
+ /**
+ * The data type of the parameter.
+ */
+ type: string;
+ /**
+ * A description of the expected parameter.
+ */
+ description: string;
+ };
+ };
+ };
+ };
+ }
+ )[];
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1;
+ /**
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+ */
+ raw?: boolean;
+ /**
+ * If true, the response will be streamed back incrementally using SSE (Server-Sent Events).
+ */
+ stream?: boolean;
+ /**
+ * The maximum number of tokens to generate in the response.
+ */
+ max_tokens?: number;
+ /**
+ * Controls the randomness of the output; higher values produce more random results.
+ */
+ temperature?: number;
+ /**
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
*/
-
+ top_p?: number;
/**
- *
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
*/
-
+ top_k?: number;
/**
- *
+ * Random seed for reproducibility of the generation.
*/
-
+ seed?: number;
/**
- *
+ * Penalty for repeated tokens; higher values discourage repetition.
*/
-
+ repetition_penalty?: number;
/**
- *
+ * Decreases the likelihood of the model repeating the same lines verbatim.
*/
-
+ frequency_penalty?: number;
/**
- *
+ * Increases the likelihood of the model introducing new topics.
*/
-
+ presence_penalty?: number;
+ }
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1 {
+ type?: "json_object" | "json_schema";
+ json_schema?: unknown;
+ }
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch {
+ requests: (
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1
+ )[];
+ }
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1 {
/**
- *
+ * The input text prompt for the model to generate a response.
*/
-
+ prompt: string;
/**
- *
+ * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
*/
-
+ lora?: string;
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2;
/**
- *
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
*/
-
+ raw?: boolean;
/**
- *
+ * If true, the response will be streamed back incrementally using SSE (Server-Sent Events).
*/
-
+ stream?: boolean;
/**
- *
+ * The maximum number of tokens to generate in the response.
*/
-
+ max_tokens?: number;
/**
- *
+ * Controls the randomness of the output; higher values produce more random results.
*/
-
+ temperature?: number;
/**
- *
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
*/
-
+ top_p?: number;
/**
- *
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
*/
-
+ top_k?: number;
+ /**
+ * Random seed for reproducibility of the generation.
+ */
+ seed?: number;
+ /**
+ * Penalty for repeated tokens; higher values discourage repetition.
+ */
+ repetition_penalty?: number;
+ /**
+ * Decreases the likelihood of the model repeating the same lines verbatim.
+ */
+ frequency_penalty?: number;
+ /**
+ * Increases the likelihood of the model introducing new topics.
+ */
+ presence_penalty?: number;
}
- interface
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2 {
+ type?: "json_object" | "json_schema";
+ json_schema?: unknown;
+ }
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1 {
+ /**
+ * An array of message objects representing the conversation history.
+ */
+ messages: {
+ /**
+ * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
+ */
+ role: string;
+ /**
+ * The content of the message as a string.
+ */
+ content: string;
+ }[];
+ functions?: {
+ name: string;
+ code: string;
+ }[];
+ /**
+ * A list of tools available for the assistant to use.
+ */
+ tools?: (
+ | {
+ /**
+ * The name of the tool. The more descriptive, the better.
+ */
+ name: string;
+ /**
+ * A brief description of what the tool does.
+ */
+ description: string;
+ /**
+ * Schema defining the parameters accepted by the tool.
+ */
+ parameters: {
+ /**
+ * The type of the parameters object (usually 'object').
+ */
+ type: string;
+ /**
+ * List of required parameter names.
+ */
+ required?: string[];
+ /**
+ * Definitions of each parameter.
+ */
+ properties: {
+ [k: string]: {
+ /**
+ * The data type of the parameter.
+ */
+ type: string;
+ /**
+ * A description of the expected parameter.
+ */
+ description: string;
+ };
+ };
+ };
+ }
+ | {
+ /**
+ * Specifies the type of tool (e.g., 'function').
+ */
+ type: string;
+ /**
+ * Details of the function tool.
+ */
+ function: {
+ /**
+ * The name of the function.
+ */
+ name: string;
+ /**
+ * A brief description of what the function does.
+ */
+ description: string;
+ /**
+ * Schema defining the parameters accepted by the function.
+ */
+ parameters: {
+ /**
+ * The type of the parameters object (usually 'object').
+ */
+ type: string;
+ /**
+ * List of required parameter names.
+ */
+ required?: string[];
+ /**
+ * Definitions of each parameter.
+ */
+ properties: {
+ [k: string]: {
+ /**
+ * The data type of the parameter.
+ */
+ type: string;
+ /**
+ * A description of the expected parameter.
+ */
+ description: string;
+ };
+ };
+ };
+ };
+ }
+ )[];
+ response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3;
+ /**
+ * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+ */
+ raw?: boolean;
+ /**
+ * If true, the response will be streamed back incrementally using SSE (Server-Sent Events).
+ */
+ stream?: boolean;
+ /**
+ * The maximum number of tokens to generate in the response.
+ */
+ max_tokens?: number;
+ /**
+ * Controls the randomness of the output; higher values produce more random results.
+ */
+ temperature?: number;
+ /**
+ * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+ */
+ top_p?: number;
+ /**
+ * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+ */
+ top_k?: number;
+ /**
+ * Random seed for reproducibility of the generation.
+ */
+ seed?: number;
+ /**
+ * Penalty for repeated tokens; higher values discourage repetition.
+ */
+ repetition_penalty?: number;
+ /**
+ * Decreases the likelihood of the model repeating the same lines verbatim.
+ */
+ frequency_penalty?: number;
+ /**
+ * Increases the likelihood of the model introducing new topics.
+ */
+ presence_penalty?: number;
}
-
-
-
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3 {
+ type?: "json_object" | "json_schema";
+ json_schema?: unknown;
}
- type
-
+ type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output =
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response
+ | string
+ | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse;
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response {
+ /**
+ * Unique identifier for the completion
+ */
+ id?: string;
+ /**
+ * Object type identifier
+ */
+ object?: "chat.completion";
+ /**
+ * Unix timestamp of when the completion was created
+ */
+ created?: number;
+ /**
+ * Model used for the completion
+ */
+ model?: string;
+ /**
+ * List of completion choices
+ */
+ choices?: {
+ /**
+ * Index of the choice in the list
+ */
+ index?: number;
+ /**
+ * The message generated by the model
+ */
+ message?: {
/**
- *
+ * Role of the message author
*/
-
- body: object;
- contentType: string;
- };
+ role: string;
/**
- *
+ * The content of the message
*/
-
- }
- | {
+ content: string;
/**
- *
+ * Internal reasoning content (if available)
*/
-
+ reasoning_content?: string;
/**
- *
+ * Tool calls made by the assistant
*/
-
+ tool_calls?: {
+ /**
+ * Unique identifier for the tool call
+ */
+ id: string;
+ /**
+ * Type of tool call
+ */
+ type: "function";
+ function: {
+ /**
+ * Name of the function to call
+ */
+ name: string;
+ /**
+ * JSON string of arguments for the function
+ */
+ arguments: string;
+ };
+ }[];
};
-
+ /**
+ * Reason why the model stopped generating
+ */
+ finish_reason?: string;
+ /**
+ * Stop reason (may be null)
+ */
+ stop_reason?: string | null;
+ /**
+ * Log probabilities (if requested)
+ */
+ logprobs?: {} | null;
+ }[];
/**
- *
+ * Usage statistics for the inference request
*/
-
+ usage?: {
+ /**
+ * Total number of tokens in input
+ */
+ prompt_tokens?: number;
+ /**
+ * Total number of tokens in output
+ */
+ completion_tokens?: number;
+ /**
+ * Total number of input and output tokens
+ */
+ total_tokens?: number;
+ };
/**
- *
+ * Log probabilities for the prompt (if requested)
*/
-
- }
- declare abstract class Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2 {
- inputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input;
- postProcessedOutputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output;
+ prompt_logprobs?: {} | null;
}
-
-
-
-
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response {
+ /**
+ * Unique identifier for the completion
+ */
+ id?: string;
+ /**
+ * Object type identifier
+ */
+ object?: "text_completion";
+ /**
+ * Unix timestamp of when the completion was created
+ */
+ created?: number;
+ /**
+ * Model used for the completion
+ */
+ model?: string;
/**
- *
+ * List of completion choices
*/
-
- reasoning?: {
+ choices?: {
/**
- *
+ * Index of the choice in the list
*/
-
+ index: number;
/**
- *
+ * The generated text completion
*/
-
- };
- }
- interface GPT_OSS_120B_Responses_Async {
- requests: {
+ text: string;
/**
- *
+ * Reason why the model stopped generating
*/
-
-
-
-
-
-
-
-
-
-
-
+ finish_reason: string;
+ /**
+ * Stop reason (may be null)
+ */
+ stop_reason?: string | null;
+ /**
+ * Log probabilities (if requested)
+ */
+ logprobs?: {} | null;
+ /**
+ * Log probabilities for the prompt (if requested)
+ */
+ prompt_logprobs?: {} | null;
}[];
- }
- type Ai_Cf_Openai_Gpt_Oss_120B_Output = {} | (string & NonNullable<unknown>);
- declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_120B {
- inputs: Ai_Cf_Openai_Gpt_Oss_120B_Input;
- postProcessedOutputs: Ai_Cf_Openai_Gpt_Oss_120B_Output;
- }
- type Ai_Cf_Openai_Gpt_Oss_20B_Input =
- | GPT_OSS_20B_Responses
- | GPT_OSS_20B_Responses_Async;
- interface GPT_OSS_20B_Responses {
/**
- *
+ * Usage statistics for the inference request
*/
-
- reasoning?: {
+ usage?: {
/**
- *
+ * Total number of tokens in input
*/
-
+ prompt_tokens?: number;
/**
- *
+ * Total number of tokens in output
*/
-
- };
- }
- interface GPT_OSS_20B_Responses_Async {
- requests: {
+ completion_tokens?: number;
/**
- *
+ * Total number of input and output tokens
*/
-
-
- /**
- * Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
- */
- effort?: "low" | "medium" | "high";
- /**
- * A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.
- */
- summary?: "auto" | "concise" | "detailed";
- };
- }[];
+ total_tokens?: number;
+ };
}
-
-
-
-
+ interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse {
+ /**
+ * The async request id that can be used to obtain the results.
+ */
+ request_id?: string;
}
-
+ declare abstract class Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It {
+ inputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input;
+ postProcessedOutputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output;
+ }
+ interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Input {
/**
- *
+ * Input text to embed. Can be a single string or a list of strings.
*/
-
+ text: string | string[];
+ }
+ interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Output {
/**
- *
+ * Embedding vectors, where each vector is a list of floats.
*/
-
+ data: number[][];
/**
- *
+ * Shape of the embedding data as [number_of_embeddings, embedding_dimension].
+ *
+ * @minItems 2
+ * @maxItems 2
*/
-
+ shape: [number, number];
+ }
+ declare abstract class Base_Ai_Cf_Pfnet_Plamo_Embedding_1B {
+ inputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Input;
+ postProcessedOutputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Output;
+ }
+ interface Ai_Cf_Deepgram_Flux_Input {
/**
- *
+ * Encoding of the audio stream. Currently only supports raw signed little-endian 16-bit PCM.
*/
-
+ encoding: "linear16";
/**
- *
+ * Sample rate of the audio stream in Hz.
*/
-
+ sample_rate: string;
/**
- *
+ * End-of-turn confidence required to fire an eager end-of-turn event. When set, enables EagerEndOfTurn and TurnResumed events. Valid values: 0.3 - 0.9.
*/
-
+ eager_eot_threshold?: string;
/**
- *
+ * End-of-turn confidence required to finish a turn. Valid values: 0.5 - 0.9.
*/
-
+ eot_threshold?: string;
+ /**
+ * A turn will be finished when this much time has passed after speech, regardless of EOT confidence.
+ */
+ eot_timeout_ms?: string;
+ /**
+ * Keyterm prompting can improve recognition of specialized terminology. Pass multiple keyterm query parameters to boost multiple keyterms.
+ */
+ keyterm?: string;
+ /**
+ * Opts out requests from the Deepgram Model Improvement Program. Refer to Deepgram Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip
+ */
+ mip_opt_out?: "true" | "false";
+ /**
+ * Label your requests for the purpose of identification during usage reporting
+ */
+ tag?: string;
}
/**
- *
+ * Output will be returned as websocket messages.
*/
-
- declare abstract class Base_Ai_Cf_Leonardo_Phoenix_1_0 {
- inputs: Ai_Cf_Leonardo_Phoenix_1_0_Input;
- postProcessedOutputs: Ai_Cf_Leonardo_Phoenix_1_0_Output;
- }
- interface Ai_Cf_Leonardo_Lucid_Origin_Input {
+ interface Ai_Cf_Deepgram_Flux_Output {
/**
- *
+ * The unique identifier of the request (uuid)
*/
-
+ request_id?: string;
/**
- *
+ * Starts at 0 and increments for each message the server sends to the client.
*/
-
+ sequence_id?: number;
/**
- *
+ * The type of event being reported.
*/
-
+ event?:
+ | "Update"
+ | "StartOfTurn"
+ | "EagerEndOfTurn"
+ | "TurnResumed"
+ | "EndOfTurn";
/**
- * The
+ * The index of the current turn
*/
-
+ turn_index?: number;
/**
- *
+ * Start time in seconds of the audio range that was transcribed
*/
-
+ audio_window_start?: number;
/**
- *
+ * End time in seconds of the audio range that was transcribed
*/
-
+ audio_window_end?: number;
/**
- *
+ * Text that was said over the course of the current turn
*/
-
- }
- interface Ai_Cf_Leonardo_Lucid_Origin_Output {
+ transcript?: string;
/**
- * The
+ * The words in the transcript
*/
-
+ words?: {
+ /**
+ * The individual punctuated, properly-cased word from the transcript
+ */
+ word: string;
+ /**
+ * Confidence that this word was transcribed correctly
+ */
+ confidence: number;
+ }[];
+ /**
+ * Confidence that no more speech is coming in this turn
+ */
+ end_of_turn_confidence?: number;
}
- declare abstract class
- inputs:
- postProcessedOutputs:
+ declare abstract class Base_Ai_Cf_Deepgram_Flux {
+ inputs: Ai_Cf_Deepgram_Flux_Input;
+ postProcessedOutputs: Ai_Cf_Deepgram_Flux_Output;
}
- interface
+ interface Ai_Cf_Deepgram_Aura_2_En_Input {
/**
* Speaker used to produce the audio.
*/
speaker?:
- | "
- | "
+ | "amalthea"
+ | "andromeda"
+ | "apollo"
| "arcas"
- | "
- | "
+ | "aries"
+ | "asteria"
| "athena"
- | "
- | "
- | "
- | "
+ | "atlas"
+ | "aurora"
+ | "callista"
+ | "cora"
+ | "cordelia"
+ | "delia"
+ | "draco"
+ | "electra"
+ | "harmonia"
+ | "helena"
| "hera"
- | "
+ | "hermes"
+ | "hyperion"
+ | "iris"
+ | "janus"
+ | "juno"
+ | "jupiter"
+ | "luna"
+ | "mars"
+ | "minerva"
+ | "neptune"
+ | "odysseus"
+ | "ophelia"
+ | "orion"
+ | "orpheus"
+ | "pandora"
+ | "phoebe"
+ | "pluto"
+ | "saturn"
+ | "thalia"
+ | "theia"
+ | "vesta"
+ | "zeus";
/**
* Encoding of the output audio.
*/
@@ -7170,10 +9034,54 @@ interface Ai_Cf_Deepgram_Aura_1_Input {
 /**
  * The generated audio in MP3 format
  */
-type
-declare abstract class
-  inputs:
-  postProcessedOutputs:
+type Ai_Cf_Deepgram_Aura_2_En_Output = string;
+declare abstract class Base_Ai_Cf_Deepgram_Aura_2_En {
+  inputs: Ai_Cf_Deepgram_Aura_2_En_Input;
+  postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_En_Output;
+}
+interface Ai_Cf_Deepgram_Aura_2_Es_Input {
+  /**
+   * Speaker used to produce the audio.
+   */
+  speaker?:
+    | "sirio"
+    | "nestor"
+    | "carina"
+    | "celeste"
+    | "alvaro"
+    | "diana"
+    | "aquila"
+    | "selena"
+    | "estrella"
+    | "javier";
+  /**
+   * Encoding of the output audio.
+   */
+  encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
+  /**
+   * Container specifies the file format wrapper for the output audio. The available options depend on the encoding type..
+   */
+  container?: "none" | "wav" | "ogg";
+  /**
+   * The text content to be converted to speech
+   */
+  text: string;
+  /**
+   * Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable
+   */
+  sample_rate?: number;
+  /**
+   * The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type.
+   */
+  bit_rate?: number;
+}
+/**
+ * The generated audio in MP3 format
+ */
+type Ai_Cf_Deepgram_Aura_2_Es_Output = string;
+declare abstract class Base_Ai_Cf_Deepgram_Aura_2_Es {
+  inputs: Ai_Cf_Deepgram_Aura_2_Es_Input;
+  postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_Es_Output;
 }
 interface AiModels {
   "@cf/huggingface/distilbert-sst-2-int8": BaseAiTextClassification;
@@ -7218,12 +9126,12 @@ interface AiModels {
   "@cf/meta/llama-3-8b-instruct": BaseAiTextGeneration;
   "@cf/fblgit/una-cybertron-7b-v2-bf16": BaseAiTextGeneration;
   "@cf/meta/llama-3-8b-instruct-awq": BaseAiTextGeneration;
-  "@hf/meta-llama/meta-llama-3-8b-instruct": BaseAiTextGeneration;
   "@cf/meta/llama-3.1-8b-instruct-fp8": BaseAiTextGeneration;
   "@cf/meta/llama-3.1-8b-instruct-awq": BaseAiTextGeneration;
   "@cf/meta/llama-3.2-3b-instruct": BaseAiTextGeneration;
   "@cf/meta/llama-3.2-1b-instruct": BaseAiTextGeneration;
   "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b": BaseAiTextGeneration;
+  "@cf/ibm-granite/granite-4.0-h-micro": BaseAiTextGeneration;
   "@cf/facebook/bart-large-cnn": BaseAiSummarization;
   "@cf/llava-hf/llava-1.5-7b-hf": BaseAiImageToText;
   "@cf/baai/bge-base-en-v1.5": Base_Ai_Cf_Baai_Bge_Base_En_V1_5;
@@ -7245,13 +9153,21 @@ interface AiModels {
   "@cf/mistralai/mistral-small-3.1-24b-instruct": Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct;
   "@cf/google/gemma-3-12b-it": Base_Ai_Cf_Google_Gemma_3_12B_It;
   "@cf/meta/llama-4-scout-17b-16e-instruct": Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct;
+  "@cf/qwen/qwen3-30b-a3b-fp8": Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8;
   "@cf/deepgram/nova-3": Base_Ai_Cf_Deepgram_Nova_3;
+  "@cf/qwen/qwen3-embedding-0.6b": Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B;
   "@cf/pipecat-ai/smart-turn-v2": Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2;
   "@cf/openai/gpt-oss-120b": Base_Ai_Cf_Openai_Gpt_Oss_120B;
   "@cf/openai/gpt-oss-20b": Base_Ai_Cf_Openai_Gpt_Oss_20B;
   "@cf/leonardo/phoenix-1.0": Base_Ai_Cf_Leonardo_Phoenix_1_0;
   "@cf/leonardo/lucid-origin": Base_Ai_Cf_Leonardo_Lucid_Origin;
   "@cf/deepgram/aura-1": Base_Ai_Cf_Deepgram_Aura_1;
+  "@cf/ai4bharat/indictrans2-en-indic-1B": Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B;
+  "@cf/aisingapore/gemma-sea-lion-v4-27b-it": Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It;
+  "@cf/pfnet/plamo-embedding-1b": Base_Ai_Cf_Pfnet_Plamo_Embedding_1B;
+  "@cf/deepgram/flux": Base_Ai_Cf_Deepgram_Flux;
+  "@cf/deepgram/aura-2-en": Base_Ai_Cf_Deepgram_Aura_2_En;
+  "@cf/deepgram/aura-2-es": Base_Ai_Cf_Deepgram_Aura_2_Es;
 }
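Each entry added to `AiModels` is what gives `run()` its typed overloads: the key selects the model and the mapped base class fixes the input and output shapes. A sketch with one of the newly added text-generation entries; the helper name and the `AI` binding are assumptions.

```ts
// Hypothetical helper; the model key and its BaseAiTextGeneration mapping
// come from the AiModels entries above.
async function greet(env: { AI: Ai }) {
  const out = await env.AI.run("@cf/ibm-granite/granite-4.0-h-micro", {
    prompt: "Say hello in five words.",
  });
  // For non-streaming text-generation models the output typically carries
  // an optional `response` string alongside other fields.
  return out;
}
```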
 type AiOptions = {
   /**
@@ -7263,6 +9179,16 @@ type AiOptions = {
    * Establish websocket connections, only works for supported models
    */
   websocket?: boolean;
+  /**
+   * Tag your requests to group and view them in Cloudflare dashboard.
+   *
+   * Rules:
+   * Tags must only contain letters, numbers, and the symbols: : - . / @
+   * Each tag can have maximum 50 characters.
+   * Maximum 5 tags are allowed each request.
+   * Duplicate tags will removed.
+   */
+  tags: string[];
   gateway?: GatewayOptions;
   returnRawResponse?: boolean;
   prefix?: string;
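The new `tags` field travels in the options argument of `run()`, subject to the rules quoted in its doc comment: letters, numbers, and the symbols `: - . / @` only, at most 50 characters per tag, at most 5 tags per request, with duplicates dropped. Note that it is declared as a required property in this revision, unlike the surrounding optional fields. A sketch with hypothetical tag values, assuming the `AI` binding:

```ts
// Hypothetical tags; binding name `AI` assumed.
async function taggedRun(env: { AI: Ai }) {
  return env.AI.run(
    "@cf/meta/llama-3.2-1b-instruct",
    { prompt: "ping" },
    { tags: ["team:search", "env:prod"] },
  );
}
```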
@@ -9350,12 +11276,13 @@ declare namespace Rpc {
   export type Provider<
     T extends object,
     Reserved extends string = never,
-  > = MaybeCallableProvider<T> &
-
-
-
-
-
+  > = MaybeCallableProvider<T> &
+    Pick<
+      {
+        [K in keyof T]: MethodOrProperty<T[K]>;
+      },
+      Exclude<keyof T, Reserved | symbol | keyof StubBase<never>>
+    >;
 }
 declare namespace Cloudflare {
   // Type of `env`.