@workers-community/workers-types 4.20251121.0 → 4.20251125.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/index.d.ts +2289 -362
- package/index.ts +2289 -367
- package/package.json +1 -1
package/index.d.ts
CHANGED
@@ -4109,6 +4109,427 @@ declare abstract class BaseAiTranslation {
   inputs: AiTranslationInput;
   postProcessedOutputs: AiTranslationOutput;
 }
+/**
+ * Workers AI support for OpenAI's Responses API
+ * Reference: https://github.com/openai/openai-node/blob/master/src/resources/responses/responses.ts
+ *
+ * It's a stripped down version from its source.
+ * It currently supports basic function calling, json mode and accepts images as input.
+ *
+ * It does not include types for WebSearch, CodeInterpreter, FileInputs, MCP, CustomTools.
+ * We plan to add those incrementally as model + platform capabilities evolve.
+ */
+type ResponsesInput = {
+  background?: boolean | null;
+  conversation?: string | ResponseConversationParam | null;
+  include?: Array<ResponseIncludable> | null;
+  input?: string | ResponseInput;
+  instructions?: string | null;
+  max_output_tokens?: number | null;
+  parallel_tool_calls?: boolean | null;
+  previous_response_id?: string | null;
+  prompt_cache_key?: string;
+  reasoning?: Reasoning | null;
+  safety_identifier?: string;
+  service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
+  stream?: boolean | null;
+  stream_options?: StreamOptions | null;
+  temperature?: number | null;
+  text?: ResponseTextConfig;
+  tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
+  tools?: Array<Tool>;
+  top_p?: number | null;
+  truncation?: "auto" | "disabled" | null;
+};
+type ResponsesOutput = {
+  id?: string;
+  created_at?: number;
+  output_text?: string;
+  error?: ResponseError | null;
+  incomplete_details?: ResponseIncompleteDetails | null;
+  instructions?: string | Array<ResponseInputItem> | null;
+  object?: "response";
+  output?: Array<ResponseOutputItem>;
+  parallel_tool_calls?: boolean;
+  temperature?: number | null;
+  tool_choice?: ToolChoiceOptions | ToolChoiceFunction;
+  tools?: Array<Tool>;
+  top_p?: number | null;
+  max_output_tokens?: number | null;
+  previous_response_id?: string | null;
+  prompt?: ResponsePrompt | null;
+  reasoning?: Reasoning | null;
+  safety_identifier?: string;
+  service_tier?: "auto" | "default" | "flex" | "scale" | "priority" | null;
+  status?: ResponseStatus;
+  text?: ResponseTextConfig;
+  truncation?: "auto" | "disabled" | null;
+  usage?: ResponseUsage;
+};
+type EasyInputMessage = {
+  content: string | ResponseInputMessageContentList;
+  role: "user" | "assistant" | "system" | "developer";
+  type?: "message";
+};
+type ResponsesFunctionTool = {
+  name: string;
+  parameters: {
+    [key: string]: unknown;
+  } | null;
+  strict: boolean | null;
+  type: "function";
+  description?: string | null;
+};
+type ResponseIncompleteDetails = {
+  reason?: "max_output_tokens" | "content_filter";
+};
+type ResponsePrompt = {
+  id: string;
+  variables?: {
+    [key: string]: string | ResponseInputText | ResponseInputImage;
+  } | null;
+  version?: string | null;
+};
+type Reasoning = {
+  effort?: ReasoningEffort | null;
+  generate_summary?: "auto" | "concise" | "detailed" | null;
+  summary?: "auto" | "concise" | "detailed" | null;
+};
+type ResponseContent =
+  | ResponseInputText
+  | ResponseInputImage
+  | ResponseOutputText
+  | ResponseOutputRefusal
+  | ResponseContentReasoningText;
+type ResponseContentReasoningText = {
+  text: string;
+  type: "reasoning_text";
+};
+type ResponseConversationParam = {
+  id: string;
+};
+type ResponseCreatedEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.created";
+};
+type ResponseCustomToolCallOutput = {
+  call_id: string;
+  output: string | Array<ResponseInputText | ResponseInputImage>;
+  type: "custom_tool_call_output";
+  id?: string;
+};
+type ResponseError = {
+  code:
+    | "server_error"
+    | "rate_limit_exceeded"
+    | "invalid_prompt"
+    | "vector_store_timeout"
+    | "invalid_image"
+    | "invalid_image_format"
+    | "invalid_base64_image"
+    | "invalid_image_url"
+    | "image_too_large"
+    | "image_too_small"
+    | "image_parse_error"
+    | "image_content_policy_violation"
+    | "invalid_image_mode"
+    | "image_file_too_large"
+    | "unsupported_image_media_type"
+    | "empty_image_file"
+    | "failed_to_download_image"
+    | "image_file_not_found";
+  message: string;
+};
+type ResponseErrorEvent = {
+  code: string | null;
+  message: string;
+  param: string | null;
+  sequence_number: number;
+  type: "error";
+};
+type ResponseFailedEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.failed";
+};
+type ResponseFormatText = {
+  type: "text";
+};
+type ResponseFormatJSONObject = {
+  type: "json_object";
+};
+type ResponseFormatTextConfig =
+  | ResponseFormatText
+  | ResponseFormatTextJSONSchemaConfig
+  | ResponseFormatJSONObject;
+type ResponseFormatTextJSONSchemaConfig = {
+  name: string;
+  schema: {
+    [key: string]: unknown;
+  };
+  type: "json_schema";
+  description?: string;
+  strict?: boolean | null;
+};
+type ResponseFunctionCallArgumentsDeltaEvent = {
+  delta: string;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.function_call_arguments.delta";
+};
+type ResponseFunctionCallArgumentsDoneEvent = {
+  arguments: string;
+  item_id: string;
+  name: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.function_call_arguments.done";
+};
+type ResponseFunctionCallOutputItem =
+  | ResponseInputTextContent
+  | ResponseInputImageContent;
+type ResponseFunctionCallOutputItemList = Array<ResponseFunctionCallOutputItem>;
+type ResponseFunctionToolCall = {
+  arguments: string;
+  call_id: string;
+  name: string;
+  type: "function_call";
+  id?: string;
+  status?: "in_progress" | "completed" | "incomplete";
+};
+interface ResponseFunctionToolCallItem extends ResponseFunctionToolCall {
+  id: string;
+}
+type ResponseFunctionToolCallOutputItem = {
+  id: string;
+  call_id: string;
+  output: string | Array<ResponseInputText | ResponseInputImage>;
+  type: "function_call_output";
+  status?: "in_progress" | "completed" | "incomplete";
+};
+type ResponseIncludable =
+  | "message.input_image.image_url"
+  | "message.output_text.logprobs";
+type ResponseIncompleteEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.incomplete";
+};
+type ResponseInput = Array<ResponseInputItem>;
+type ResponseInputContent = ResponseInputText | ResponseInputImage;
+type ResponseInputImage = {
+  detail: "low" | "high" | "auto";
+  type: "input_image";
+  /**
+   * Base64 encoded image
+   */
+  image_url?: string | null;
+};
+type ResponseInputImageContent = {
+  type: "input_image";
+  detail?: "low" | "high" | "auto" | null;
+  /**
+   * Base64 encoded image
+   */
+  image_url?: string | null;
+};
+type ResponseInputItem =
+  | EasyInputMessage
+  | ResponseInputItemMessage
+  | ResponseOutputMessage
+  | ResponseFunctionToolCall
+  | ResponseInputItemFunctionCallOutput
+  | ResponseReasoningItem;
+type ResponseInputItemFunctionCallOutput = {
+  call_id: string;
+  output: string | ResponseFunctionCallOutputItemList;
+  type: "function_call_output";
+  id?: string | null;
+  status?: "in_progress" | "completed" | "incomplete" | null;
+};
+type ResponseInputItemMessage = {
+  content: ResponseInputMessageContentList;
+  role: "user" | "system" | "developer";
+  status?: "in_progress" | "completed" | "incomplete";
+  type?: "message";
+};
+type ResponseInputMessageContentList = Array<ResponseInputContent>;
+type ResponseInputMessageItem = {
+  id: string;
+  content: ResponseInputMessageContentList;
+  role: "user" | "system" | "developer";
+  status?: "in_progress" | "completed" | "incomplete";
+  type?: "message";
+};
+type ResponseInputText = {
+  text: string;
+  type: "input_text";
+};
+type ResponseInputTextContent = {
+  text: string;
+  type: "input_text";
+};
+type ResponseItem =
+  | ResponseInputMessageItem
+  | ResponseOutputMessage
+  | ResponseFunctionToolCallItem
+  | ResponseFunctionToolCallOutputItem;
+type ResponseOutputItem =
+  | ResponseOutputMessage
+  | ResponseFunctionToolCall
+  | ResponseReasoningItem;
+type ResponseOutputItemAddedEvent = {
+  item: ResponseOutputItem;
+  output_index: number;
+  sequence_number: number;
+  type: "response.output_item.added";
+};
+type ResponseOutputItemDoneEvent = {
+  item: ResponseOutputItem;
+  output_index: number;
+  sequence_number: number;
+  type: "response.output_item.done";
+};
+type ResponseOutputMessage = {
+  id: string;
+  content: Array<ResponseOutputText | ResponseOutputRefusal>;
+  role: "assistant";
+  status: "in_progress" | "completed" | "incomplete";
+  type: "message";
+};
+type ResponseOutputRefusal = {
+  refusal: string;
+  type: "refusal";
+};
+type ResponseOutputText = {
+  text: string;
+  type: "output_text";
+  logprobs?: Array<Logprob>;
+};
+type ResponseReasoningItem = {
+  id: string;
+  summary: Array<ResponseReasoningSummaryItem>;
+  type: "reasoning";
+  content?: Array<ResponseReasoningContentItem>;
+  encrypted_content?: string | null;
+  status?: "in_progress" | "completed" | "incomplete";
+};
+type ResponseReasoningSummaryItem = {
+  text: string;
+  type: "summary_text";
+};
+type ResponseReasoningContentItem = {
+  text: string;
+  type: "reasoning_text";
+};
+type ResponseReasoningTextDeltaEvent = {
+  content_index: number;
+  delta: string;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.reasoning_text.delta";
+};
+type ResponseReasoningTextDoneEvent = {
+  content_index: number;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  text: string;
+  type: "response.reasoning_text.done";
+};
+type ResponseRefusalDeltaEvent = {
+  content_index: number;
+  delta: string;
+  item_id: string;
+  output_index: number;
+  sequence_number: number;
+  type: "response.refusal.delta";
+};
+type ResponseRefusalDoneEvent = {
+  content_index: number;
+  item_id: string;
+  output_index: number;
+  refusal: string;
+  sequence_number: number;
+  type: "response.refusal.done";
+};
+type ResponseStatus =
+  | "completed"
+  | "failed"
+  | "in_progress"
+  | "cancelled"
+  | "queued"
+  | "incomplete";
+type ResponseStreamEvent =
+  | ResponseCompletedEvent
+  | ResponseCreatedEvent
+  | ResponseErrorEvent
+  | ResponseFunctionCallArgumentsDeltaEvent
+  | ResponseFunctionCallArgumentsDoneEvent
+  | ResponseFailedEvent
+  | ResponseIncompleteEvent
+  | ResponseOutputItemAddedEvent
+  | ResponseOutputItemDoneEvent
+  | ResponseReasoningTextDeltaEvent
+  | ResponseReasoningTextDoneEvent
+  | ResponseRefusalDeltaEvent
+  | ResponseRefusalDoneEvent
+  | ResponseTextDeltaEvent
+  | ResponseTextDoneEvent;
+type ResponseCompletedEvent = {
+  response: Response;
+  sequence_number: number;
+  type: "response.completed";
+};
+type ResponseTextConfig = {
+  format?: ResponseFormatTextConfig;
+  verbosity?: "low" | "medium" | "high" | null;
+};
+type ResponseTextDeltaEvent = {
+  content_index: number;
+  delta: string;
+  item_id: string;
+  logprobs: Array<Logprob>;
+  output_index: number;
+  sequence_number: number;
+  type: "response.output_text.delta";
+};
+type ResponseTextDoneEvent = {
+  content_index: number;
+  item_id: string;
+  logprobs: Array<Logprob>;
+  output_index: number;
+  sequence_number: number;
+  text: string;
+  type: "response.output_text.done";
+};
+type Logprob = {
+  token: string;
+  logprob: number;
+  top_logprobs?: Array<TopLogprob>;
+};
+type TopLogprob = {
+  token?: string;
+  logprob?: number;
+};
+type ResponseUsage = {
+  input_tokens: number;
+  output_tokens: number;
+  total_tokens: number;
+};
+type Tool = ResponsesFunctionTool;
+type ToolChoiceFunction = {
+  name: string;
+  type: "function";
+};
+type ToolChoiceOptions = "none";
+type ReasoningEffort = "minimal" | "low" | "medium" | "high" | null;
+type StreamOptions = {
+  include_obfuscation?: boolean;
+};
 type Ai_Cf_Baai_Bge_Base_En_V1_5_Input =
   | {
       text: string | string[];
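The block above is pure type surface; nothing in this diff shows the runtime entry point. A minimal sketch of how a Worker might build a request and read a result against these shapes (the binding call and any model identifier are assumptions, only the types come from this diff):

// Sketch only: assumes some caller produces a ResponsesOutput for a
// ResponsesInput; the image payload below is a placeholder.
const base64Png: string = "<base64-encoded image>";
const request: ResponsesInput = {
  input: [
    {
      role: "user",
      content: [
        { type: "input_text", text: "Describe this image in one sentence." },
        { type: "input_image", detail: "auto", image_url: base64Png },
      ],
    },
  ],
  text: { format: { type: "json_object" } },
  max_output_tokens: 256,
};

function firstText(res: ResponsesOutput): string | undefined {
  // output_text is a convenience field; otherwise walk the output items.
  if (res.output_text) return res.output_text;
  for (const item of res.output ?? []) {
    if (item.type === "message") {
      for (const part of item.content) {
        if (part.type === "output_text") return part.text;
      }
    }
  }
  return undefined;
}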
@@ -4141,8 +4562,8 @@ type Ai_Cf_Baai_Bge_Base_En_V1_5_Output =
    */
   pooling?: "mean" | "cls";
 }
-
-interface
+  | Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse;
+interface Ai_Cf_Baai_Bge_Base_En_V1_5_AsyncResponse {
   /**
    * The async request id that can be used to obtain the results.
    */
@@ -4224,7 +4645,13 @@ type Ai_Cf_Meta_M2M100_1_2B_Output =
    */
   translated_text?: string;
 }
-
+  | Ai_Cf_Meta_M2M100_1_2B_AsyncResponse;
+interface Ai_Cf_Meta_M2M100_1_2B_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Meta_M2M100_1_2B {
   inputs: Ai_Cf_Meta_M2M100_1_2B_Input;
   postProcessedOutputs: Ai_Cf_Meta_M2M100_1_2B_Output;
@@ -4261,7 +4688,13 @@ type Ai_Cf_Baai_Bge_Small_En_V1_5_Output =
    */
   pooling?: "mean" | "cls";
 }
-
+  | Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse;
+interface Ai_Cf_Baai_Bge_Small_En_V1_5_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Baai_Bge_Small_En_V1_5 {
   inputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Input;
   postProcessedOutputs: Ai_Cf_Baai_Bge_Small_En_V1_5_Output;
@@ -4298,7 +4731,13 @@ type Ai_Cf_Baai_Bge_Large_En_V1_5_Output =
    */
   pooling?: "mean" | "cls";
 }
-
+  | Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse;
+interface Ai_Cf_Baai_Bge_Large_En_V1_5_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Baai_Bge_Large_En_V1_5 {
   inputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Input;
   postProcessedOutputs: Ai_Cf_Baai_Bge_Large_En_V1_5_Output;
@@ -4489,15 +4928,18 @@ declare abstract class Base_Ai_Cf_Openai_Whisper_Large_V3_Turbo {
   postProcessedOutputs: Ai_Cf_Openai_Whisper_Large_V3_Turbo_Output;
 }
 type Ai_Cf_Baai_Bge_M3_Input =
-
-
+  | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts
+  | Ai_Cf_Baai_Bge_M3_Input_Embedding
   | {
       /**
       * Batch of the embeddings requests to run using async-queue
       */
-      requests: (
+      requests: (
+        | Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1
+        | Ai_Cf_Baai_Bge_M3_Input_Embedding_1
+      )[];
     };
-interface
+interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts {
   /**
   * A query you wish to perform against the provided contexts. If no query is provided the model with respond with embeddings for contexts
   */
@@ -4516,14 +4958,14 @@ interface BGEM3InputQueryAndContexts {
   */
   truncate_inputs?: boolean;
 }
-interface
+interface Ai_Cf_Baai_Bge_M3_Input_Embedding {
   text: string | string[];
   /**
   * When provided with too long context should the model error out or truncate the context to fit?
   */
   truncate_inputs?: boolean;
 }
-interface
+interface Ai_Cf_Baai_Bge_M3_Input_QueryAnd_Contexts_1 {
   /**
   * A query you wish to perform against the provided contexts. If no query is provided the model with respond with embeddings for contexts
   */
@@ -4542,7 +4984,7 @@ interface BGEM3InputQueryAndContexts1 {
   */
   truncate_inputs?: boolean;
 }
-interface
+interface Ai_Cf_Baai_Bge_M3_Input_Embedding_1 {
   text: string | string[];
   /**
   * When provided with too long context should the model error out or truncate the context to fit?
@@ -4550,11 +4992,11 @@ interface BGEM3InputEmbedding1 {
   truncate_inputs?: boolean;
 }
 type Ai_Cf_Baai_Bge_M3_Output =
-
-
-
-
-interface
+  | Ai_Cf_Baai_Bge_M3_Ouput_Query
+  | Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts
+  | Ai_Cf_Baai_Bge_M3_Ouput_Embedding
+  | Ai_Cf_Baai_Bge_M3_AsyncResponse;
+interface Ai_Cf_Baai_Bge_M3_Ouput_Query {
   response?: {
     /**
     * Index of the context in the request
@@ -4566,7 +5008,7 @@ interface BGEM3OuputQuery {
     score?: number;
   }[];
 }
-interface
+interface Ai_Cf_Baai_Bge_M3_Output_EmbeddingFor_Contexts {
   response?: number[][];
   shape?: number[];
   /**
@@ -4574,7 +5016,7 @@ interface BGEM3OutputEmbeddingForContexts {
   */
   pooling?: "mean" | "cls";
 }
-interface
+interface Ai_Cf_Baai_Bge_M3_Ouput_Embedding {
   shape?: number[];
   /**
   * Embeddings of the requested text values
@@ -4585,6 +5027,12 @@ interface BGEM3OuputEmbedding {
   */
   pooling?: "mean" | "cls";
 }
+interface Ai_Cf_Baai_Bge_M3_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Baai_Bge_M3 {
   inputs: Ai_Cf_Baai_Bge_M3_Input;
   postProcessedOutputs: Ai_Cf_Baai_Bge_M3_Output;
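The embedding outputs above now include an `*_AsyncResponse` arm that carries only `request_id`; a small sketch of a type guard for the BGE-M3 case (how the id is later redeemed is not covered by this diff):

// Sketch: every field on the async arm is optional, so the practical
// discriminator is the presence of request_id on the output union.
function isAsyncReceipt(
  output: Ai_Cf_Baai_Bge_M3_Output,
): output is Ai_Cf_Baai_Bge_M3_AsyncResponse {
  return "request_id" in output && typeof output.request_id === "string";
}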
@@ -4609,8 +5057,10 @@ declare abstract class Base_Ai_Cf_Black_Forest_Labs_Flux_1_Schnell {
   inputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Input;
   postProcessedOutputs: Ai_Cf_Black_Forest_Labs_Flux_1_Schnell_Output;
 }
-type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input =
-
+type Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Input =
+  | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt
+  | Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages;
+interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Prompt {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -4661,7 +5111,7 @@ interface Prompt {
   */
   lora?: string;
 }
-interface
+interface Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Messages {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -4859,10 +5309,10 @@ declare abstract class Base_Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct {
   postProcessedOutputs: Ai_Cf_Meta_Llama_3_2_11B_Vision_Instruct_Output;
 }
 type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input =
-
-
-
-interface
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch;
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -4871,7 +5321,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
   * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
   */
   lora?: string;
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode;
   /**
   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   */
@@ -4913,11 +5363,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Prompt {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode {
   type?: "json_object" | "json_schema";
   json_schema?: unknown;
 }
-interface
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -5025,7 +5475,7 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
     };
   }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1;
   /**
   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   */
@@ -5067,7 +5517,11 @@ interface Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Messages {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_1 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Async_Batch {
   requests?: {
     /**
     * User-supplied reference. This field will be present in the response as well it can be used to reference the request and response. It's NOT validated to be unique.
@@ -5109,9 +5563,13 @@ interface AsyncBatch {
     * Increases the likelihood of the model introducing new topics.
     */
     presence_penalty?: number;
-    response_format?:
+    response_format?: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2;
   }[];
 }
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_JSON_Mode_2 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
 type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
   | {
       /**
@@ -5150,7 +5608,13 @@ type Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output =
       }[];
     }
   | string
-
+  | Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse;
+interface Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_AsyncResponse {
+  /**
+   * The async request id that can be used to obtain the results.
+   */
+  request_id?: string;
+}
 declare abstract class Base_Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast {
   inputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Input;
   postProcessedOutputs: Ai_Cf_Meta_Llama_3_3_70B_Instruct_Fp8_Fast_Output;
@@ -5257,9 +5721,9 @@ declare abstract class Base_Ai_Cf_Baai_Bge_Reranker_Base {
   postProcessedOutputs: Ai_Cf_Baai_Bge_Reranker_Base_Output;
 }
 type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input =
-
-
-interface
+  | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt
+  | Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages;
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Prompt {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -5268,7 +5732,7 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
   * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
   */
   lora?: string;
-  response_format?:
+  response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode;
   /**
   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   */
@@ -5310,7 +5774,11 @@ interface Qwen2_5_Coder_32B_Instruct_Prompt {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Messages {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -5418,7 +5886,7 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
     };
   }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1;
   /**
   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   */
@@ -5460,6 +5928,10 @@ interface Qwen2_5_Coder_32B_Instruct_Messages {
   */
   presence_penalty?: number;
 }
+interface Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_JSON_Mode_1 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
 type Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output = {
   /**
   * The generated text response from the model
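The `response_format` members above now point at named `*_JSON_Mode` interfaces instead of inline literals; a short sketch of a schema-constrained request using the Qwen2.5 Coder messages shape (field values are illustrative, only the types come from this diff):

const input: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input = {
  messages: [
    { role: "system", content: "Reply with JSON only." },
    { role: "user", content: "List three prime numbers." },
  ],
  // json_schema is typed as unknown, so any JSON Schema object is accepted here.
  response_format: {
    type: "json_schema",
    json_schema: {
      type: "object",
      properties: { primes: { type: "array", items: { type: "number" } } },
      required: ["primes"],
    },
  },
};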
@@ -5500,8 +5972,10 @@ declare abstract class Base_Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct {
   inputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Input;
   postProcessedOutputs: Ai_Cf_Qwen_Qwen2_5_Coder_32B_Instruct_Output;
 }
-type Ai_Cf_Qwen_Qwq_32B_Input =
-
+type Ai_Cf_Qwen_Qwq_32B_Input =
+  | Ai_Cf_Qwen_Qwq_32B_Prompt
+  | Ai_Cf_Qwen_Qwq_32B_Messages;
+interface Ai_Cf_Qwen_Qwq_32B_Prompt {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -5551,7 +6025,7 @@ interface Qwen_Qwq_32B_Prompt {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Qwen_Qwq_32B_Messages {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -5773,9 +6247,9 @@ declare abstract class Base_Ai_Cf_Qwen_Qwq_32B {
   postProcessedOutputs: Ai_Cf_Qwen_Qwq_32B_Output;
 }
 type Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Input =
-
-
-interface
+  | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt
+  | Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages;
+interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Prompt {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -5825,7 +6299,7 @@ interface Mistral_Small_3_1_24B_Instruct_Prompt {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Messages {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -6047,9 +6521,9 @@ declare abstract class Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct {
   postProcessedOutputs: Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct_Output;
 }
 type Ai_Cf_Google_Gemma_3_12B_It_Input =
-
-
-interface
+  | Ai_Cf_Google_Gemma_3_12B_It_Prompt
+  | Ai_Cf_Google_Gemma_3_12B_It_Messages;
+interface Ai_Cf_Google_Gemma_3_12B_It_Prompt {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -6099,7 +6573,7 @@ interface Google_Gemma_3_12B_It_Prompt {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Google_Gemma_3_12B_It_Messages {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -6122,20 +6596,7 @@ interface Google_Gemma_3_12B_It_Messages {
       */
       url?: string;
     };
-  }[]
-  | {
-    /**
-    * Type of the content provided
-    */
-    type?: string;
-    text?: string;
-    image_url?: {
-      /**
-      * image uri with data (e.g. data:image/jpeg;base64,/9j/...). HTTP URL will not be accepted
-      */
-      url?: string;
-    };
-  };
+  }[];
   }[];
   functions?: {
     name: string;
@@ -6317,10 +6778,10 @@ declare abstract class Base_Ai_Cf_Google_Gemma_3_12B_It {
   postProcessedOutputs: Ai_Cf_Google_Gemma_3_12B_It_Output;
 }
 type Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input =
-
-
-
-interface
+  | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt
+  | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages
+  | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch;
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -6329,7 +6790,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
   * JSON schema that should be fulfilled for the response.
   */
   guided_json?: object;
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   */
@@ -6371,7 +6832,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -6507,7 +6972,7 @@ interface Ai_Cf_Meta_Llama_4_Messages {
     };
   }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
   * JSON schema that should be fufilled for the response.
   */
@@ -6553,13 +7018,13 @@ interface Ai_Cf_Meta_Llama_4_Messages {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch {
   requests: (
-
-
+    | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner
+    | Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner
   )[];
 }
-interface
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Prompt_Inner {
   /**
   * The input text prompt for the model to generate a response.
   */
@@ -6568,7 +7033,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
   * JSON schema that should be fulfilled for the response.
   */
   guided_json?: object;
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
   * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   */
@@ -6610,7 +7075,7 @@ interface Ai_Cf_Meta_Llama_4_Prompt_Inner {
   */
   presence_penalty?: number;
 }
-interface
+interface Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Messages_Inner {
   /**
   * An array of message objects representing the conversation history.
   */
@@ -6746,7 +7211,7 @@ interface Ai_Cf_Meta_Llama_4_Messages_Inner {
     };
   }
   )[];
-  response_format?:
+  response_format?: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_JSON_Mode;
   /**
   * JSON schema that should be fufilled for the response.
   */
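The Llama 4 Scout input union above gains an `_Async_Batch` arm whose `requests` array mixes prompt-style and messages-style entries; a minimal sketch of such a batch value (only the shape comes from this diff, queueing semantics do not):

const batch: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Async_Batch = {
  requests: [
    { prompt: "Summarize the 4.20251125.0 type changes in one line." },
    {
      prompt: "List the renamed interfaces as JSON.",
      response_format: { type: "json_object" },
    },
  ],
};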
@@ -6845,414 +7310,1813 @@ declare abstract class Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct {
   inputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Input;
   postProcessedOutputs: Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct_Output;
 }
-
-
-
-
-
-  /**
-  * Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param.
-  */
-  custom_topic_mode?: "extended" | "strict";
-  /**
-  * Custom topics you want the model to detect within your input audio or text if present Submit up to 100
-  */
-  custom_topic?: string;
-  /**
-  * Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition those submitted using the custom_intents param
-  */
-  custom_intent_mode?: "extended" | "strict";
-  /**
-  * Custom intents you want the model to detect within your input audio if present
-  */
-  custom_intent?: string;
-  /**
-  * Identifies and extracts key entities from content in submitted audio
-  */
-  detect_entities?: boolean;
-  /**
-  * Identifies the dominant language spoken in submitted audio
-  */
-  detect_language?: boolean;
-  /**
-  * Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0
-  */
-  diarize?: boolean;
+type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input =
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch;
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt {
   /**
-  *
+  * The input text prompt for the model to generate a response.
   */
-
+  prompt: string;
   /**
-  *
+  * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
   */
-
-
-  | "flac"
-  | "mulaw"
-  | "amr-nb"
-  | "amr-wb"
-  | "opus"
-  | "speex"
-  | "g729";
+  lora?: string;
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode;
   /**
-  *
+  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   */
-
+  raw?: boolean;
   /**
-  *
+  * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
   */
-
+  stream?: boolean;
   /**
-  *
+  * The maximum number of tokens to generate in the response.
   */
-
+  max_tokens?: number;
   /**
-  *
+  * Controls the randomness of the output; higher values produce more random results.
   */
-
+  temperature?: number;
   /**
-  *
+  * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
   */
-
+  top_p?: number;
   /**
-  *
+  * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
   */
-
+  top_k?: number;
   /**
-  *
+  * Random seed for reproducibility of the generation.
   */
-
+  seed?: number;
   /**
-  *
+  * Penalty for repeated tokens; higher values discourage repetition.
   */
-
+  repetition_penalty?: number;
   /**
-  *
+  * Decreases the likelihood of the model repeating the same lines verbatim.
   */
-
+  frequency_penalty?: number;
   /**
-  *
+  * Increases the likelihood of the model introducing new topics.
   */
-
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages {
   /**
-  *
+  * An array of message objects representing the conversation history.
   */
-
+  messages: {
+    /**
+    * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
+    */
+    role: string;
+    /**
+    * The content of the message as a string.
+    */
+    content: string;
+  }[];
+  functions?: {
+    name: string;
+    code: string;
+  }[];
   /**
-  *
+  * A list of tools available for the assistant to use.
+  */
+  tools?: (
+    | {
+        /**
+        * The name of the tool. More descriptive the better.
+        */
+        name: string;
+        /**
+        * A brief description of what the tool does.
+        */
+        description: string;
+        /**
+        * Schema defining the parameters accepted by the tool.
+        */
+        parameters: {
+          /**
+          * The type of the parameters object (usually 'object').
+          */
+          type: string;
+          /**
+          * List of required parameter names.
+          */
+          required?: string[];
+          /**
+          * Definitions of each parameter.
+          */
+          properties: {
+            [k: string]: {
+              /**
+              * The data type of the parameter.
+              */
+              type: string;
+              /**
+              * A description of the expected parameter.
+              */
+              description: string;
+            };
+          };
+        };
+      }
+    | {
+        /**
+        * Specifies the type of tool (e.g., 'function').
+        */
+        type: string;
+        /**
+        * Details of the function tool.
+        */
+        function: {
+          /**
+          * The name of the function.
+          */
+          name: string;
+          /**
+          * A brief description of what the function does.
+          */
+          description: string;
+          /**
+          * Schema defining the parameters accepted by the function.
+          */
+          parameters: {
+            /**
+            * The type of the parameters object (usually 'object').
+            */
+            type: string;
+            /**
+            * List of required parameter names.
+            */
+            required?: string[];
+            /**
+            * Definitions of each parameter.
+            */
+            properties: {
+              [k: string]: {
+                /**
+                * The data type of the parameter.
+                */
+                type: string;
+                /**
+                * A description of the expected parameter.
+                */
+                description: string;
+              };
+            };
+          };
+        };
+      }
+  )[];
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1;
+  /**
+  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+  */
+  raw?: boolean;
+  /**
+  * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
+  */
+  stream?: boolean;
+  /**
+  * The maximum number of tokens to generate in the response.
+  */
+  max_tokens?: number;
+  /**
+  * Controls the randomness of the output; higher values produce more random results.
+  */
+  temperature?: number;
+  /**
+  * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+  */
+  top_p?: number;
+  /**
+  * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+  */
+  top_k?: number;
+  /**
+  * Random seed for reproducibility of the generation.
+  */
+  seed?: number;
+  /**
+  * Penalty for repeated tokens; higher values discourage repetition.
+  */
+  repetition_penalty?: number;
+  /**
+  * Decreases the likelihood of the model repeating the same lines verbatim.
+  */
+  frequency_penalty?: number;
+  /**
+  * Increases the likelihood of the model introducing new topics.
+  */
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_1 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Async_Batch {
+  requests: (
+    | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1
+    | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1
+  )[];
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Prompt_1 {
+  /**
+  * The input text prompt for the model to generate a response.
+  */
+  prompt: string;
+  /**
+  * Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model.
+  */
+  lora?: string;
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2;
+  /**
+  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+  */
+  raw?: boolean;
+  /**
+  * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
+  */
+  stream?: boolean;
+  /**
+  * The maximum number of tokens to generate in the response.
+  */
+  max_tokens?: number;
+  /**
+  * Controls the randomness of the output; higher values produce more random results.
+  */
+  temperature?: number;
+  /**
+  * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+  */
+  top_p?: number;
+  /**
+  * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+  */
+  top_k?: number;
+  /**
+  * Random seed for reproducibility of the generation.
+  */
+  seed?: number;
+  /**
+  * Penalty for repeated tokens; higher values discourage repetition.
+  */
+  repetition_penalty?: number;
+  /**
+  * Decreases the likelihood of the model repeating the same lines verbatim.
+  */
+  frequency_penalty?: number;
+  /**
+  * Increases the likelihood of the model introducing new topics.
+  */
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_2 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Messages_1 {
+  /**
+  * An array of message objects representing the conversation history.
+  */
+  messages: {
+    /**
+    * The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool').
+    */
+    role: string;
+    /**
+    * The content of the message as a string.
+    */
+    content: string;
+  }[];
+  functions?: {
+    name: string;
+    code: string;
+  }[];
+  /**
+  * A list of tools available for the assistant to use.
+  */
+  tools?: (
+    | {
+        /**
+        * The name of the tool. More descriptive the better.
+        */
+        name: string;
+        /**
+        * A brief description of what the tool does.
+        */
+        description: string;
+        /**
+        * Schema defining the parameters accepted by the tool.
+        */
+        parameters: {
+          /**
+          * The type of the parameters object (usually 'object').
+          */
+          type: string;
+          /**
+          * List of required parameter names.
+          */
+          required?: string[];
+          /**
+          * Definitions of each parameter.
+          */
+          properties: {
+            [k: string]: {
+              /**
+              * The data type of the parameter.
+              */
+              type: string;
+              /**
+              * A description of the expected parameter.
+              */
+              description: string;
+            };
+          };
+        };
+      }
+    | {
+        /**
+        * Specifies the type of tool (e.g., 'function').
+        */
+        type: string;
+        /**
+        * Details of the function tool.
+        */
+        function: {
+          /**
+          * The name of the function.
+          */
+          name: string;
+          /**
+          * A brief description of what the function does.
+          */
+          description: string;
+          /**
+          * Schema defining the parameters accepted by the function.
+          */
+          parameters: {
+            /**
+            * The type of the parameters object (usually 'object').
+            */
+            type: string;
+            /**
+            * List of required parameter names.
+            */
+            required?: string[];
+            /**
+            * Definitions of each parameter.
+            */
+            properties: {
+              [k: string]: {
+                /**
+                * The data type of the parameter.
+                */
+                type: string;
+                /**
+                * A description of the expected parameter.
+                */
+                description: string;
+              };
+            };
+          };
+        };
+      }
+  )[];
+  response_format?: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3;
+  /**
+  * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
+  */
+  raw?: boolean;
+  /**
+  * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
+  */
+  stream?: boolean;
+  /**
+  * The maximum number of tokens to generate in the response.
+  */
+  max_tokens?: number;
+  /**
+  * Controls the randomness of the output; higher values produce more random results.
+  */
+  temperature?: number;
+  /**
+  * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses.
+  */
+  top_p?: number;
+  /**
+  * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises.
+  */
+  top_k?: number;
+  /**
+  * Random seed for reproducibility of the generation.
+  */
+  seed?: number;
+  /**
+  * Penalty for repeated tokens; higher values discourage repetition.
+  */
+  repetition_penalty?: number;
+  /**
+  * Decreases the likelihood of the model repeating the same lines verbatim.
+  */
+  frequency_penalty?: number;
+  /**
+  * Increases the likelihood of the model introducing new topics.
+  */
+  presence_penalty?: number;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_JSON_Mode_3 {
+  type?: "json_object" | "json_schema";
+  json_schema?: unknown;
+}
+type Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output =
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response
+  | string
+  | Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse;
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Chat_Completion_Response {
+  /**
+  * Unique identifier for the completion
+  */
+  id?: string;
+  /**
+  * Object type identifier
+  */
+  object?: "chat.completion";
+  /**
+  * Unix timestamp of when the completion was created
+  */
+  created?: number;
+  /**
+  * Model used for the completion
+  */
+  model?: string;
+  /**
+  * List of completion choices
+  */
+  choices?: {
+    /**
+    * Index of the choice in the list
+    */
+    index?: number;
+    /**
+    * The message generated by the model
+    */
+    message?: {
+      /**
+      * Role of the message author
+      */
+      role: string;
+      /**
+      * The content of the message
+      */
+      content: string;
+      /**
+      * Internal reasoning content (if available)
+      */
+      reasoning_content?: string;
+      /**
+      * Tool calls made by the assistant
+      */
+      tool_calls?: {
+        /**
+        * Unique identifier for the tool call
+        */
+        id: string;
+        /**
+        * Type of tool call
+        */
+        type: "function";
+        function: {
+          /**
+          * Name of the function to call
+          */
+          name: string;
+          /**
+          * JSON string of arguments for the function
+          */
+          arguments: string;
+        };
+      }[];
+    };
+    /**
+    * Reason why the model stopped generating
+    */
+    finish_reason?: string;
+    /**
+    * Stop reason (may be null)
+    */
+    stop_reason?: string | null;
+    /**
+    * Log probabilities (if requested)
+    */
+    logprobs?: {} | null;
+  }[];
+  /**
+  * Usage statistics for the inference request
+  */
+  usage?: {
+    /**
+    * Total number of tokens in input
+    */
+    prompt_tokens?: number;
+    /**
+    * Total number of tokens in output
+    */
+    completion_tokens?: number;
+    /**
+    * Total number of input and output tokens
+    */
+    total_tokens?: number;
+  };
+  /**
+  * Log probabilities for the prompt (if requested)
+  */
+  prompt_logprobs?: {} | null;
+}
+interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Text_Completion_Response {
+  /**
+  * Unique identifier for the completion
+  */
+  id?: string;
+  /**
+  * Object type identifier
+  */
+  object?: "text_completion";
+  /**
+  * Unix timestamp of when the completion was created
+  */
+  created?: number;
7859
|
+
/**
|
|
7860
|
+
* Model used for the completion
|
|
7861
|
+
*/
|
|
7862
|
+
model?: string;
|
|
7863
|
+
/**
|
|
7864
|
+
* List of completion choices
|
|
7865
|
+
*/
|
|
7866
|
+
choices?: {
|
|
7867
|
+
/**
|
|
7868
|
+
* Index of the choice in the list
|
|
7869
|
+
*/
|
|
7870
|
+
index: number;
|
|
7871
|
+
/**
|
|
7872
|
+
* The generated text completion
|
|
7873
|
+
*/
|
|
7874
|
+
text: string;
|
|
7875
|
+
/**
|
|
7876
|
+
* Reason why the model stopped generating
|
|
7877
|
+
*/
|
|
7878
|
+
finish_reason: string;
|
|
7879
|
+
/**
|
|
7880
|
+
* Stop reason (may be null)
|
|
7881
|
+
*/
|
|
7882
|
+
stop_reason?: string | null;
|
|
7883
|
+
/**
|
|
7884
|
+
* Log probabilities (if requested)
|
|
7885
|
+
*/
|
|
7886
|
+
logprobs?: {} | null;
|
|
7887
|
+
/**
|
|
7888
|
+
* Log probabilities for the prompt (if requested)
|
|
7889
|
+
*/
|
|
7890
|
+
prompt_logprobs?: {} | null;
|
|
7891
|
+
}[];
|
|
7892
|
+
/**
|
|
7893
|
+
* Usage statistics for the inference request
|
|
7894
|
+
*/
|
|
7895
|
+
usage?: {
|
|
7896
|
+
/**
|
|
7897
|
+
* Total number of tokens in input
|
|
7898
|
+
*/
|
|
7899
|
+
prompt_tokens?: number;
|
|
7900
|
+
/**
|
|
7901
|
+
* Total number of tokens in output
|
|
7902
|
+
*/
|
|
7903
|
+
completion_tokens?: number;
|
|
7904
|
+
/**
|
|
7905
|
+
* Total number of input and output tokens
|
|
7906
|
+
*/
|
|
7907
|
+
total_tokens?: number;
|
|
7908
|
+
};
|
|
7909
|
+
}
|
|
7910
|
+
interface Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_AsyncResponse {
|
|
7911
|
+
/**
|
|
7912
|
+
* The async request id that can be used to obtain the results.
|
|
7913
|
+
*/
|
|
7914
|
+
request_id?: string;
|
|
7915
|
+
}
|
|
7916
|
+
declare abstract class Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8 {
|
|
7917
|
+
inputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Input;
|
|
7918
|
+
postProcessedOutputs: Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8_Output;
|
|
7919
|
+
}
|
|
7920
|
+
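Illustrative usage (not part of the published typings): a minimal Worker sketch, assuming a Workers AI binding named AI is configured; it calls the newly typed "@cf/qwen/qwen3-30b-a3b-fp8" entry. The output is the union above, so a non-streaming chat request typically resolves to the chat.completion-shaped object.

// Sketch only; the binding name `AI` and the Env shape are assumptions, not part of this diff.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const out = await env.AI.run("@cf/qwen/qwen3-30b-a3b-fp8", {
      messages: [{ role: "user", content: "Write a haiku about edge computing." }],
      max_tokens: 128,
    });
    // `out` may be a chat.completion object, a text_completion object, a raw string,
    // or an async acknowledgement carrying `request_id`.
    return Response.json(out);
  },
};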
interface Ai_Cf_Deepgram_Nova_3_Input {
  audio: {
    body: object;
    contentType: string;
  };
  /** Sets how the model will interpret strings submitted to the custom_topic param. When strict, the model will only return topics submitted using the custom_topic param. When extended, the model will return its own detected topics in addition to those submitted using the custom_topic param. */
  custom_topic_mode?: "extended" | "strict";
  /** Custom topics you want the model to detect within your input audio or text if present. Submit up to 100. */
  custom_topic?: string;
  /** Sets how the model will interpret intents submitted to the custom_intent param. When strict, the model will only return intents submitted using the custom_intent param. When extended, the model will return its own detected intents in addition to those submitted using the custom_intent param. */
  custom_intent_mode?: "extended" | "strict";
  /** Custom intents you want the model to detect within your input audio if present */
  custom_intent?: string;
  /** Identifies and extracts key entities from content in submitted audio */
  detect_entities?: boolean;
  /** Identifies the dominant language spoken in submitted audio */
  detect_language?: boolean;
  /** Recognize speaker changes. Each word in the transcript will be assigned a speaker number starting at 0 */
  diarize?: boolean;
  /** Identify and extract key entities from content in submitted audio */
  dictation?: boolean;
  /** Specify the expected encoding of your submitted audio */
  encoding?:
    | "linear16"
    | "flac"
    | "mulaw"
    | "amr-nb"
    | "amr-wb"
    | "opus"
    | "speex"
    | "g729";
  /** Arbitrary key-value pairs that are attached to the API response for usage in downstream processing */
  extra?: string;
  /** Filler Words can help transcribe interruptions in your audio, like 'uh' and 'um' */
  filler_words?: boolean;
  /** Key term prompting can boost or suppress specialized terminology and brands. */
  keyterm?: string;
  /** Keywords can boost or suppress specialized terminology and brands. */
  keywords?: string;
  /** The BCP-47 language tag that hints at the primary spoken language. Depending on the Model and API endpoint you choose only certain languages are available. */
  language?: string;
  /** Spoken measurements will be converted to their corresponding abbreviations. */
  measurements?: boolean;
  /** Opts out requests from the Deepgram Model Improvement Program. Refer to our Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip. */
  mip_opt_out?: boolean;
  /** Mode of operation for the model representing broad area of topic that will be talked about in the supplied audio */
  mode?: "general" | "medical" | "finance";
  /** Transcribe each audio channel independently. */
  multichannel?: boolean;
  /** Numerals converts numbers from written format to numerical format. */
  numerals?: boolean;
  /** Splits audio into paragraphs to improve transcript readability. */
  paragraphs?: boolean;
  /** Profanity Filter looks for recognized profanity and converts it to the nearest recognized non-profane word or removes it from the transcript completely. */
  profanity_filter?: boolean;
  /** Add punctuation and capitalization to the transcript. */
  punctuate?: boolean;
  /** Redaction removes sensitive information from your transcripts. */
  redact?: string;
  /** Search for terms or phrases in submitted audio and replaces them. */
  replace?: string;
  /** Search for terms or phrases in submitted audio. */
  search?: string;
  /** Recognizes the sentiment throughout a transcript or text. */
  sentiment?: boolean;
  /** Apply formatting to transcript output. When set to true, additional formatting will be applied to transcripts to improve readability. */
  smart_format?: boolean;
  /** Detect topics throughout a transcript or text. */
  topics?: boolean;
  /** Segments speech into meaningful semantic units. */
  utterances?: boolean;
  /** Seconds to wait before detecting a pause between words in submitted audio. */
  utt_split?: number;
  /** The number of channels in the submitted audio */
  channels?: number;
  /** Specifies whether the streaming endpoint should provide ongoing transcription updates as more audio is received. When set to true, the endpoint sends continuous updates, meaning transcription results may evolve over time. Note: Supported only for websockets. */
  interim_results?: boolean;
  /** Indicates how long the model will wait to detect whether a speaker has finished speaking or pauses for a significant period of time. When set to a value, the streaming endpoint immediately finalizes the transcription for the processed time range and returns the transcript with a speech_final parameter set to true. Can also be set to false to disable endpointing */
  endpointing?: string;
  /** Indicates that speech has started. You'll begin receiving Speech Started messages upon speech starting. Note: Supported only for websockets. */
  vad_events?: boolean;
  /** Indicates how long the model will wait to send an UtteranceEnd message after a word has been transcribed. Use with interim_results. Note: Supported only for websockets. */
  utterance_end_ms?: boolean;
}
interface Ai_Cf_Deepgram_Nova_3_Output {
  results?: {
    channels?: {
      alternatives?: {
        confidence?: number;
        transcript?: string;
        words?: {
          confidence?: number;
          end?: number;
          start?: number;
          word?: string;
        }[];
      }[];
    }[];
    summary?: {
      result?: string;
      short?: string;
    };
    sentiments?: {
      segments?: {
        text?: string;
        start_word?: number;
        end_word?: number;
        sentiment?: string;
        sentiment_score?: number;
      }[];
      average?: {
        sentiment?: string;
        sentiment_score?: number;
      };
    };
  };
}
declare abstract class Base_Ai_Cf_Deepgram_Nova_3 {
  inputs: Ai_Cf_Deepgram_Nova_3_Input;
  postProcessedOutputs: Ai_Cf_Deepgram_Nova_3_Output;
}
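Illustrative usage (not part of the typings): a minimal sketch, assuming an AI binding and that the caller POSTs the audio as the request body, which is forwarded as the streaming `audio.body`.

// Sketch only; binding name and request handling are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(req: Request, env: Env): Promise<Response> {
    if (!req.body) {
      return new Response("Send audio in the request body", { status: 400 });
    }
    const result = await env.AI.run("@cf/deepgram/nova-3", {
      audio: {
        body: req.body, // ReadableStream of the uploaded audio
        contentType: req.headers.get("content-type") ?? "audio/wav",
      },
      punctuate: true,
      smart_format: true,
    });
    const transcript =
      result.results?.channels?.[0]?.alternatives?.[0]?.transcript ?? "";
    return Response.json({ transcript });
  },
};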
interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input {
  queries?: string | string[];
  /** Optional instruction for the task */
  instruction?: string;
  documents?: string | string[];
  text?: string | string[];
}
interface Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output {
  data?: number[][];
  shape?: number[];
}
declare abstract class Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B {
  inputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Input;
  postProcessedOutputs: Ai_Cf_Qwen_Qwen3_Embedding_0_6B_Output;
}
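Illustrative usage (not part of the typings): a minimal embedding sketch, assuming an AI binding; queries and documents can each be a single string or an array.

// Sketch only; binding name and inputs are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const embeddings = await env.AI.run("@cf/qwen/qwen3-embedding-0.6b", {
      queries: "How do I create a Durable Object?",
      documents: [
        "Durable Objects provide strongly consistent coordination and storage.",
        "Workers KV is an eventually consistent key-value store.",
      ],
    });
    // `data` is number[][] (one vector per input); `shape` describes its dimensions.
    return Response.json({ shape: embeddings.shape, vectors: embeddings.data?.length });
  },
};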
type Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input =
  | {
      /** readable stream with audio data and content-type specified for that data */
      audio: {
        body: object;
        contentType: string;
      };
      /** type of PCM data that's sent to the inference server as a raw array */
      dtype?: "uint8" | "float32" | "float64";
    }
  | {
      /** base64 encoded audio data */
      audio: string;
      /** type of PCM data that's sent to the inference server as a raw array */
      dtype?: "uint8" | "float32" | "float64";
    };
interface Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output {
  /** if true, end-of-turn was detected */
  is_complete?: boolean;
  /** probability of the end-of-turn detection */
  probability?: number;
}
declare abstract class Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2 {
  inputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Input;
  postProcessedOutputs: Ai_Cf_Pipecat_Ai_Smart_Turn_V2_Output;
}
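Illustrative usage (not part of the typings): a minimal end-of-turn detection sketch, assuming an AI binding and that the client POSTs base64-encoded PCM audio; the 0.8 threshold is an arbitrary choice for the sketch.

// Sketch only; binding name, transport, and threshold are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(req: Request, env: Env): Promise<Response> {
    const base64Pcm = await req.text();
    const turn = await env.AI.run("@cf/pipecat-ai/smart-turn-v2", {
      audio: base64Pcm,
      dtype: "float32",
    });
    // `is_complete` flags a detected end of turn; `probability` is its confidence.
    const endOfTurn = Boolean(turn.is_complete) && (turn.probability ?? 0) > 0.8;
    return Response.json({ endOfTurn, probability: turn.probability });
  },
};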
declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_120B {
  inputs: ResponsesInput;
  postProcessedOutputs: ResponsesOutput;
}
declare abstract class Base_Ai_Cf_Openai_Gpt_Oss_20B {
  inputs: ResponsesInput;
  postProcessedOutputs: ResponsesOutput;
}
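Both gpt-oss models now share the Responses API types declared earlier in this diff (the version-specific Ai_Cf_Openai_Gpt_Oss_* input/output types appear in the removed lines below). Illustrative usage, assuming an AI binding; field names come from ResponsesInput/ResponsesOutput.

// Sketch only; binding name and prompt are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const response = await env.AI.run("@cf/openai/gpt-oss-120b", {
      instructions: "You are a concise assistant.",
      input: "Explain what a V8 isolate is in one paragraph.",
      max_output_tokens: 300,
    });
    return Response.json({ text: response.output_text ?? "", usage: response.usage });
  },
};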
interface Ai_Cf_Leonardo_Phoenix_1_0_Input {
  /** A text description of the image you want to generate. */
  prompt: string;
  /** Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt */
  guidance?: number;
  /** Random seed for reproducibility of the image generation */
  seed?: number;
  /** The height of the generated image in pixels */
  height?: number;
  /** The width of the generated image in pixels */
  width?: number;
  /** The number of diffusion steps; higher values can improve quality but take longer */
  num_steps?: number;
  /** Specify what to exclude from the generated images */
  negative_prompt?: string;
}
/** The generated image in JPEG format */
type Ai_Cf_Leonardo_Phoenix_1_0_Output = string;
declare abstract class Base_Ai_Cf_Leonardo_Phoenix_1_0 {
  inputs: Ai_Cf_Leonardo_Phoenix_1_0_Input;
  postProcessedOutputs: Ai_Cf_Leonardo_Phoenix_1_0_Output;
}
interface Ai_Cf_Leonardo_Lucid_Origin_Input {
  /** A text description of the image you want to generate. */
  prompt: string;
  /** Controls how closely the generated image should adhere to the prompt; higher values make the image more aligned with the prompt */
  guidance?: number;
  /** Random seed for reproducibility of the image generation */
  seed?: number;
  /** The height of the generated image in pixels */
  height?: number;
  /** The width of the generated image in pixels */
  width?: number;
  /** The number of diffusion steps; higher values can improve quality but take longer */
  num_steps?: number;
  /** The number of diffusion steps; higher values can improve quality but take longer */
  steps?: number;
}
interface Ai_Cf_Leonardo_Lucid_Origin_Output {
  /** The generated image in Base64 format. */
  image?: string;
}
declare abstract class Base_Ai_Cf_Leonardo_Lucid_Origin {
  inputs: Ai_Cf_Leonardo_Lucid_Origin_Input;
  postProcessedOutputs: Ai_Cf_Leonardo_Lucid_Origin_Output;
}
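Illustrative usage (not part of the typings): a minimal image-generation sketch, assuming an AI binding. Lucid Origin returns base64 in `image`, while Phoenix 1.0 above types its output as a plain string; the decoded media type below is an assumption, not stated by the typings.

// Sketch only; binding name, prompt, and image content type are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const result = await env.AI.run("@cf/leonardo/lucid-origin", {
      prompt: "a lighthouse at dusk, watercolor",
      width: 1024,
      height: 1024,
    });
    // Decode the base64 payload and return it as an image response.
    const bytes = Uint8Array.from(atob(result.image ?? ""), (c) => c.charCodeAt(0));
    return new Response(bytes, { headers: { "content-type": "image/jpeg" } });
  },
};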
interface Ai_Cf_Deepgram_Aura_1_Input {
  /** Speaker used to produce the audio. */
  speaker?:
    | "angus"
    | "asteria"
    | "arcas"
    | "orion"
    | "orpheus"
    | "athena"
    | "luna"
    | "zeus"
    | "perseus"
    | "helios"
    | "hera"
    | "stella";
  /** Encoding of the output audio. */
  encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
  /** Container specifies the file format wrapper for the output audio. The available options depend on the encoding type. */
  container?: "none" | "wav" | "ogg";
  /** The text content to be converted to speech */
  text: string;
  /** Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable. */
  sample_rate?: number;
  /** The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type. */
  bit_rate?: number;
}
/** The generated audio in MP3 format */
type Ai_Cf_Deepgram_Aura_1_Output = string;
declare abstract class Base_Ai_Cf_Deepgram_Aura_1 {
  inputs: Ai_Cf_Deepgram_Aura_1_Input;
  postProcessedOutputs: Ai_Cf_Deepgram_Aura_1_Output;
}
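Illustrative usage (not part of the typings): a minimal text-to-speech sketch, assuming an AI binding. The post-processed output is typed as a string documented as MP3 audio; whether it needs further decoding before being served is not specified by the typings.

// Sketch only; binding name, speaker choice, and audio handling are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const audio = await env.AI.run("@cf/deepgram/aura-1", {
      text: "Your build finished successfully.",
      speaker: "asteria",
      encoding: "mp3",
    });
    return new Response(audio, { headers: { "content-type": "audio/mpeg" } });
  },
};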
interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input {
  /** Input text to translate. Can be a single string or a list of strings. */
  text: string | string[];
  /** Target language to translate to */
  target_language:
    | "asm_Beng"
    | "awa_Deva"
    | "ben_Beng"
    | "bho_Deva"
    | "brx_Deva"
    | "doi_Deva"
    | "eng_Latn"
    | "gom_Deva"
    | "gon_Deva"
    | "guj_Gujr"
    | "hin_Deva"
    | "hne_Deva"
    | "kan_Knda"
    | "kas_Arab"
    | "kas_Deva"
    | "kha_Latn"
    | "lus_Latn"
    | "mag_Deva"
    | "mai_Deva"
    | "mal_Mlym"
    | "mar_Deva"
    | "mni_Beng"
    | "mni_Mtei"
    | "npi_Deva"
    | "ory_Orya"
    | "pan_Guru"
    | "san_Deva"
    | "sat_Olck"
    | "snd_Arab"
    | "snd_Deva"
    | "tam_Taml"
    | "tel_Telu"
    | "urd_Arab"
    | "unr_Deva";
}
interface Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output {
  /** Translated texts */
  translations: string[];
}
declare abstract class Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B {
  inputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Input;
  postProcessedOutputs: Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B_Output;
}
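Illustrative usage (not part of the typings): a minimal translation sketch, assuming an AI binding; target_language must be one of the language_Script codes in the union above, e.g. "hin_Deva" for Hindi.

// Sketch only; binding name and sample sentence are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const result = await env.AI.run("@cf/ai4bharat/indictrans2-en-indic-1B", {
      text: ["The train departs at nine in the morning."],
      target_language: "hin_Deva",
    });
    return Response.json({ translations: result.translations });
  },
};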
type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input =
  | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt
  | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages
  | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch;
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt {
  /** The input text prompt for the model to generate a response. */
  prompt: string;
  /** Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model. */
  lora?: string;
  response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode;
  /** If true, a chat template is not applied and you must adhere to the specific model's expected formatting. */
  raw?: boolean;
  /** If true, the response will be streamed back incrementally using SSE, Server Sent Events. */
  stream?: boolean;
  /** The maximum number of tokens to generate in the response. */
  max_tokens?: number;
  /** Controls the randomness of the output; higher values produce more random results. */
  temperature?: number;
  /** Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses. */
  top_p?: number;
  /** Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises. */
  top_k?: number;
  /** Random seed for reproducibility of the generation. */
  seed?: number;
  /** Penalty for repeated tokens; higher values discourage repetition. */
  repetition_penalty?: number;
  /** Decreases the likelihood of the model repeating the same lines verbatim. */
  frequency_penalty?: number;
  /** Increases the likelihood of the model introducing new topics. */
  presence_penalty?: number;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode {
  type?: "json_object" | "json_schema";
  json_schema?: unknown;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages {
  /** An array of message objects representing the conversation history. */
  messages: {
    /** The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool'). */
    role: string;
    /** The content of the message as a string. */
    content: string;
  }[];
  functions?: {
    name: string;
    code: string;
  }[];
  /** A list of tools available for the assistant to use. */
  tools?: (
    | {
        /** The name of the tool. More descriptive the better. */
        name: string;
        /** A brief description of what the tool does. */
        description: string;
        /** Schema defining the parameters accepted by the tool. */
        parameters: {
          /** The type of the parameters object (usually 'object'). */
          type: string;
          /** List of required parameter names. */
          required?: string[];
          /** Definitions of each parameter. */
          properties: {
            [k: string]: {
              /** The data type of the parameter. */
              type: string;
              /** A description of the expected parameter. */
              description: string;
            };
          };
        };
      }
    | {
        /** Specifies the type of tool (e.g., 'function'). */
        type: string;
        /** Details of the function tool. */
        function: {
          /** The name of the function. */
          name: string;
          /** A brief description of what the function does. */
          description: string;
          /** Schema defining the parameters accepted by the function. */
          parameters: {
            /** The type of the parameters object (usually 'object'). */
            type: string;
            /** List of required parameter names. */
            required?: string[];
            /** Definitions of each parameter. */
            properties: {
              [k: string]: {
                /** The data type of the parameter. */
                type: string;
                /** A description of the expected parameter. */
                description: string;
              };
            };
          };
        };
      }
  )[];
  response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1;
  /** If true, a chat template is not applied and you must adhere to the specific model's expected formatting. */
  raw?: boolean;
  /** If true, the response will be streamed back incrementally using SSE, Server Sent Events. */
  stream?: boolean;
  /** The maximum number of tokens to generate in the response. */
  max_tokens?: number;
  /** Controls the randomness of the output; higher values produce more random results. */
  temperature?: number;
  /** Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses. */
  top_p?: number;
  /** Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises. */
  top_k?: number;
  /** Random seed for reproducibility of the generation. */
  seed?: number;
  /** Penalty for repeated tokens; higher values discourage repetition. */
  repetition_penalty?: number;
  /** Decreases the likelihood of the model repeating the same lines verbatim. */
  frequency_penalty?: number;
  /** Increases the likelihood of the model introducing new topics. */
  presence_penalty?: number;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_1 {
  type?: "json_object" | "json_schema";
  json_schema?: unknown;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Async_Batch {
  requests: (
    | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1
    | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1
  )[];
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Prompt_1 {
  /** The input text prompt for the model to generate a response. */
  prompt: string;
  /** Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model. */
  lora?: string;
  response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2;
  /** If true, a chat template is not applied and you must adhere to the specific model's expected formatting. */
  raw?: boolean;
  /** If true, the response will be streamed back incrementally using SSE, Server Sent Events. */
  stream?: boolean;
  /** The maximum number of tokens to generate in the response. */
  max_tokens?: number;
  /** Controls the randomness of the output; higher values produce more random results. */
  temperature?: number;
  /** Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses. */
  top_p?: number;
  /** Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises. */
  top_k?: number;
  /** Random seed for reproducibility of the generation. */
  seed?: number;
  /** Penalty for repeated tokens; higher values discourage repetition. */
  repetition_penalty?: number;
  /** Decreases the likelihood of the model repeating the same lines verbatim. */
  frequency_penalty?: number;
  /** Increases the likelihood of the model introducing new topics. */
  presence_penalty?: number;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_2 {
  type?: "json_object" | "json_schema";
  json_schema?: unknown;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Messages_1 {
  /** An array of message objects representing the conversation history. */
  messages: {
    /** The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool'). */
    role: string;
    /** The content of the message as a string. */
    content: string;
  }[];
  functions?: {
    name: string;
    code: string;
  }[];
  /** A list of tools available for the assistant to use. */
  tools?: (
    | {
        /** The name of the tool. More descriptive the better. */
        name: string;
        /** A brief description of what the tool does. */
        description: string;
        /** Schema defining the parameters accepted by the tool. */
        parameters: {
          /** The type of the parameters object (usually 'object'). */
          type: string;
          /** List of required parameter names. */
          required?: string[];
          /** Definitions of each parameter. */
          properties: {
            [k: string]: {
              /** The data type of the parameter. */
              type: string;
              /** A description of the expected parameter. */
              description: string;
            };
          };
        };
      }
    | {
        /** Specifies the type of tool (e.g., 'function'). */
        type: string;
        /** Details of the function tool. */
        function: {
          /** The name of the function. */
          name: string;
          /** A brief description of what the function does. */
          description: string;
          /** Schema defining the parameters accepted by the function. */
          parameters: {
            /** The type of the parameters object (usually 'object'). */
            type: string;
            /** List of required parameter names. */
            required?: string[];
            /** Definitions of each parameter. */
            properties: {
              [k: string]: {
                /** The data type of the parameter. */
                type: string;
                /** A description of the expected parameter. */
                description: string;
              };
            };
          };
        };
      }
  )[];
  response_format?: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3;
  /** If true, a chat template is not applied and you must adhere to the specific model's expected formatting. */
  raw?: boolean;
  /** If true, the response will be streamed back incrementally using SSE, Server Sent Events. */
  stream?: boolean;
  /** The maximum number of tokens to generate in the response. */
  max_tokens?: number;
  /** Controls the randomness of the output; higher values produce more random results. */
  temperature?: number;
  /** Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses. */
  top_p?: number;
  /** Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises. */
  top_k?: number;
  /** Random seed for reproducibility of the generation. */
  seed?: number;
  /** Penalty for repeated tokens; higher values discourage repetition. */
  repetition_penalty?: number;
  /** Decreases the likelihood of the model repeating the same lines verbatim. */
  frequency_penalty?: number;
  /** Increases the likelihood of the model introducing new topics. */
  presence_penalty?: number;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_JSON_Mode_3 {
  type?: "json_object" | "json_schema";
  json_schema?: unknown;
}
type Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output =
  | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response
  | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response
  | string
  | Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse;
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Chat_Completion_Response {
  /** Unique identifier for the completion */
  id?: string;
  /** Object type identifier */
  object?: "chat.completion";
  /** Unix timestamp of when the completion was created */
  created?: number;
  /** Model used for the completion */
  model?: string;
  /** List of completion choices */
  choices?: {
    /** Index of the choice in the list */
    index?: number;
    /** The message generated by the model */
    message?: {
      /** Role of the message author */
      role: string;
      /** The content of the message */
      content: string;
      /** Internal reasoning content (if available) */
      reasoning_content?: string;
      /** Tool calls made by the assistant */
      tool_calls?: {
        /** Unique identifier for the tool call */
        id: string;
        /** Type of tool call */
        type: "function";
        function: {
          /** Name of the function to call */
          name: string;
          /** JSON string of arguments for the function */
          arguments: string;
        };
      }[];
    };
    /** Reason why the model stopped generating */
    finish_reason?: string;
    /** Stop reason (may be null) */
    stop_reason?: string | null;
    /** Log probabilities (if requested) */
    logprobs?: {} | null;
  }[];
  /** Usage statistics for the inference request */
  usage?: {
    /** Total number of tokens in input */
    prompt_tokens?: number;
    /** Total number of tokens in output */
    completion_tokens?: number;
    /** Total number of input and output tokens */
    total_tokens?: number;
  };
  /** Log probabilities for the prompt (if requested) */
  prompt_logprobs?: {} | null;
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Text_Completion_Response {
  /** Unique identifier for the completion */
  id?: string;
  /** Object type identifier */
  object?: "text_completion";
  /** Unix timestamp of when the completion was created */
  created?: number;
  /** Model used for the completion */
  model?: string;
  /** List of completion choices */
  choices?: {
    /** Index of the choice in the list */
    index: number;
    /** The generated text completion */
    text: string;
    /** Reason why the model stopped generating */
    finish_reason: string;
    /** Stop reason (may be null) */
    stop_reason?: string | null;
    /** Log probabilities (if requested) */
    logprobs?: {} | null;
    /** Log probabilities for the prompt (if requested) */
    prompt_logprobs?: {} | null;
  }[];
  /** Usage statistics for the inference request */
  usage?: {
    /** Total number of tokens in input */
    prompt_tokens?: number;
    /** Total number of tokens in output */
    completion_tokens?: number;
    /** Total number of input and output tokens */
    total_tokens?: number;
  };
}
interface Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_AsyncResponse {
  /** The async request id that can be used to obtain the results. */
  request_id?: string;
}
declare abstract class Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It {
  inputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Input;
  postProcessedOutputs: Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It_Output;
}
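Illustrative usage (not part of the typings): a minimal structured-output sketch for the Gemma SEA-LION model, assuming an AI binding; the JSON schema and messages are made-up examples of the json_schema response format typed above.

// Sketch only; binding name, schema, and messages are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const reply = await env.AI.run("@cf/aisingapore/gemma-sea-lion-v4-27b-it", {
      messages: [
        { role: "system", content: "Extract the city and date from the user's message." },
        { role: "user", content: "I'm flying to Singapore on 14 March." },
      ],
      response_format: {
        type: "json_schema",
        json_schema: {
          type: "object",
          properties: { city: { type: "string" }, date: { type: "string" } },
          required: ["city", "date"],
        },
      },
    });
    return Response.json(reply);
  },
};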
interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Input {
  /** Input text to embed. Can be a single string or a list of strings. */
  text: string | string[];
}
interface Ai_Cf_Pfnet_Plamo_Embedding_1B_Output {
  /** Embedding vectors, where each vector is a list of floats. */
  data: number[][];
  /**
   * Shape of the embedding data as [number_of_embeddings, embedding_dimension].
   *
   * @minItems 2
   * @maxItems 2
   */
  shape: [number, number];
}
declare abstract class Base_Ai_Cf_Pfnet_Plamo_Embedding_1B {
  inputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Input;
  postProcessedOutputs: Ai_Cf_Pfnet_Plamo_Embedding_1B_Output;
}
interface Ai_Cf_Deepgram_Flux_Input {
  /** Encoding of the audio stream. Currently only supports raw signed little-endian 16-bit PCM. */
  encoding: "linear16";
  /** Sample rate of the audio stream in Hz. */
  sample_rate: string;
  /** End-of-turn confidence required to fire an eager end-of-turn event. When set, enables EagerEndOfTurn and TurnResumed events. Valid Values 0.3 - 0.9. */
  eager_eot_threshold?: string;
  /** End-of-turn confidence required to finish a turn. Valid Values 0.5 - 0.9. */
  eot_threshold?: string;
  /** A turn will be finished when this much time has passed after speech, regardless of EOT confidence. */
  eot_timeout_ms?: string;
  /** Keyterm prompting can improve recognition of specialized terminology. Pass multiple keyterm query parameters to boost multiple keyterms. */
  keyterm?: string;
  /** Opts out requests from the Deepgram Model Improvement Program. Refer to Deepgram Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip */
  mip_opt_out?: "true" | "false";
  /** Label your requests for the purpose of identification during usage reporting */
  tag?: string;
}
/** Output will be returned as websocket messages. */
interface Ai_Cf_Deepgram_Flux_Output {
  /** The unique identifier of the request (uuid) */
  request_id?: string;
  /** Starts at 0 and increments for each message the server sends to the client. */
  sequence_id?: number;
  /** The type of event being reported. */
  event?:
    | "Update"
    | "StartOfTurn"
    | "EagerEndOfTurn"
    | "TurnResumed"
    | "EndOfTurn";
  /** The index of the current turn */
  turn_index?: number;
  /** Start time in seconds of the audio range that was transcribed */
  audio_window_start?: number;
  /** End time in seconds of the audio range that was transcribed */
  audio_window_end?: number;
  /** Text that was said over the course of the current turn */
  transcript?: string;
  /** The words in the transcript */
  words?: {
    /** The individual punctuated, properly-cased word from the transcript */
    word: string;
    /** Confidence that this word was transcribed correctly */
    confidence: number;
  }[];
  /** Confidence that no more speech is coming in this turn */
  end_of_turn_confidence?: number;
}
declare abstract class Base_Ai_Cf_Deepgram_Flux {
  inputs: Ai_Cf_Deepgram_Flux_Input;
  postProcessedOutputs: Ai_Cf_Deepgram_Flux_Output;
}
interface Ai_Cf_Deepgram_Aura_2_En_Input {
  /** Speaker used to produce the audio. */
  speaker?:
    | "amalthea"
    | "andromeda"
    | "apollo"
    | "arcas"
    | "aries"
    | "asteria"
    | "athena"
    | "atlas"
    | "aurora"
    | "callista"
    | "cora"
    | "cordelia"
    | "delia"
    | "draco"
    | "electra"
    | "harmonia"
    | "helena"
    | "hera"
    | "hermes"
    | "hyperion"
    | "iris"
    | "janus"
    | "juno"
    | "jupiter"
    | "luna"
    | "mars"
    | "minerva"
    | "neptune"
    | "odysseus"
    | "ophelia"
    | "orion"
    | "orpheus"
    | "pandora"
    | "phoebe"
    | "pluto"
    | "saturn"
    | "thalia"
    | "theia"
    | "vesta"
    | "zeus";
  /** Encoding of the output audio. */
@@ -7277,10 +9141,54 @@ interface Ai_Cf_Deepgram_Aura_1_Input {
/** The generated audio in MP3 format */
type Ai_Cf_Deepgram_Aura_2_En_Output = string;
declare abstract class Base_Ai_Cf_Deepgram_Aura_2_En {
  inputs: Ai_Cf_Deepgram_Aura_2_En_Input;
  postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_En_Output;
}
interface Ai_Cf_Deepgram_Aura_2_Es_Input {
  /** Speaker used to produce the audio. */
  speaker?:
    | "sirio"
    | "nestor"
    | "carina"
    | "celeste"
    | "alvaro"
    | "diana"
    | "aquila"
    | "selena"
    | "estrella"
    | "javier";
  /** Encoding of the output audio. */
  encoding?: "linear16" | "flac" | "mulaw" | "alaw" | "mp3" | "opus" | "aac";
  /** Container specifies the file format wrapper for the output audio. The available options depend on the encoding type. */
  container?: "none" | "wav" | "ogg";
  /** The text content to be converted to speech */
  text: string;
  /** Sample Rate specifies the sample rate for the output audio. Based on the encoding, different sample rates are supported. For some encodings, the sample rate is not configurable. */
  sample_rate?: number;
  /** The bitrate of the audio in bits per second. Choose from predefined ranges or specific values based on the encoding type. */
  bit_rate?: number;
}
/** The generated audio in MP3 format */
type Ai_Cf_Deepgram_Aura_2_Es_Output = string;
declare abstract class Base_Ai_Cf_Deepgram_Aura_2_Es {
  inputs: Ai_Cf_Deepgram_Aura_2_Es_Input;
  postProcessedOutputs: Ai_Cf_Deepgram_Aura_2_Es_Output;
}
 interface AiModels {
   "@cf/huggingface/distilbert-sst-2-int8": BaseAiTextClassification;
@@ -7325,12 +9233,12 @@ interface AiModels {
   "@cf/meta/llama-3-8b-instruct": BaseAiTextGeneration;
   "@cf/fblgit/una-cybertron-7b-v2-bf16": BaseAiTextGeneration;
   "@cf/meta/llama-3-8b-instruct-awq": BaseAiTextGeneration;
-  "@hf/meta-llama/meta-llama-3-8b-instruct": BaseAiTextGeneration;
   "@cf/meta/llama-3.1-8b-instruct-fp8": BaseAiTextGeneration;
   "@cf/meta/llama-3.1-8b-instruct-awq": BaseAiTextGeneration;
   "@cf/meta/llama-3.2-3b-instruct": BaseAiTextGeneration;
   "@cf/meta/llama-3.2-1b-instruct": BaseAiTextGeneration;
   "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b": BaseAiTextGeneration;
+  "@cf/ibm-granite/granite-4.0-h-micro": BaseAiTextGeneration;
   "@cf/facebook/bart-large-cnn": BaseAiSummarization;
   "@cf/llava-hf/llava-1.5-7b-hf": BaseAiImageToText;
   "@cf/baai/bge-base-en-v1.5": Base_Ai_Cf_Baai_Bge_Base_En_V1_5;
@@ -7352,13 +9260,21 @@ interface AiModels {
   "@cf/mistralai/mistral-small-3.1-24b-instruct": Base_Ai_Cf_Mistralai_Mistral_Small_3_1_24B_Instruct;
   "@cf/google/gemma-3-12b-it": Base_Ai_Cf_Google_Gemma_3_12B_It;
   "@cf/meta/llama-4-scout-17b-16e-instruct": Base_Ai_Cf_Meta_Llama_4_Scout_17B_16E_Instruct;
+  "@cf/qwen/qwen3-30b-a3b-fp8": Base_Ai_Cf_Qwen_Qwen3_30B_A3B_Fp8;
   "@cf/deepgram/nova-3": Base_Ai_Cf_Deepgram_Nova_3;
+  "@cf/qwen/qwen3-embedding-0.6b": Base_Ai_Cf_Qwen_Qwen3_Embedding_0_6B;
   "@cf/pipecat-ai/smart-turn-v2": Base_Ai_Cf_Pipecat_Ai_Smart_Turn_V2;
   "@cf/openai/gpt-oss-120b": Base_Ai_Cf_Openai_Gpt_Oss_120B;
   "@cf/openai/gpt-oss-20b": Base_Ai_Cf_Openai_Gpt_Oss_20B;
   "@cf/leonardo/phoenix-1.0": Base_Ai_Cf_Leonardo_Phoenix_1_0;
   "@cf/leonardo/lucid-origin": Base_Ai_Cf_Leonardo_Lucid_Origin;
   "@cf/deepgram/aura-1": Base_Ai_Cf_Deepgram_Aura_1;
+  "@cf/ai4bharat/indictrans2-en-indic-1B": Base_Ai_Cf_Ai4Bharat_Indictrans2_En_Indic_1B;
+  "@cf/aisingapore/gemma-sea-lion-v4-27b-it": Base_Ai_Cf_Aisingapore_Gemma_Sea_Lion_V4_27B_It;
+  "@cf/pfnet/plamo-embedding-1b": Base_Ai_Cf_Pfnet_Plamo_Embedding_1B;
+  "@cf/deepgram/flux": Base_Ai_Cf_Deepgram_Flux;
+  "@cf/deepgram/aura-2-en": Base_Ai_Cf_Deepgram_Aura_2_En;
+  "@cf/deepgram/aura-2-es": Base_Ai_Cf_Deepgram_Aura_2_Es;
 }
 type AiOptions = {
   /**
@@ -7370,6 +9286,16 @@ type AiOptions = {
    * Establish websocket connections, only works for supported models
    */
   websocket?: boolean;
+  /**
+   * Tag your requests to group and view them in the Cloudflare dashboard.
+   *
+   * Rules:
+   * Tags must only contain letters, numbers, and the symbols: : - . / @
+   * Each tag can have a maximum of 50 characters.
+   * A maximum of 5 tags is allowed per request.
+   * Duplicate tags will be removed.
+   */
+  tags: string[];
   gateway?: GatewayOptions;
   returnRawResponse?: boolean;
   prefix?: string;
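Illustrative usage (not part of the typings): a minimal sketch of the new per-request tags option, assuming an AI binding; the model and tag values are arbitrary examples and the options argument is passed as the third parameter of run().

// Sketch only; binding name, model choice, and tag values are assumptions.
interface Env {
  AI: Ai;
}
export default {
  async fetch(_req: Request, env: Env): Promise<Response> {
    const answer = await env.AI.run(
      "@cf/meta/llama-3.1-8b-instruct-fp8",
      { prompt: "Name three rivers in Europe." },
      { tags: ["team:search", "env:prod"] },
    );
    return Response.json(answer);
  },
};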
@@ -9457,12 +11383,13 @@ declare namespace Rpc {
   export type Provider<
     T extends object,
     Reserved extends string = never,
-  > = MaybeCallableProvider<T> &
+  > = MaybeCallableProvider<T> &
+    Pick<
+      {
+        [K in keyof T]: MethodOrProperty<T[K]>;
+      },
+      Exclude<keyof T, Reserved | symbol | keyof StubBase<never>>
+    >;
 }
 declare namespace Cloudflare {
   // Type of `env`.