scale-gp-beta 0.1.0a4__py3-none-any.whl → 0.1.0a6__py3-none-any.whl

This diff shows the content changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
Files changed (42):
  1. scale_gp_beta/_client.py +35 -17
  2. scale_gp_beta/_version.py +1 -1
  3. scale_gp_beta/resources/__init__.py +55 -27
  4. scale_gp_beta/resources/dataset_items.py +586 -0
  5. scale_gp_beta/resources/datasets.py +569 -0
  6. scale_gp_beta/resources/evaluation_items.py +295 -0
  7. scale_gp_beta/resources/{question_sets.py → evaluations.py} +259 -273
  8. scale_gp_beta/types/__init__.py +21 -11
  9. scale_gp_beta/types/dataset.py +27 -0
  10. scale_gp_beta/types/dataset_create_params.py +17 -0
  11. scale_gp_beta/types/{question_set_delete_response.py → dataset_delete_response.py} +3 -3
  12. scale_gp_beta/types/dataset_item.py +27 -0
  13. scale_gp_beta/types/dataset_item_batch_create_params.py +16 -0
  14. scale_gp_beta/types/dataset_item_batch_create_response.py +15 -0
  15. scale_gp_beta/types/dataset_item_delete_response.py +16 -0
  16. scale_gp_beta/types/dataset_item_list_params.py +30 -0
  17. scale_gp_beta/types/dataset_item_retrieve_params.py +13 -0
  18. scale_gp_beta/types/dataset_item_update_params.py +13 -0
  19. scale_gp_beta/types/{question_list_params.py → dataset_list_params.py} +4 -2
  20. scale_gp_beta/types/dataset_retrieve_params.py +11 -0
  21. scale_gp_beta/types/dataset_update_params.py +13 -0
  22. scale_gp_beta/types/evaluation.py +30 -0
  23. scale_gp_beta/types/evaluation_archive_response.py +16 -0
  24. scale_gp_beta/types/evaluation_create_params.py +734 -0
  25. scale_gp_beta/types/evaluation_item.py +29 -0
  26. scale_gp_beta/types/{question_set_list_params.py → evaluation_item_list_params.py} +6 -6
  27. scale_gp_beta/types/evaluation_item_retrieve_params.py +11 -0
  28. scale_gp_beta/types/evaluation_list_params.py +18 -0
  29. scale_gp_beta/types/evaluation_retrieve_params.py +11 -0
  30. {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/METADATA +1 -1
  31. {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/RECORD +33 -21
  32. scale_gp_beta/resources/questions.py +0 -396
  33. scale_gp_beta/types/question.py +0 -68
  34. scale_gp_beta/types/question_create_params.py +0 -59
  35. scale_gp_beta/types/question_list.py +0 -27
  36. scale_gp_beta/types/question_set.py +0 -106
  37. scale_gp_beta/types/question_set_create_params.py +0 -115
  38. scale_gp_beta/types/question_set_list.py +0 -27
  39. scale_gp_beta/types/question_set_retrieve_params.py +0 -12
  40. scale_gp_beta/types/question_set_update_params.py +0 -23
  41. {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/WHEEL +0 -0
  42. {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/licenses/LICENSE +0 -0
scale_gp_beta/types/evaluation_create_params.py +734 -0
@@ -0,0 +1,734 @@
1
+ # File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
2
+
3
+ from __future__ import annotations
4
+
5
+ from typing import Dict, List, Union, Iterable
6
+ from typing_extensions import Literal, Required, TypeAlias, TypedDict
7
+
8
+ __all__ = [
9
+ "EvaluationCreateParams",
10
+ "EvaluationStandaloneCreateRequest",
11
+ "EvaluationStandaloneCreateRequestTask",
12
+ "EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest",
13
+ "EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
14
+ "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest",
15
+ "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
16
+ "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
17
+ "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
18
+ "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
19
+ "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
20
+ "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
21
+ "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
22
+ "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
23
+ "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
24
+ "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
25
+ "EvaluationFromDatasetCreateRequest",
26
+ "EvaluationFromDatasetCreateRequestData",
27
+ "EvaluationFromDatasetCreateRequestTask",
28
+ "EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest",
29
+ "EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
30
+ "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest",
31
+ "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
32
+ "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
33
+ "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
34
+ "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
35
+ "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
36
+ "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
37
+ "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
38
+ "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
39
+ "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
40
+ "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
41
+ "EvaluationWithDatasetCreateRequest",
42
+ "EvaluationWithDatasetCreateRequestDataset",
43
+ "EvaluationWithDatasetCreateRequestTask",
44
+ "EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest",
45
+ "EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
46
+ "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest",
47
+ "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
48
+ "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
49
+ "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
50
+ "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
51
+ "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
52
+ "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
53
+ "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
54
+ "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
55
+ "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
56
+ "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
57
+ ]
58
+
59
+
60
+ class EvaluationStandaloneCreateRequest(TypedDict, total=False):
61
+ data: Required[Iterable[Dict[str, object]]]
62
+ """Items to be evaluated"""
63
+
64
+ name: Required[str]
65
+
66
+ description: str
67
+
68
+ tasks: Iterable[EvaluationStandaloneCreateRequestTask]
69
+ """Tasks allow you to augment and evaluate your data"""
70
+
71
+
72
+ class EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
73
+ TypedDict, total=False
74
+ ):
75
+ messages: Required[Union[Iterable[Dict[str, object]], str]]
76
+
77
+ model: Required[str]
78
+
79
+ audio: Union[Dict[str, object], str]
80
+
81
+ frequency_penalty: Union[float, str]
82
+
83
+ function_call: Union[Dict[str, object], str]
84
+
85
+ functions: Union[Iterable[Dict[str, object]], str]
86
+
87
+ logit_bias: Union[Dict[str, int], str]
88
+
89
+ logprobs: Union[bool, str]
90
+
91
+ max_completion_tokens: Union[int, str]
92
+
93
+ max_tokens: Union[int, str]
94
+
95
+ metadata: Union[Dict[str, str], str]
96
+
97
+ modalities: Union[List[str], str]
98
+
99
+ n: Union[int, str]
100
+
101
+ parallel_tool_calls: Union[bool, str]
102
+
103
+ prediction: Union[Dict[str, object], str]
104
+
105
+ presence_penalty: Union[float, str]
106
+
107
+ reasoning_effort: str
108
+
109
+ response_format: Union[Dict[str, object], str]
110
+
111
+ seed: Union[int, str]
112
+
113
+ stop: str
114
+
115
+ store: Union[bool, str]
116
+
117
+ temperature: Union[float, str]
118
+
119
+ tool_choice: str
120
+
121
+ tools: Union[Iterable[Dict[str, object]], str]
122
+
123
+ top_k: Union[int, str]
124
+
125
+ top_logprobs: Union[int, str]
126
+
127
+ top_p: Union[float, str]
128
+
129
+
130
+ EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
131
+ EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
132
+ ]
133
+
134
+
135
+ class EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
136
+ configuration: Required[EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
137
+
138
+ alias: str
139
+ """Alias to title the results column. Defaults to the `task_type`"""
140
+
141
+ task_type: Literal["chat_completion"]
142
+
143
+
144
+ class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
145
+ TypedDict, total=False
146
+ ):
147
+ num_retries: int
148
+
149
+ timeout_seconds: int
150
+
151
+
152
+ EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
153
+ EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
154
+ str,
155
+ ]
156
+
157
+
158
+ class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
159
+ model: Required[str]
160
+
161
+ args: Union[Dict[str, object], str]
162
+
163
+ inference_configuration: (
164
+ EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
165
+ )
166
+
167
+
168
+ class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
169
+ configuration: Required[EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
170
+
171
+ alias: str
172
+ """Alias to title the results column. Defaults to the `task_type`"""
173
+
174
+ task_type: Literal["inference"]
175
+
176
+
177
+ class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
178
+ TypedDict, total=False
179
+ ):
180
+ request: Required[str]
181
+ """Request inputs"""
182
+
183
+ response: Required[str]
184
+ """Response outputs"""
185
+
186
+ session_data: Dict[str, object]
187
+ """Session data corresponding to the request response pair"""
188
+
189
+
190
+ class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
191
+ TypedDict, total=False
192
+ ):
193
+ current_node: Required[str]
194
+
195
+ state: Required[Dict[str, object]]
196
+
197
+
198
+ class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
199
+ TypedDict, total=False
200
+ ):
201
+ duration_ms: Required[int]
202
+
203
+ node_id: Required[str]
204
+
205
+ operation_input: Required[str]
206
+
207
+ operation_output: Required[str]
208
+
209
+ operation_type: Required[str]
210
+
211
+ start_timestamp: Required[str]
212
+
213
+ workflow_id: Required[str]
214
+
215
+ operation_metadata: Dict[str, object]
216
+
217
+
218
+ class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
219
+ TypedDict, total=False
220
+ ):
221
+ concurrent: bool
222
+
223
+ initial_state: EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
224
+
225
+ partial_trace: Iterable[
226
+ EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
227
+ ]
228
+
229
+ use_channels: bool
230
+
231
+
232
+ EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
233
+ EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
234
+ str,
235
+ ]
236
+
237
+
238
+ class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
239
+ TypedDict, total=False
240
+ ):
241
+ application_variant_id: Required[str]
242
+
243
+ inputs: Required[Union[Dict[str, object], str]]
244
+
245
+ history: Union[
246
+ Iterable[
247
+ EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
248
+ ],
249
+ str,
250
+ ]
251
+
252
+ operation_metadata: Union[Dict[str, object], str]
253
+
254
+ overrides: EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
255
+ """Execution override options for agentic applications"""
256
+
257
+
258
+ class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
259
+ configuration: Required[EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration]
260
+
261
+ alias: str
262
+ """Alias to title the results column. Defaults to the `task_type`"""
263
+
264
+ task_type: Literal["application_variant"]
265
+
266
+
267
+ EvaluationStandaloneCreateRequestTask: TypeAlias = Union[
268
+ EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest,
269
+ EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest,
270
+ EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
271
+ ]
272
+
273
+
274
+ class EvaluationFromDatasetCreateRequest(TypedDict, total=False):
275
+ data: Required[Iterable[EvaluationFromDatasetCreateRequestData]]
276
+ """Items to be evaluated, including references to the input dataset items"""
277
+
278
+ dataset_id: Required[str]
279
+ """The ID of the dataset containing the items referenced by the `data` field"""
280
+
281
+ name: Required[str]
282
+
283
+ description: str
284
+
285
+ tasks: Iterable[EvaluationFromDatasetCreateRequestTask]
286
+ """Tasks allow you to augment and evaluate your data"""
287
+
288
+
289
+ class EvaluationFromDatasetCreateRequestDataTyped(TypedDict, total=False):
290
+ dataset_item_id: Required[str]
291
+
292
+
293
+ EvaluationFromDatasetCreateRequestData: TypeAlias = Union[
294
+ EvaluationFromDatasetCreateRequestDataTyped, Dict[str, object]
295
+ ]
296
+
297
+
298
+ class EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
299
+ TypedDict, total=False
300
+ ):
301
+ messages: Required[Union[Iterable[Dict[str, object]], str]]
302
+
303
+ model: Required[str]
304
+
305
+ audio: Union[Dict[str, object], str]
306
+
307
+ frequency_penalty: Union[float, str]
308
+
309
+ function_call: Union[Dict[str, object], str]
310
+
311
+ functions: Union[Iterable[Dict[str, object]], str]
312
+
313
+ logit_bias: Union[Dict[str, int], str]
314
+
315
+ logprobs: Union[bool, str]
316
+
317
+ max_completion_tokens: Union[int, str]
318
+
319
+ max_tokens: Union[int, str]
320
+
321
+ metadata: Union[Dict[str, str], str]
322
+
323
+ modalities: Union[List[str], str]
324
+
325
+ n: Union[int, str]
326
+
327
+ parallel_tool_calls: Union[bool, str]
328
+
329
+ prediction: Union[Dict[str, object], str]
330
+
331
+ presence_penalty: Union[float, str]
332
+
333
+ reasoning_effort: str
334
+
335
+ response_format: Union[Dict[str, object], str]
336
+
337
+ seed: Union[int, str]
338
+
339
+ stop: str
340
+
341
+ store: Union[bool, str]
342
+
343
+ temperature: Union[float, str]
344
+
345
+ tool_choice: str
346
+
347
+ tools: Union[Iterable[Dict[str, object]], str]
348
+
349
+ top_k: Union[int, str]
350
+
351
+ top_logprobs: Union[int, str]
352
+
353
+ top_p: Union[float, str]
354
+
355
+
356
+ EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
357
+ EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
358
+ ]
359
+
360
+
361
+ class EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
362
+ configuration: Required[EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
363
+
364
+ alias: str
365
+ """Alias to title the results column. Defaults to the `task_type`"""
366
+
367
+ task_type: Literal["chat_completion"]
368
+
369
+
370
+ class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
371
+ TypedDict, total=False
372
+ ):
373
+ num_retries: int
374
+
375
+ timeout_seconds: int
376
+
377
+
378
+ EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
379
+ EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
380
+ str,
381
+ ]
382
+
383
+
384
+ class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
385
+ model: Required[str]
386
+
387
+ args: Union[Dict[str, object], str]
388
+
389
+ inference_configuration: (
390
+ EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
391
+ )
392
+
393
+
394
+ class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
395
+ configuration: Required[EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
396
+
397
+ alias: str
398
+ """Alias to title the results column. Defaults to the `task_type`"""
399
+
400
+ task_type: Literal["inference"]
401
+
402
+
403
+ class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
404
+ TypedDict, total=False
405
+ ):
406
+ request: Required[str]
407
+ """Request inputs"""
408
+
409
+ response: Required[str]
410
+ """Response outputs"""
411
+
412
+ session_data: Dict[str, object]
413
+ """Session data corresponding to the request response pair"""
414
+
415
+
416
+ class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
417
+ TypedDict, total=False
418
+ ):
419
+ current_node: Required[str]
420
+
421
+ state: Required[Dict[str, object]]
422
+
423
+
424
+ class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
425
+ TypedDict, total=False
426
+ ):
427
+ duration_ms: Required[int]
428
+
429
+ node_id: Required[str]
430
+
431
+ operation_input: Required[str]
432
+
433
+ operation_output: Required[str]
434
+
435
+ operation_type: Required[str]
436
+
437
+ start_timestamp: Required[str]
438
+
439
+ workflow_id: Required[str]
440
+
441
+ operation_metadata: Dict[str, object]
442
+
443
+
444
+ class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
445
+ TypedDict, total=False
446
+ ):
447
+ concurrent: bool
448
+
449
+ initial_state: EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
450
+
451
+ partial_trace: Iterable[
452
+ EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
453
+ ]
454
+
455
+ use_channels: bool
456
+
457
+
458
+ EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
459
+ EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
460
+ str,
461
+ ]
462
+
463
+
464
+ class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
465
+ TypedDict, total=False
466
+ ):
467
+ application_variant_id: Required[str]
468
+
469
+ inputs: Required[Union[Dict[str, object], str]]
470
+
471
+ history: Union[
472
+ Iterable[
473
+ EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
474
+ ],
475
+ str,
476
+ ]
477
+
478
+ operation_metadata: Union[Dict[str, object], str]
479
+
480
+ overrides: EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
481
+ """Execution override options for agentic applications"""
482
+
483
+
484
+ class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
485
+ configuration: Required[
486
+ EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration
487
+ ]
488
+
489
+ alias: str
490
+ """Alias to title the results column. Defaults to the `task_type`"""
491
+
492
+ task_type: Literal["application_variant"]
493
+
494
+
495
+ EvaluationFromDatasetCreateRequestTask: TypeAlias = Union[
496
+ EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest,
497
+ EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest,
498
+ EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
499
+ ]
500
+
501
+
502
+ class EvaluationWithDatasetCreateRequest(TypedDict, total=False):
503
+ data: Required[Iterable[Dict[str, object]]]
504
+ """Items to be evaluated"""
505
+
506
+ dataset: Required[EvaluationWithDatasetCreateRequestDataset]
507
+ """Create a reusable dataset from items in the `data` field"""
508
+
509
+ name: Required[str]
510
+
511
+ description: str
512
+
513
+ tasks: Iterable[EvaluationWithDatasetCreateRequestTask]
514
+ """Tasks allow you to augment and evaluate your data"""
515
+
516
+
517
+ class EvaluationWithDatasetCreateRequestDataset(TypedDict, total=False):
518
+ name: Required[str]
519
+
520
+ description: str
521
+
522
+ keys: List[str]
523
+ """Keys from items in the `data` field that should be included in the dataset.
524
+
525
+ If not provided, all keys will be included.
526
+ """
527
+
528
+
529
+ class EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
530
+ TypedDict, total=False
531
+ ):
532
+ messages: Required[Union[Iterable[Dict[str, object]], str]]
533
+
534
+ model: Required[str]
535
+
536
+ audio: Union[Dict[str, object], str]
537
+
538
+ frequency_penalty: Union[float, str]
539
+
540
+ function_call: Union[Dict[str, object], str]
541
+
542
+ functions: Union[Iterable[Dict[str, object]], str]
543
+
544
+ logit_bias: Union[Dict[str, int], str]
545
+
546
+ logprobs: Union[bool, str]
547
+
548
+ max_completion_tokens: Union[int, str]
549
+
550
+ max_tokens: Union[int, str]
551
+
552
+ metadata: Union[Dict[str, str], str]
553
+
554
+ modalities: Union[List[str], str]
555
+
556
+ n: Union[int, str]
557
+
558
+ parallel_tool_calls: Union[bool, str]
559
+
560
+ prediction: Union[Dict[str, object], str]
561
+
562
+ presence_penalty: Union[float, str]
563
+
564
+ reasoning_effort: str
565
+
566
+ response_format: Union[Dict[str, object], str]
567
+
568
+ seed: Union[int, str]
569
+
570
+ stop: str
571
+
572
+ store: Union[bool, str]
573
+
574
+ temperature: Union[float, str]
575
+
576
+ tool_choice: str
577
+
578
+ tools: Union[Iterable[Dict[str, object]], str]
579
+
580
+ top_k: Union[int, str]
581
+
582
+ top_logprobs: Union[int, str]
583
+
584
+ top_p: Union[float, str]
585
+
586
+
587
+ EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
588
+ EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
589
+ ]
590
+
591
+
592
+ class EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
593
+ configuration: Required[EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
594
+
595
+ alias: str
596
+ """Alias to title the results column. Defaults to the `task_type`"""
597
+
598
+ task_type: Literal["chat_completion"]
599
+
600
+
601
+ class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
602
+ TypedDict, total=False
603
+ ):
604
+ num_retries: int
605
+
606
+ timeout_seconds: int
607
+
608
+
609
+ EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
610
+ EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
611
+ str,
612
+ ]
613
+
614
+
615
+ class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
616
+ model: Required[str]
617
+
618
+ args: Union[Dict[str, object], str]
619
+
620
+ inference_configuration: (
621
+ EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
622
+ )
623
+
624
+
625
+ class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
626
+ configuration: Required[EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
627
+
628
+ alias: str
629
+ """Alias to title the results column. Defaults to the `task_type`"""
630
+
631
+ task_type: Literal["inference"]
632
+
633
+
634
+ class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
635
+ TypedDict, total=False
636
+ ):
637
+ request: Required[str]
638
+ """Request inputs"""
639
+
640
+ response: Required[str]
641
+ """Response outputs"""
642
+
643
+ session_data: Dict[str, object]
644
+ """Session data corresponding to the request response pair"""
645
+
646
+
647
+ class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
648
+ TypedDict, total=False
649
+ ):
650
+ current_node: Required[str]
651
+
652
+ state: Required[Dict[str, object]]
653
+
654
+
655
+ class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
656
+ TypedDict, total=False
657
+ ):
658
+ duration_ms: Required[int]
659
+
660
+ node_id: Required[str]
661
+
662
+ operation_input: Required[str]
663
+
664
+ operation_output: Required[str]
665
+
666
+ operation_type: Required[str]
667
+
668
+ start_timestamp: Required[str]
669
+
670
+ workflow_id: Required[str]
671
+
672
+ operation_metadata: Dict[str, object]
673
+
674
+
675
+ class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
676
+ TypedDict, total=False
677
+ ):
678
+ concurrent: bool
679
+
680
+ initial_state: EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
681
+
682
+ partial_trace: Iterable[
683
+ EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
684
+ ]
685
+
686
+ use_channels: bool
687
+
688
+
689
+ EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
690
+ EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
691
+ str,
692
+ ]
693
+
694
+
695
+ class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
696
+ TypedDict, total=False
697
+ ):
698
+ application_variant_id: Required[str]
699
+
700
+ inputs: Required[Union[Dict[str, object], str]]
701
+
702
+ history: Union[
703
+ Iterable[
704
+ EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
705
+ ],
706
+ str,
707
+ ]
708
+
709
+ operation_metadata: Union[Dict[str, object], str]
710
+
711
+ overrides: EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
712
+ """Execution override options for agentic applications"""
713
+
714
+
715
+ class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
716
+ configuration: Required[
717
+ EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration
718
+ ]
719
+
720
+ alias: str
721
+ """Alias to title the results column. Defaults to the `task_type`"""
722
+
723
+ task_type: Literal["application_variant"]
724
+
725
+
726
+ EvaluationWithDatasetCreateRequestTask: TypeAlias = Union[
727
+ EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest,
728
+ EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest,
729
+ EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
730
+ ]
731
+
732
+ EvaluationCreateParams: TypeAlias = Union[
733
+ EvaluationStandaloneCreateRequest, EvaluationFromDatasetCreateRequest, EvaluationWithDatasetCreateRequest
734
+ ]