scale-gp-beta 0.1.0a4__py3-none-any.whl → 0.1.0a6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- scale_gp_beta/_client.py +35 -17
- scale_gp_beta/_version.py +1 -1
- scale_gp_beta/resources/__init__.py +55 -27
- scale_gp_beta/resources/dataset_items.py +586 -0
- scale_gp_beta/resources/datasets.py +569 -0
- scale_gp_beta/resources/evaluation_items.py +295 -0
- scale_gp_beta/resources/{question_sets.py → evaluations.py} +259 -273
- scale_gp_beta/types/__init__.py +21 -11
- scale_gp_beta/types/dataset.py +27 -0
- scale_gp_beta/types/dataset_create_params.py +17 -0
- scale_gp_beta/types/{question_set_delete_response.py → dataset_delete_response.py} +3 -3
- scale_gp_beta/types/dataset_item.py +27 -0
- scale_gp_beta/types/dataset_item_batch_create_params.py +16 -0
- scale_gp_beta/types/dataset_item_batch_create_response.py +15 -0
- scale_gp_beta/types/dataset_item_delete_response.py +16 -0
- scale_gp_beta/types/dataset_item_list_params.py +30 -0
- scale_gp_beta/types/dataset_item_retrieve_params.py +13 -0
- scale_gp_beta/types/dataset_item_update_params.py +13 -0
- scale_gp_beta/types/{question_list_params.py → dataset_list_params.py} +4 -2
- scale_gp_beta/types/dataset_retrieve_params.py +11 -0
- scale_gp_beta/types/dataset_update_params.py +13 -0
- scale_gp_beta/types/evaluation.py +30 -0
- scale_gp_beta/types/evaluation_archive_response.py +16 -0
- scale_gp_beta/types/evaluation_create_params.py +734 -0
- scale_gp_beta/types/evaluation_item.py +29 -0
- scale_gp_beta/types/{question_set_list_params.py → evaluation_item_list_params.py} +6 -6
- scale_gp_beta/types/evaluation_item_retrieve_params.py +11 -0
- scale_gp_beta/types/evaluation_list_params.py +18 -0
- scale_gp_beta/types/evaluation_retrieve_params.py +11 -0
- {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/METADATA +1 -1
- {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/RECORD +33 -21
- scale_gp_beta/resources/questions.py +0 -396
- scale_gp_beta/types/question.py +0 -68
- scale_gp_beta/types/question_create_params.py +0 -59
- scale_gp_beta/types/question_list.py +0 -27
- scale_gp_beta/types/question_set.py +0 -106
- scale_gp_beta/types/question_set_create_params.py +0 -115
- scale_gp_beta/types/question_set_list.py +0 -27
- scale_gp_beta/types/question_set_retrieve_params.py +0 -12
- scale_gp_beta/types/question_set_update_params.py +0 -23
- {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/WHEEL +0 -0
- {scale_gp_beta-0.1.0a4.dist-info → scale_gp_beta-0.1.0a6.dist-info}/licenses/LICENSE +0 -0
|
@@ -0,0 +1,734 @@
|
|
|
1
|
+
# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
from typing import Dict, List, Union, Iterable
|
|
6
|
+
from typing_extensions import Literal, Required, TypeAlias, TypedDict
|
|
7
|
+
|
|
8
|
+
# Public names exported by this module: the top-level `EvaluationCreateParams`
# union plus the nested request/task/configuration types of the three request
# variants (Standalone, FromDataset, WithDataset). The `*Typed` helper classes
# defined in this module are not listed here.
__all__ = [
    "EvaluationCreateParams",
    "EvaluationStandaloneCreateRequest",
    "EvaluationStandaloneCreateRequestTask",
    "EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest",
    "EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
    "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest",
    "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
    "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
    "EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
    "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
    "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
    "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
    "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
    "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
    "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
    "EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
    "EvaluationFromDatasetCreateRequest",
    "EvaluationFromDatasetCreateRequestData",
    "EvaluationFromDatasetCreateRequestTask",
    "EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest",
    "EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
    "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest",
    "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
    "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
    "EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
    "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
    "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
    "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
    "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
    "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
    "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
    "EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
    "EvaluationWithDatasetCreateRequest",
    "EvaluationWithDatasetCreateRequestDataset",
    "EvaluationWithDatasetCreateRequestTask",
    "EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest",
    "EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
    "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest",
    "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
    "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
    "EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
    "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
    "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
    "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
    "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
    "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
    "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
    "EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
]
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
class EvaluationStandaloneCreateRequest(TypedDict, total=False):
|
|
61
|
+
data: Required[Iterable[Dict[str, object]]]
|
|
62
|
+
"""Items to be evaluated"""
|
|
63
|
+
|
|
64
|
+
name: Required[str]
|
|
65
|
+
|
|
66
|
+
description: str
|
|
67
|
+
|
|
68
|
+
tasks: Iterable[EvaluationStandaloneCreateRequestTask]
|
|
69
|
+
"""Tasks allow you to augment and evaluate your data"""
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
class EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
|
|
73
|
+
TypedDict, total=False
|
|
74
|
+
):
|
|
75
|
+
messages: Required[Union[Iterable[Dict[str, object]], str]]
|
|
76
|
+
|
|
77
|
+
model: Required[str]
|
|
78
|
+
|
|
79
|
+
audio: Union[Dict[str, object], str]
|
|
80
|
+
|
|
81
|
+
frequency_penalty: Union[float, str]
|
|
82
|
+
|
|
83
|
+
function_call: Union[Dict[str, object], str]
|
|
84
|
+
|
|
85
|
+
functions: Union[Iterable[Dict[str, object]], str]
|
|
86
|
+
|
|
87
|
+
logit_bias: Union[Dict[str, int], str]
|
|
88
|
+
|
|
89
|
+
logprobs: Union[bool, str]
|
|
90
|
+
|
|
91
|
+
max_completion_tokens: Union[int, str]
|
|
92
|
+
|
|
93
|
+
max_tokens: Union[int, str]
|
|
94
|
+
|
|
95
|
+
metadata: Union[Dict[str, str], str]
|
|
96
|
+
|
|
97
|
+
modalities: Union[List[str], str]
|
|
98
|
+
|
|
99
|
+
n: Union[int, str]
|
|
100
|
+
|
|
101
|
+
parallel_tool_calls: Union[bool, str]
|
|
102
|
+
|
|
103
|
+
prediction: Union[Dict[str, object], str]
|
|
104
|
+
|
|
105
|
+
presence_penalty: Union[float, str]
|
|
106
|
+
|
|
107
|
+
reasoning_effort: str
|
|
108
|
+
|
|
109
|
+
response_format: Union[Dict[str, object], str]
|
|
110
|
+
|
|
111
|
+
seed: Union[int, str]
|
|
112
|
+
|
|
113
|
+
stop: str
|
|
114
|
+
|
|
115
|
+
store: Union[bool, str]
|
|
116
|
+
|
|
117
|
+
temperature: Union[float, str]
|
|
118
|
+
|
|
119
|
+
tool_choice: str
|
|
120
|
+
|
|
121
|
+
tools: Union[Iterable[Dict[str, object]], str]
|
|
122
|
+
|
|
123
|
+
top_k: Union[int, str]
|
|
124
|
+
|
|
125
|
+
top_logprobs: Union[int, str]
|
|
126
|
+
|
|
127
|
+
top_p: Union[float, str]
|
|
128
|
+
|
|
129
|
+
|
|
130
|
+
EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
|
|
131
|
+
EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
|
|
132
|
+
]
|
|
133
|
+
|
|
134
|
+
|
|
135
|
+
class EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
|
|
136
|
+
configuration: Required[EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
|
|
137
|
+
|
|
138
|
+
alias: str
|
|
139
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
140
|
+
|
|
141
|
+
task_type: Literal["chat_completion"]
|
|
142
|
+
|
|
143
|
+
|
|
144
|
+
class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
|
|
145
|
+
TypedDict, total=False
|
|
146
|
+
):
|
|
147
|
+
num_retries: int
|
|
148
|
+
|
|
149
|
+
timeout_seconds: int
|
|
150
|
+
|
|
151
|
+
|
|
152
|
+
EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
|
|
153
|
+
EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
|
|
154
|
+
str,
|
|
155
|
+
]
|
|
156
|
+
|
|
157
|
+
|
|
158
|
+
class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
|
|
159
|
+
model: Required[str]
|
|
160
|
+
|
|
161
|
+
args: Union[Dict[str, object], str]
|
|
162
|
+
|
|
163
|
+
inference_configuration: (
|
|
164
|
+
EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
|
|
165
|
+
)
|
|
166
|
+
|
|
167
|
+
|
|
168
|
+
class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
|
|
169
|
+
configuration: Required[EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
|
|
170
|
+
|
|
171
|
+
alias: str
|
|
172
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
173
|
+
|
|
174
|
+
task_type: Literal["inference"]
|
|
175
|
+
|
|
176
|
+
|
|
177
|
+
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
|
|
178
|
+
TypedDict, total=False
|
|
179
|
+
):
|
|
180
|
+
request: Required[str]
|
|
181
|
+
"""Request inputs"""
|
|
182
|
+
|
|
183
|
+
response: Required[str]
|
|
184
|
+
"""Response outputs"""
|
|
185
|
+
|
|
186
|
+
session_data: Dict[str, object]
|
|
187
|
+
"""Session data corresponding to the request response pair"""
|
|
188
|
+
|
|
189
|
+
|
|
190
|
+
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
|
|
191
|
+
TypedDict, total=False
|
|
192
|
+
):
|
|
193
|
+
current_node: Required[str]
|
|
194
|
+
|
|
195
|
+
state: Required[Dict[str, object]]
|
|
196
|
+
|
|
197
|
+
|
|
198
|
+
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
|
|
199
|
+
TypedDict, total=False
|
|
200
|
+
):
|
|
201
|
+
duration_ms: Required[int]
|
|
202
|
+
|
|
203
|
+
node_id: Required[str]
|
|
204
|
+
|
|
205
|
+
operation_input: Required[str]
|
|
206
|
+
|
|
207
|
+
operation_output: Required[str]
|
|
208
|
+
|
|
209
|
+
operation_type: Required[str]
|
|
210
|
+
|
|
211
|
+
start_timestamp: Required[str]
|
|
212
|
+
|
|
213
|
+
workflow_id: Required[str]
|
|
214
|
+
|
|
215
|
+
operation_metadata: Dict[str, object]
|
|
216
|
+
|
|
217
|
+
|
|
218
|
+
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
|
|
219
|
+
TypedDict, total=False
|
|
220
|
+
):
|
|
221
|
+
concurrent: bool
|
|
222
|
+
|
|
223
|
+
initial_state: EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
|
|
224
|
+
|
|
225
|
+
partial_trace: Iterable[
|
|
226
|
+
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
|
|
227
|
+
]
|
|
228
|
+
|
|
229
|
+
use_channels: bool
|
|
230
|
+
|
|
231
|
+
|
|
232
|
+
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
|
|
233
|
+
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
|
|
234
|
+
str,
|
|
235
|
+
]
|
|
236
|
+
|
|
237
|
+
|
|
238
|
+
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
|
|
239
|
+
TypedDict, total=False
|
|
240
|
+
):
|
|
241
|
+
application_variant_id: Required[str]
|
|
242
|
+
|
|
243
|
+
inputs: Required[Union[Dict[str, object], str]]
|
|
244
|
+
|
|
245
|
+
history: Union[
|
|
246
|
+
Iterable[
|
|
247
|
+
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
|
|
248
|
+
],
|
|
249
|
+
str,
|
|
250
|
+
]
|
|
251
|
+
|
|
252
|
+
operation_metadata: Union[Dict[str, object], str]
|
|
253
|
+
|
|
254
|
+
overrides: EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
|
|
255
|
+
"""Execution override options for agentic applications"""
|
|
256
|
+
|
|
257
|
+
|
|
258
|
+
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
|
|
259
|
+
configuration: Required[EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration]
|
|
260
|
+
|
|
261
|
+
alias: str
|
|
262
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
263
|
+
|
|
264
|
+
task_type: Literal["application_variant"]
|
|
265
|
+
|
|
266
|
+
|
|
267
|
+
# A standalone-request task is one of three shapes: chat completion,
# generic inference, or application variant.
EvaluationStandaloneCreateRequestTask: TypeAlias = Union[
    EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest,
    EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest,
    EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
]
|
|
272
|
+
|
|
273
|
+
|
|
274
|
+
class EvaluationFromDatasetCreateRequest(TypedDict, total=False):
|
|
275
|
+
data: Required[Iterable[EvaluationFromDatasetCreateRequestData]]
|
|
276
|
+
"""Items to be evaluated, including references to the input dataset items"""
|
|
277
|
+
|
|
278
|
+
dataset_id: Required[str]
|
|
279
|
+
"""The ID of the dataset containing the items referenced by the `data` field"""
|
|
280
|
+
|
|
281
|
+
name: Required[str]
|
|
282
|
+
|
|
283
|
+
description: str
|
|
284
|
+
|
|
285
|
+
tasks: Iterable[EvaluationFromDatasetCreateRequestTask]
|
|
286
|
+
"""Tasks allow you to augment and evaluate your data"""
|
|
287
|
+
|
|
288
|
+
|
|
289
|
+
class EvaluationFromDatasetCreateRequestDataTyped(TypedDict, total=False):
|
|
290
|
+
dataset_item_id: Required[str]
|
|
291
|
+
|
|
292
|
+
|
|
293
|
+
EvaluationFromDatasetCreateRequestData: TypeAlias = Union[
|
|
294
|
+
EvaluationFromDatasetCreateRequestDataTyped, Dict[str, object]
|
|
295
|
+
]
|
|
296
|
+
|
|
297
|
+
|
|
298
|
+
class EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
|
|
299
|
+
TypedDict, total=False
|
|
300
|
+
):
|
|
301
|
+
messages: Required[Union[Iterable[Dict[str, object]], str]]
|
|
302
|
+
|
|
303
|
+
model: Required[str]
|
|
304
|
+
|
|
305
|
+
audio: Union[Dict[str, object], str]
|
|
306
|
+
|
|
307
|
+
frequency_penalty: Union[float, str]
|
|
308
|
+
|
|
309
|
+
function_call: Union[Dict[str, object], str]
|
|
310
|
+
|
|
311
|
+
functions: Union[Iterable[Dict[str, object]], str]
|
|
312
|
+
|
|
313
|
+
logit_bias: Union[Dict[str, int], str]
|
|
314
|
+
|
|
315
|
+
logprobs: Union[bool, str]
|
|
316
|
+
|
|
317
|
+
max_completion_tokens: Union[int, str]
|
|
318
|
+
|
|
319
|
+
max_tokens: Union[int, str]
|
|
320
|
+
|
|
321
|
+
metadata: Union[Dict[str, str], str]
|
|
322
|
+
|
|
323
|
+
modalities: Union[List[str], str]
|
|
324
|
+
|
|
325
|
+
n: Union[int, str]
|
|
326
|
+
|
|
327
|
+
parallel_tool_calls: Union[bool, str]
|
|
328
|
+
|
|
329
|
+
prediction: Union[Dict[str, object], str]
|
|
330
|
+
|
|
331
|
+
presence_penalty: Union[float, str]
|
|
332
|
+
|
|
333
|
+
reasoning_effort: str
|
|
334
|
+
|
|
335
|
+
response_format: Union[Dict[str, object], str]
|
|
336
|
+
|
|
337
|
+
seed: Union[int, str]
|
|
338
|
+
|
|
339
|
+
stop: str
|
|
340
|
+
|
|
341
|
+
store: Union[bool, str]
|
|
342
|
+
|
|
343
|
+
temperature: Union[float, str]
|
|
344
|
+
|
|
345
|
+
tool_choice: str
|
|
346
|
+
|
|
347
|
+
tools: Union[Iterable[Dict[str, object]], str]
|
|
348
|
+
|
|
349
|
+
top_k: Union[int, str]
|
|
350
|
+
|
|
351
|
+
top_logprobs: Union[int, str]
|
|
352
|
+
|
|
353
|
+
top_p: Union[float, str]
|
|
354
|
+
|
|
355
|
+
|
|
356
|
+
EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
|
|
357
|
+
EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
|
|
358
|
+
]
|
|
359
|
+
|
|
360
|
+
|
|
361
|
+
class EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
|
|
362
|
+
configuration: Required[EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
|
|
363
|
+
|
|
364
|
+
alias: str
|
|
365
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
366
|
+
|
|
367
|
+
task_type: Literal["chat_completion"]
|
|
368
|
+
|
|
369
|
+
|
|
370
|
+
class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
|
|
371
|
+
TypedDict, total=False
|
|
372
|
+
):
|
|
373
|
+
num_retries: int
|
|
374
|
+
|
|
375
|
+
timeout_seconds: int
|
|
376
|
+
|
|
377
|
+
|
|
378
|
+
EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
|
|
379
|
+
EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
|
|
380
|
+
str,
|
|
381
|
+
]
|
|
382
|
+
|
|
383
|
+
|
|
384
|
+
class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
|
|
385
|
+
model: Required[str]
|
|
386
|
+
|
|
387
|
+
args: Union[Dict[str, object], str]
|
|
388
|
+
|
|
389
|
+
inference_configuration: (
|
|
390
|
+
EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
|
|
391
|
+
)
|
|
392
|
+
|
|
393
|
+
|
|
394
|
+
class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
|
|
395
|
+
configuration: Required[EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
|
|
396
|
+
|
|
397
|
+
alias: str
|
|
398
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
399
|
+
|
|
400
|
+
task_type: Literal["inference"]
|
|
401
|
+
|
|
402
|
+
|
|
403
|
+
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
|
|
404
|
+
TypedDict, total=False
|
|
405
|
+
):
|
|
406
|
+
request: Required[str]
|
|
407
|
+
"""Request inputs"""
|
|
408
|
+
|
|
409
|
+
response: Required[str]
|
|
410
|
+
"""Response outputs"""
|
|
411
|
+
|
|
412
|
+
session_data: Dict[str, object]
|
|
413
|
+
"""Session data corresponding to the request response pair"""
|
|
414
|
+
|
|
415
|
+
|
|
416
|
+
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
|
|
417
|
+
TypedDict, total=False
|
|
418
|
+
):
|
|
419
|
+
current_node: Required[str]
|
|
420
|
+
|
|
421
|
+
state: Required[Dict[str, object]]
|
|
422
|
+
|
|
423
|
+
|
|
424
|
+
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
|
|
425
|
+
TypedDict, total=False
|
|
426
|
+
):
|
|
427
|
+
duration_ms: Required[int]
|
|
428
|
+
|
|
429
|
+
node_id: Required[str]
|
|
430
|
+
|
|
431
|
+
operation_input: Required[str]
|
|
432
|
+
|
|
433
|
+
operation_output: Required[str]
|
|
434
|
+
|
|
435
|
+
operation_type: Required[str]
|
|
436
|
+
|
|
437
|
+
start_timestamp: Required[str]
|
|
438
|
+
|
|
439
|
+
workflow_id: Required[str]
|
|
440
|
+
|
|
441
|
+
operation_metadata: Dict[str, object]
|
|
442
|
+
|
|
443
|
+
|
|
444
|
+
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
|
|
445
|
+
TypedDict, total=False
|
|
446
|
+
):
|
|
447
|
+
concurrent: bool
|
|
448
|
+
|
|
449
|
+
initial_state: EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
|
|
450
|
+
|
|
451
|
+
partial_trace: Iterable[
|
|
452
|
+
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
|
|
453
|
+
]
|
|
454
|
+
|
|
455
|
+
use_channels: bool
|
|
456
|
+
|
|
457
|
+
|
|
458
|
+
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
|
|
459
|
+
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
|
|
460
|
+
str,
|
|
461
|
+
]
|
|
462
|
+
|
|
463
|
+
|
|
464
|
+
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
|
|
465
|
+
TypedDict, total=False
|
|
466
|
+
):
|
|
467
|
+
application_variant_id: Required[str]
|
|
468
|
+
|
|
469
|
+
inputs: Required[Union[Dict[str, object], str]]
|
|
470
|
+
|
|
471
|
+
history: Union[
|
|
472
|
+
Iterable[
|
|
473
|
+
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
|
|
474
|
+
],
|
|
475
|
+
str,
|
|
476
|
+
]
|
|
477
|
+
|
|
478
|
+
operation_metadata: Union[Dict[str, object], str]
|
|
479
|
+
|
|
480
|
+
overrides: EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
|
|
481
|
+
"""Execution override options for agentic applications"""
|
|
482
|
+
|
|
483
|
+
|
|
484
|
+
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
|
|
485
|
+
configuration: Required[
|
|
486
|
+
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration
|
|
487
|
+
]
|
|
488
|
+
|
|
489
|
+
alias: str
|
|
490
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
491
|
+
|
|
492
|
+
task_type: Literal["application_variant"]
|
|
493
|
+
|
|
494
|
+
|
|
495
|
+
# A from-dataset-request task is one of three shapes: chat completion,
# generic inference, or application variant.
EvaluationFromDatasetCreateRequestTask: TypeAlias = Union[
    EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest,
    EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest,
    EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
]
|
|
500
|
+
|
|
501
|
+
|
|
502
|
+
class EvaluationWithDatasetCreateRequest(TypedDict, total=False):
|
|
503
|
+
data: Required[Iterable[Dict[str, object]]]
|
|
504
|
+
"""Items to be evaluated"""
|
|
505
|
+
|
|
506
|
+
dataset: Required[EvaluationWithDatasetCreateRequestDataset]
|
|
507
|
+
"""Create a reusable dataset from items in the `data` field"""
|
|
508
|
+
|
|
509
|
+
name: Required[str]
|
|
510
|
+
|
|
511
|
+
description: str
|
|
512
|
+
|
|
513
|
+
tasks: Iterable[EvaluationWithDatasetCreateRequestTask]
|
|
514
|
+
"""Tasks allow you to augment and evaluate your data"""
|
|
515
|
+
|
|
516
|
+
|
|
517
|
+
class EvaluationWithDatasetCreateRequestDataset(TypedDict, total=False):
|
|
518
|
+
name: Required[str]
|
|
519
|
+
|
|
520
|
+
description: str
|
|
521
|
+
|
|
522
|
+
keys: List[str]
|
|
523
|
+
"""Keys from items in the `data` field that should be included in the dataset.
|
|
524
|
+
|
|
525
|
+
If not provided, all keys will be included.
|
|
526
|
+
"""
|
|
527
|
+
|
|
528
|
+
|
|
529
|
+
class EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
|
|
530
|
+
TypedDict, total=False
|
|
531
|
+
):
|
|
532
|
+
messages: Required[Union[Iterable[Dict[str, object]], str]]
|
|
533
|
+
|
|
534
|
+
model: Required[str]
|
|
535
|
+
|
|
536
|
+
audio: Union[Dict[str, object], str]
|
|
537
|
+
|
|
538
|
+
frequency_penalty: Union[float, str]
|
|
539
|
+
|
|
540
|
+
function_call: Union[Dict[str, object], str]
|
|
541
|
+
|
|
542
|
+
functions: Union[Iterable[Dict[str, object]], str]
|
|
543
|
+
|
|
544
|
+
logit_bias: Union[Dict[str, int], str]
|
|
545
|
+
|
|
546
|
+
logprobs: Union[bool, str]
|
|
547
|
+
|
|
548
|
+
max_completion_tokens: Union[int, str]
|
|
549
|
+
|
|
550
|
+
max_tokens: Union[int, str]
|
|
551
|
+
|
|
552
|
+
metadata: Union[Dict[str, str], str]
|
|
553
|
+
|
|
554
|
+
modalities: Union[List[str], str]
|
|
555
|
+
|
|
556
|
+
n: Union[int, str]
|
|
557
|
+
|
|
558
|
+
parallel_tool_calls: Union[bool, str]
|
|
559
|
+
|
|
560
|
+
prediction: Union[Dict[str, object], str]
|
|
561
|
+
|
|
562
|
+
presence_penalty: Union[float, str]
|
|
563
|
+
|
|
564
|
+
reasoning_effort: str
|
|
565
|
+
|
|
566
|
+
response_format: Union[Dict[str, object], str]
|
|
567
|
+
|
|
568
|
+
seed: Union[int, str]
|
|
569
|
+
|
|
570
|
+
stop: str
|
|
571
|
+
|
|
572
|
+
store: Union[bool, str]
|
|
573
|
+
|
|
574
|
+
temperature: Union[float, str]
|
|
575
|
+
|
|
576
|
+
tool_choice: str
|
|
577
|
+
|
|
578
|
+
tools: Union[Iterable[Dict[str, object]], str]
|
|
579
|
+
|
|
580
|
+
top_k: Union[int, str]
|
|
581
|
+
|
|
582
|
+
top_logprobs: Union[int, str]
|
|
583
|
+
|
|
584
|
+
top_p: Union[float, str]
|
|
585
|
+
|
|
586
|
+
|
|
587
|
+
EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
|
|
588
|
+
EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
|
|
589
|
+
]
|
|
590
|
+
|
|
591
|
+
|
|
592
|
+
class EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
|
|
593
|
+
configuration: Required[EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
|
|
594
|
+
|
|
595
|
+
alias: str
|
|
596
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
597
|
+
|
|
598
|
+
task_type: Literal["chat_completion"]
|
|
599
|
+
|
|
600
|
+
|
|
601
|
+
class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
|
|
602
|
+
TypedDict, total=False
|
|
603
|
+
):
|
|
604
|
+
num_retries: int
|
|
605
|
+
|
|
606
|
+
timeout_seconds: int
|
|
607
|
+
|
|
608
|
+
|
|
609
|
+
EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
|
|
610
|
+
EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
|
|
611
|
+
str,
|
|
612
|
+
]
|
|
613
|
+
|
|
614
|
+
|
|
615
|
+
class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
|
|
616
|
+
model: Required[str]
|
|
617
|
+
|
|
618
|
+
args: Union[Dict[str, object], str]
|
|
619
|
+
|
|
620
|
+
inference_configuration: (
|
|
621
|
+
EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
|
|
622
|
+
)
|
|
623
|
+
|
|
624
|
+
|
|
625
|
+
class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
|
|
626
|
+
configuration: Required[EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
|
|
627
|
+
|
|
628
|
+
alias: str
|
|
629
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
630
|
+
|
|
631
|
+
task_type: Literal["inference"]
|
|
632
|
+
|
|
633
|
+
|
|
634
|
+
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
|
|
635
|
+
TypedDict, total=False
|
|
636
|
+
):
|
|
637
|
+
request: Required[str]
|
|
638
|
+
"""Request inputs"""
|
|
639
|
+
|
|
640
|
+
response: Required[str]
|
|
641
|
+
"""Response outputs"""
|
|
642
|
+
|
|
643
|
+
session_data: Dict[str, object]
|
|
644
|
+
"""Session data corresponding to the request response pair"""
|
|
645
|
+
|
|
646
|
+
|
|
647
|
+
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
|
|
648
|
+
TypedDict, total=False
|
|
649
|
+
):
|
|
650
|
+
current_node: Required[str]
|
|
651
|
+
|
|
652
|
+
state: Required[Dict[str, object]]
|
|
653
|
+
|
|
654
|
+
|
|
655
|
+
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
|
|
656
|
+
TypedDict, total=False
|
|
657
|
+
):
|
|
658
|
+
duration_ms: Required[int]
|
|
659
|
+
|
|
660
|
+
node_id: Required[str]
|
|
661
|
+
|
|
662
|
+
operation_input: Required[str]
|
|
663
|
+
|
|
664
|
+
operation_output: Required[str]
|
|
665
|
+
|
|
666
|
+
operation_type: Required[str]
|
|
667
|
+
|
|
668
|
+
start_timestamp: Required[str]
|
|
669
|
+
|
|
670
|
+
workflow_id: Required[str]
|
|
671
|
+
|
|
672
|
+
operation_metadata: Dict[str, object]
|
|
673
|
+
|
|
674
|
+
|
|
675
|
+
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
|
|
676
|
+
TypedDict, total=False
|
|
677
|
+
):
|
|
678
|
+
concurrent: bool
|
|
679
|
+
|
|
680
|
+
initial_state: EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
|
|
681
|
+
|
|
682
|
+
partial_trace: Iterable[
|
|
683
|
+
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
|
|
684
|
+
]
|
|
685
|
+
|
|
686
|
+
use_channels: bool
|
|
687
|
+
|
|
688
|
+
|
|
689
|
+
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
|
|
690
|
+
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
|
|
691
|
+
str,
|
|
692
|
+
]
|
|
693
|
+
|
|
694
|
+
|
|
695
|
+
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
|
|
696
|
+
TypedDict, total=False
|
|
697
|
+
):
|
|
698
|
+
application_variant_id: Required[str]
|
|
699
|
+
|
|
700
|
+
inputs: Required[Union[Dict[str, object], str]]
|
|
701
|
+
|
|
702
|
+
history: Union[
|
|
703
|
+
Iterable[
|
|
704
|
+
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
|
|
705
|
+
],
|
|
706
|
+
str,
|
|
707
|
+
]
|
|
708
|
+
|
|
709
|
+
operation_metadata: Union[Dict[str, object], str]
|
|
710
|
+
|
|
711
|
+
overrides: EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
|
|
712
|
+
"""Execution override options for agentic applications"""
|
|
713
|
+
|
|
714
|
+
|
|
715
|
+
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
|
|
716
|
+
configuration: Required[
|
|
717
|
+
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration
|
|
718
|
+
]
|
|
719
|
+
|
|
720
|
+
alias: str
|
|
721
|
+
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
722
|
+
|
|
723
|
+
task_type: Literal["application_variant"]
|
|
724
|
+
|
|
725
|
+
|
|
726
|
+
# A with-dataset-request task is one of three shapes: chat completion,
# generic inference, or application variant.
EvaluationWithDatasetCreateRequestTask: TypeAlias = Union[
    EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest,
    EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest,
    EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
]
|
|
731
|
+
|
|
732
|
+
# Top-level create-evaluation params: exactly one of the three request
# variants defined in this module (standalone, from-dataset, with-dataset).
EvaluationCreateParams: TypeAlias = Union[
    EvaluationStandaloneCreateRequest, EvaluationFromDatasetCreateRequest, EvaluationWithDatasetCreateRequest
]
|