scale-gp-beta 0.1.0a7__py3-none-any.whl → 0.1.0a9__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- scale_gp_beta/_version.py +1 -1
- scale_gp_beta/resources/evaluations.py +27 -12
- scale_gp_beta/types/__init__.py +2 -0
- scale_gp_beta/types/evaluation.py +4 -0
- scale_gp_beta/types/evaluation_create_params.py +6 -655
- scale_gp_beta/types/evaluation_list_params.py +4 -2
- scale_gp_beta/types/evaluation_retrieve_params.py +4 -1
- scale_gp_beta/types/evaluation_task.py +205 -0
- scale_gp_beta/types/evaluation_task_param.py +206 -0
- {scale_gp_beta-0.1.0a7.dist-info → scale_gp_beta-0.1.0a9.dist-info}/METADATA +1 -1
- {scale_gp_beta-0.1.0a7.dist-info → scale_gp_beta-0.1.0a9.dist-info}/RECORD +13 -11
- {scale_gp_beta-0.1.0a7.dist-info → scale_gp_beta-0.1.0a9.dist-info}/WHEEL +0 -0
- {scale_gp_beta-0.1.0a7.dist-info → scale_gp_beta-0.1.0a9.dist-info}/licenses/LICENSE +0 -0
|
@@ -3,57 +3,17 @@
|
|
|
3
3
|
from __future__ import annotations
|
|
4
4
|
|
|
5
5
|
from typing import Dict, List, Union, Iterable
|
|
6
|
-
from typing_extensions import Literal, Required, TypeAlias, TypedDict
|
|
6
|
+
from typing_extensions import Required, TypeAlias, TypedDict
|
|
7
|
+
|
|
8
|
+
from .evaluation_task_param import EvaluationTaskParam
|
|
7
9
|
|
|
8
10
|
__all__ = [
|
|
9
11
|
"EvaluationCreateParams",
|
|
10
12
|
"EvaluationStandaloneCreateRequest",
|
|
11
|
-
"EvaluationStandaloneCreateRequestTask",
|
|
12
|
-
"EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest",
|
|
13
|
-
"EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
|
|
14
|
-
"EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest",
|
|
15
|
-
"EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
|
|
16
|
-
"EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
|
|
17
|
-
"EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
|
|
18
|
-
"EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
|
|
19
|
-
"EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
|
|
20
|
-
"EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
|
|
21
|
-
"EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
|
|
22
|
-
"EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
|
|
23
|
-
"EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
|
|
24
|
-
"EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
|
|
25
13
|
"EvaluationFromDatasetCreateRequest",
|
|
26
14
|
"EvaluationFromDatasetCreateRequestData",
|
|
27
|
-
"EvaluationFromDatasetCreateRequestTask",
|
|
28
|
-
"EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest",
|
|
29
|
-
"EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
|
|
30
|
-
"EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest",
|
|
31
|
-
"EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
|
|
32
|
-
"EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
|
|
33
|
-
"EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
|
|
34
|
-
"EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
|
|
35
|
-
"EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
|
|
36
|
-
"EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
|
|
37
|
-
"EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
|
|
38
|
-
"EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
|
|
39
|
-
"EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
|
|
40
|
-
"EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
|
|
41
15
|
"EvaluationWithDatasetCreateRequest",
|
|
42
16
|
"EvaluationWithDatasetCreateRequestDataset",
|
|
43
|
-
"EvaluationWithDatasetCreateRequestTask",
|
|
44
|
-
"EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest",
|
|
45
|
-
"EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration",
|
|
46
|
-
"EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest",
|
|
47
|
-
"EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration",
|
|
48
|
-
"EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration",
|
|
49
|
-
"EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration",
|
|
50
|
-
"EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest",
|
|
51
|
-
"EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration",
|
|
52
|
-
"EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0",
|
|
53
|
-
"EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides",
|
|
54
|
-
"EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides",
|
|
55
|
-
"EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState",
|
|
56
|
-
"EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace",
|
|
57
17
|
]
|
|
58
18
|
|
|
59
19
|
|
|
@@ -65,212 +25,10 @@ class EvaluationStandaloneCreateRequest(TypedDict, total=False):
|
|
|
65
25
|
|
|
66
26
|
description: str
|
|
67
27
|
|
|
68
|
-
tasks: Iterable[EvaluationStandaloneCreateRequestTask]
|
|
28
|
+
tasks: Iterable[EvaluationTaskParam]
|
|
69
29
|
"""Tasks allow you to augment and evaluate your data"""
|
|
70
30
|
|
|
71
31
|
|
|
72
|
-
class EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
|
|
73
|
-
TypedDict, total=False
|
|
74
|
-
):
|
|
75
|
-
messages: Required[Union[Iterable[Dict[str, object]], str]]
|
|
76
|
-
|
|
77
|
-
model: Required[str]
|
|
78
|
-
|
|
79
|
-
audio: Union[Dict[str, object], str]
|
|
80
|
-
|
|
81
|
-
frequency_penalty: Union[float, str]
|
|
82
|
-
|
|
83
|
-
function_call: Union[Dict[str, object], str]
|
|
84
|
-
|
|
85
|
-
functions: Union[Iterable[Dict[str, object]], str]
|
|
86
|
-
|
|
87
|
-
logit_bias: Union[Dict[str, int], str]
|
|
88
|
-
|
|
89
|
-
logprobs: Union[bool, str]
|
|
90
|
-
|
|
91
|
-
max_completion_tokens: Union[int, str]
|
|
92
|
-
|
|
93
|
-
max_tokens: Union[int, str]
|
|
94
|
-
|
|
95
|
-
metadata: Union[Dict[str, str], str]
|
|
96
|
-
|
|
97
|
-
modalities: Union[List[str], str]
|
|
98
|
-
|
|
99
|
-
n: Union[int, str]
|
|
100
|
-
|
|
101
|
-
parallel_tool_calls: Union[bool, str]
|
|
102
|
-
|
|
103
|
-
prediction: Union[Dict[str, object], str]
|
|
104
|
-
|
|
105
|
-
presence_penalty: Union[float, str]
|
|
106
|
-
|
|
107
|
-
reasoning_effort: str
|
|
108
|
-
|
|
109
|
-
response_format: Union[Dict[str, object], str]
|
|
110
|
-
|
|
111
|
-
seed: Union[int, str]
|
|
112
|
-
|
|
113
|
-
stop: str
|
|
114
|
-
|
|
115
|
-
store: Union[bool, str]
|
|
116
|
-
|
|
117
|
-
temperature: Union[float, str]
|
|
118
|
-
|
|
119
|
-
tool_choice: str
|
|
120
|
-
|
|
121
|
-
tools: Union[Iterable[Dict[str, object]], str]
|
|
122
|
-
|
|
123
|
-
top_k: Union[int, str]
|
|
124
|
-
|
|
125
|
-
top_logprobs: Union[int, str]
|
|
126
|
-
|
|
127
|
-
top_p: Union[float, str]
|
|
128
|
-
|
|
129
|
-
|
|
130
|
-
EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
|
|
131
|
-
EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
|
|
132
|
-
]
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
class EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
|
|
136
|
-
configuration: Required[EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
|
|
137
|
-
|
|
138
|
-
alias: str
|
|
139
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
140
|
-
|
|
141
|
-
task_type: Literal["chat_completion"]
|
|
142
|
-
|
|
143
|
-
|
|
144
|
-
class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
|
|
145
|
-
TypedDict, total=False
|
|
146
|
-
):
|
|
147
|
-
num_retries: int
|
|
148
|
-
|
|
149
|
-
timeout_seconds: int
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
|
|
153
|
-
EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
|
|
154
|
-
str,
|
|
155
|
-
]
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
|
|
159
|
-
model: Required[str]
|
|
160
|
-
|
|
161
|
-
args: Union[Dict[str, object], str]
|
|
162
|
-
|
|
163
|
-
inference_configuration: (
|
|
164
|
-
EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
|
|
165
|
-
)
|
|
166
|
-
|
|
167
|
-
|
|
168
|
-
class EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
|
|
169
|
-
configuration: Required[EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
|
|
170
|
-
|
|
171
|
-
alias: str
|
|
172
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
173
|
-
|
|
174
|
-
task_type: Literal["inference"]
|
|
175
|
-
|
|
176
|
-
|
|
177
|
-
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
|
|
178
|
-
TypedDict, total=False
|
|
179
|
-
):
|
|
180
|
-
request: Required[str]
|
|
181
|
-
"""Request inputs"""
|
|
182
|
-
|
|
183
|
-
response: Required[str]
|
|
184
|
-
"""Response outputs"""
|
|
185
|
-
|
|
186
|
-
session_data: Dict[str, object]
|
|
187
|
-
"""Session data corresponding to the request response pair"""
|
|
188
|
-
|
|
189
|
-
|
|
190
|
-
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
|
|
191
|
-
TypedDict, total=False
|
|
192
|
-
):
|
|
193
|
-
current_node: Required[str]
|
|
194
|
-
|
|
195
|
-
state: Required[Dict[str, object]]
|
|
196
|
-
|
|
197
|
-
|
|
198
|
-
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
|
|
199
|
-
TypedDict, total=False
|
|
200
|
-
):
|
|
201
|
-
duration_ms: Required[int]
|
|
202
|
-
|
|
203
|
-
node_id: Required[str]
|
|
204
|
-
|
|
205
|
-
operation_input: Required[str]
|
|
206
|
-
|
|
207
|
-
operation_output: Required[str]
|
|
208
|
-
|
|
209
|
-
operation_type: Required[str]
|
|
210
|
-
|
|
211
|
-
start_timestamp: Required[str]
|
|
212
|
-
|
|
213
|
-
workflow_id: Required[str]
|
|
214
|
-
|
|
215
|
-
operation_metadata: Dict[str, object]
|
|
216
|
-
|
|
217
|
-
|
|
218
|
-
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
|
|
219
|
-
TypedDict, total=False
|
|
220
|
-
):
|
|
221
|
-
concurrent: bool
|
|
222
|
-
|
|
223
|
-
initial_state: EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
|
|
224
|
-
|
|
225
|
-
partial_trace: Iterable[
|
|
226
|
-
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
|
|
227
|
-
]
|
|
228
|
-
|
|
229
|
-
use_channels: bool
|
|
230
|
-
|
|
231
|
-
|
|
232
|
-
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
|
|
233
|
-
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
|
|
234
|
-
str,
|
|
235
|
-
]
|
|
236
|
-
|
|
237
|
-
|
|
238
|
-
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
|
|
239
|
-
TypedDict, total=False
|
|
240
|
-
):
|
|
241
|
-
application_variant_id: Required[str]
|
|
242
|
-
|
|
243
|
-
inputs: Required[Union[Dict[str, object], str]]
|
|
244
|
-
|
|
245
|
-
history: Union[
|
|
246
|
-
Iterable[
|
|
247
|
-
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
|
|
248
|
-
],
|
|
249
|
-
str,
|
|
250
|
-
]
|
|
251
|
-
|
|
252
|
-
operation_metadata: Union[Dict[str, object], str]
|
|
253
|
-
|
|
254
|
-
overrides: EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
|
|
255
|
-
"""Execution override options for agentic applications"""
|
|
256
|
-
|
|
257
|
-
|
|
258
|
-
class EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
|
|
259
|
-
configuration: Required[EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration]
|
|
260
|
-
|
|
261
|
-
alias: str
|
|
262
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
263
|
-
|
|
264
|
-
task_type: Literal["application_variant"]
|
|
265
|
-
|
|
266
|
-
|
|
267
|
-
EvaluationStandaloneCreateRequestTask: TypeAlias = Union[
|
|
268
|
-
EvaluationStandaloneCreateRequestTaskChatCompletionEvaluationTaskRequest,
|
|
269
|
-
EvaluationStandaloneCreateRequestTaskGenericInferenceEvaluationTaskRequest,
|
|
270
|
-
EvaluationStandaloneCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
|
|
271
|
-
]
|
|
272
|
-
|
|
273
|
-
|
|
274
32
|
class EvaluationFromDatasetCreateRequest(TypedDict, total=False):
|
|
275
33
|
dataset_id: Required[str]
|
|
276
34
|
"""The ID of the dataset containing the items referenced by the `data` field"""
|
|
@@ -282,7 +40,7 @@ class EvaluationFromDatasetCreateRequest(TypedDict, total=False):
|
|
|
282
40
|
|
|
283
41
|
description: str
|
|
284
42
|
|
|
285
|
-
tasks: Iterable[EvaluationFromDatasetCreateRequestTask]
|
|
43
|
+
tasks: Iterable[EvaluationTaskParam]
|
|
286
44
|
"""Tasks allow you to augment and evaluate your data"""
|
|
287
45
|
|
|
288
46
|
|
|
@@ -295,210 +53,6 @@ EvaluationFromDatasetCreateRequestData: TypeAlias = Union[
|
|
|
295
53
|
]
|
|
296
54
|
|
|
297
55
|
|
|
298
|
-
class EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
|
|
299
|
-
TypedDict, total=False
|
|
300
|
-
):
|
|
301
|
-
messages: Required[Union[Iterable[Dict[str, object]], str]]
|
|
302
|
-
|
|
303
|
-
model: Required[str]
|
|
304
|
-
|
|
305
|
-
audio: Union[Dict[str, object], str]
|
|
306
|
-
|
|
307
|
-
frequency_penalty: Union[float, str]
|
|
308
|
-
|
|
309
|
-
function_call: Union[Dict[str, object], str]
|
|
310
|
-
|
|
311
|
-
functions: Union[Iterable[Dict[str, object]], str]
|
|
312
|
-
|
|
313
|
-
logit_bias: Union[Dict[str, int], str]
|
|
314
|
-
|
|
315
|
-
logprobs: Union[bool, str]
|
|
316
|
-
|
|
317
|
-
max_completion_tokens: Union[int, str]
|
|
318
|
-
|
|
319
|
-
max_tokens: Union[int, str]
|
|
320
|
-
|
|
321
|
-
metadata: Union[Dict[str, str], str]
|
|
322
|
-
|
|
323
|
-
modalities: Union[List[str], str]
|
|
324
|
-
|
|
325
|
-
n: Union[int, str]
|
|
326
|
-
|
|
327
|
-
parallel_tool_calls: Union[bool, str]
|
|
328
|
-
|
|
329
|
-
prediction: Union[Dict[str, object], str]
|
|
330
|
-
|
|
331
|
-
presence_penalty: Union[float, str]
|
|
332
|
-
|
|
333
|
-
reasoning_effort: str
|
|
334
|
-
|
|
335
|
-
response_format: Union[Dict[str, object], str]
|
|
336
|
-
|
|
337
|
-
seed: Union[int, str]
|
|
338
|
-
|
|
339
|
-
stop: str
|
|
340
|
-
|
|
341
|
-
store: Union[bool, str]
|
|
342
|
-
|
|
343
|
-
temperature: Union[float, str]
|
|
344
|
-
|
|
345
|
-
tool_choice: str
|
|
346
|
-
|
|
347
|
-
tools: Union[Iterable[Dict[str, object]], str]
|
|
348
|
-
|
|
349
|
-
top_k: Union[int, str]
|
|
350
|
-
|
|
351
|
-
top_logprobs: Union[int, str]
|
|
352
|
-
|
|
353
|
-
top_p: Union[float, str]
|
|
354
|
-
|
|
355
|
-
|
|
356
|
-
EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
|
|
357
|
-
EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
|
|
358
|
-
]
|
|
359
|
-
|
|
360
|
-
|
|
361
|
-
class EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
|
|
362
|
-
configuration: Required[EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
|
|
363
|
-
|
|
364
|
-
alias: str
|
|
365
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
366
|
-
|
|
367
|
-
task_type: Literal["chat_completion"]
|
|
368
|
-
|
|
369
|
-
|
|
370
|
-
class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
|
|
371
|
-
TypedDict, total=False
|
|
372
|
-
):
|
|
373
|
-
num_retries: int
|
|
374
|
-
|
|
375
|
-
timeout_seconds: int
|
|
376
|
-
|
|
377
|
-
|
|
378
|
-
EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
|
|
379
|
-
EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
|
|
380
|
-
str,
|
|
381
|
-
]
|
|
382
|
-
|
|
383
|
-
|
|
384
|
-
class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
|
|
385
|
-
model: Required[str]
|
|
386
|
-
|
|
387
|
-
args: Union[Dict[str, object], str]
|
|
388
|
-
|
|
389
|
-
inference_configuration: (
|
|
390
|
-
EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
|
|
391
|
-
)
|
|
392
|
-
|
|
393
|
-
|
|
394
|
-
class EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
|
|
395
|
-
configuration: Required[EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
|
|
396
|
-
|
|
397
|
-
alias: str
|
|
398
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
399
|
-
|
|
400
|
-
task_type: Literal["inference"]
|
|
401
|
-
|
|
402
|
-
|
|
403
|
-
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
|
|
404
|
-
TypedDict, total=False
|
|
405
|
-
):
|
|
406
|
-
request: Required[str]
|
|
407
|
-
"""Request inputs"""
|
|
408
|
-
|
|
409
|
-
response: Required[str]
|
|
410
|
-
"""Response outputs"""
|
|
411
|
-
|
|
412
|
-
session_data: Dict[str, object]
|
|
413
|
-
"""Session data corresponding to the request response pair"""
|
|
414
|
-
|
|
415
|
-
|
|
416
|
-
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
|
|
417
|
-
TypedDict, total=False
|
|
418
|
-
):
|
|
419
|
-
current_node: Required[str]
|
|
420
|
-
|
|
421
|
-
state: Required[Dict[str, object]]
|
|
422
|
-
|
|
423
|
-
|
|
424
|
-
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
|
|
425
|
-
TypedDict, total=False
|
|
426
|
-
):
|
|
427
|
-
duration_ms: Required[int]
|
|
428
|
-
|
|
429
|
-
node_id: Required[str]
|
|
430
|
-
|
|
431
|
-
operation_input: Required[str]
|
|
432
|
-
|
|
433
|
-
operation_output: Required[str]
|
|
434
|
-
|
|
435
|
-
operation_type: Required[str]
|
|
436
|
-
|
|
437
|
-
start_timestamp: Required[str]
|
|
438
|
-
|
|
439
|
-
workflow_id: Required[str]
|
|
440
|
-
|
|
441
|
-
operation_metadata: Dict[str, object]
|
|
442
|
-
|
|
443
|
-
|
|
444
|
-
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
|
|
445
|
-
TypedDict, total=False
|
|
446
|
-
):
|
|
447
|
-
concurrent: bool
|
|
448
|
-
|
|
449
|
-
initial_state: EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
|
|
450
|
-
|
|
451
|
-
partial_trace: Iterable[
|
|
452
|
-
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
|
|
453
|
-
]
|
|
454
|
-
|
|
455
|
-
use_channels: bool
|
|
456
|
-
|
|
457
|
-
|
|
458
|
-
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
|
|
459
|
-
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
|
|
460
|
-
str,
|
|
461
|
-
]
|
|
462
|
-
|
|
463
|
-
|
|
464
|
-
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
|
|
465
|
-
TypedDict, total=False
|
|
466
|
-
):
|
|
467
|
-
application_variant_id: Required[str]
|
|
468
|
-
|
|
469
|
-
inputs: Required[Union[Dict[str, object], str]]
|
|
470
|
-
|
|
471
|
-
history: Union[
|
|
472
|
-
Iterable[
|
|
473
|
-
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
|
|
474
|
-
],
|
|
475
|
-
str,
|
|
476
|
-
]
|
|
477
|
-
|
|
478
|
-
operation_metadata: Union[Dict[str, object], str]
|
|
479
|
-
|
|
480
|
-
overrides: EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
|
|
481
|
-
"""Execution override options for agentic applications"""
|
|
482
|
-
|
|
483
|
-
|
|
484
|
-
class EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
|
|
485
|
-
configuration: Required[
|
|
486
|
-
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration
|
|
487
|
-
]
|
|
488
|
-
|
|
489
|
-
alias: str
|
|
490
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
491
|
-
|
|
492
|
-
task_type: Literal["application_variant"]
|
|
493
|
-
|
|
494
|
-
|
|
495
|
-
EvaluationFromDatasetCreateRequestTask: TypeAlias = Union[
|
|
496
|
-
EvaluationFromDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest,
|
|
497
|
-
EvaluationFromDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest,
|
|
498
|
-
EvaluationFromDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
|
|
499
|
-
]
|
|
500
|
-
|
|
501
|
-
|
|
502
56
|
class EvaluationWithDatasetCreateRequest(TypedDict, total=False):
|
|
503
57
|
data: Required[Iterable[Dict[str, object]]]
|
|
504
58
|
"""Items to be evaluated"""
|
|
@@ -510,7 +64,7 @@ class EvaluationWithDatasetCreateRequest(TypedDict, total=False):
|
|
|
510
64
|
|
|
511
65
|
description: str
|
|
512
66
|
|
|
513
|
-
tasks: Iterable[EvaluationWithDatasetCreateRequestTask]
|
|
67
|
+
tasks: Iterable[EvaluationTaskParam]
|
|
514
68
|
"""Tasks allow you to augment and evaluate your data"""
|
|
515
69
|
|
|
516
70
|
|
|
@@ -526,209 +80,6 @@ class EvaluationWithDatasetCreateRequestDataset(TypedDict, total=False):
|
|
|
526
80
|
"""
|
|
527
81
|
|
|
528
82
|
|
|
529
|
-
class EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped(
|
|
530
|
-
TypedDict, total=False
|
|
531
|
-
):
|
|
532
|
-
messages: Required[Union[Iterable[Dict[str, object]], str]]
|
|
533
|
-
|
|
534
|
-
model: Required[str]
|
|
535
|
-
|
|
536
|
-
audio: Union[Dict[str, object], str]
|
|
537
|
-
|
|
538
|
-
frequency_penalty: Union[float, str]
|
|
539
|
-
|
|
540
|
-
function_call: Union[Dict[str, object], str]
|
|
541
|
-
|
|
542
|
-
functions: Union[Iterable[Dict[str, object]], str]
|
|
543
|
-
|
|
544
|
-
logit_bias: Union[Dict[str, int], str]
|
|
545
|
-
|
|
546
|
-
logprobs: Union[bool, str]
|
|
547
|
-
|
|
548
|
-
max_completion_tokens: Union[int, str]
|
|
549
|
-
|
|
550
|
-
max_tokens: Union[int, str]
|
|
551
|
-
|
|
552
|
-
metadata: Union[Dict[str, str], str]
|
|
553
|
-
|
|
554
|
-
modalities: Union[List[str], str]
|
|
555
|
-
|
|
556
|
-
n: Union[int, str]
|
|
557
|
-
|
|
558
|
-
parallel_tool_calls: Union[bool, str]
|
|
559
|
-
|
|
560
|
-
prediction: Union[Dict[str, object], str]
|
|
561
|
-
|
|
562
|
-
presence_penalty: Union[float, str]
|
|
563
|
-
|
|
564
|
-
reasoning_effort: str
|
|
565
|
-
|
|
566
|
-
response_format: Union[Dict[str, object], str]
|
|
567
|
-
|
|
568
|
-
seed: Union[int, str]
|
|
569
|
-
|
|
570
|
-
stop: str
|
|
571
|
-
|
|
572
|
-
store: Union[bool, str]
|
|
573
|
-
|
|
574
|
-
temperature: Union[float, str]
|
|
575
|
-
|
|
576
|
-
tool_choice: str
|
|
577
|
-
|
|
578
|
-
tools: Union[Iterable[Dict[str, object]], str]
|
|
579
|
-
|
|
580
|
-
top_k: Union[int, str]
|
|
581
|
-
|
|
582
|
-
top_logprobs: Union[int, str]
|
|
583
|
-
|
|
584
|
-
top_p: Union[float, str]
|
|
585
|
-
|
|
586
|
-
|
|
587
|
-
EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration: TypeAlias = Union[
|
|
588
|
-
EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfigurationTyped, Dict[str, object]
|
|
589
|
-
]
|
|
590
|
-
|
|
591
|
-
|
|
592
|
-
class EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest(TypedDict, total=False):
|
|
593
|
-
configuration: Required[EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequestConfiguration]
|
|
594
|
-
|
|
595
|
-
alias: str
|
|
596
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
597
|
-
|
|
598
|
-
task_type: Literal["chat_completion"]
|
|
599
|
-
|
|
600
|
-
|
|
601
|
-
class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration(
|
|
602
|
-
TypedDict, total=False
|
|
603
|
-
):
|
|
604
|
-
num_retries: int
|
|
605
|
-
|
|
606
|
-
timeout_seconds: int
|
|
607
|
-
|
|
608
|
-
|
|
609
|
-
EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration: TypeAlias = Union[
|
|
610
|
-
EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfigurationLaunchInferenceConfiguration,
|
|
611
|
-
str,
|
|
612
|
-
]
|
|
613
|
-
|
|
614
|
-
|
|
615
|
-
class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration(TypedDict, total=False):
|
|
616
|
-
model: Required[str]
|
|
617
|
-
|
|
618
|
-
args: Union[Dict[str, object], str]
|
|
619
|
-
|
|
620
|
-
inference_configuration: (
|
|
621
|
-
EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfigurationInferenceConfiguration
|
|
622
|
-
)
|
|
623
|
-
|
|
624
|
-
|
|
625
|
-
class EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest(TypedDict, total=False):
|
|
626
|
-
configuration: Required[EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequestConfiguration]
|
|
627
|
-
|
|
628
|
-
alias: str
|
|
629
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
630
|
-
|
|
631
|
-
task_type: Literal["inference"]
|
|
632
|
-
|
|
633
|
-
|
|
634
|
-
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0(
|
|
635
|
-
TypedDict, total=False
|
|
636
|
-
):
|
|
637
|
-
request: Required[str]
|
|
638
|
-
"""Request inputs"""
|
|
639
|
-
|
|
640
|
-
response: Required[str]
|
|
641
|
-
"""Response outputs"""
|
|
642
|
-
|
|
643
|
-
session_data: Dict[str, object]
|
|
644
|
-
"""Session data corresponding to the request response pair"""
|
|
645
|
-
|
|
646
|
-
|
|
647
|
-
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState(
|
|
648
|
-
TypedDict, total=False
|
|
649
|
-
):
|
|
650
|
-
current_node: Required[str]
|
|
651
|
-
|
|
652
|
-
state: Required[Dict[str, object]]
|
|
653
|
-
|
|
654
|
-
|
|
655
|
-
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace(
|
|
656
|
-
TypedDict, total=False
|
|
657
|
-
):
|
|
658
|
-
duration_ms: Required[int]
|
|
659
|
-
|
|
660
|
-
node_id: Required[str]
|
|
661
|
-
|
|
662
|
-
operation_input: Required[str]
|
|
663
|
-
|
|
664
|
-
operation_output: Required[str]
|
|
665
|
-
|
|
666
|
-
operation_type: Required[str]
|
|
667
|
-
|
|
668
|
-
start_timestamp: Required[str]
|
|
669
|
-
|
|
670
|
-
workflow_id: Required[str]
|
|
671
|
-
|
|
672
|
-
operation_metadata: Dict[str, object]
|
|
673
|
-
|
|
674
|
-
|
|
675
|
-
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides(
|
|
676
|
-
TypedDict, total=False
|
|
677
|
-
):
|
|
678
|
-
concurrent: bool
|
|
679
|
-
|
|
680
|
-
initial_state: EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesInitialState
|
|
681
|
-
|
|
682
|
-
partial_trace: Iterable[
|
|
683
|
-
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverridesPartialTrace
|
|
684
|
-
]
|
|
685
|
-
|
|
686
|
-
use_channels: bool
|
|
687
|
-
|
|
688
|
-
|
|
689
|
-
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides: TypeAlias = Union[
|
|
690
|
-
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverridesAgenticApplicationOverrides,
|
|
691
|
-
str,
|
|
692
|
-
]
|
|
693
|
-
|
|
694
|
-
|
|
695
|
-
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration(
|
|
696
|
-
TypedDict, total=False
|
|
697
|
-
):
|
|
698
|
-
application_variant_id: Required[str]
|
|
699
|
-
|
|
700
|
-
inputs: Required[Union[Dict[str, object], str]]
|
|
701
|
-
|
|
702
|
-
history: Union[
|
|
703
|
-
Iterable[
|
|
704
|
-
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationHistoryUnionMember0
|
|
705
|
-
],
|
|
706
|
-
str,
|
|
707
|
-
]
|
|
708
|
-
|
|
709
|
-
operation_metadata: Union[Dict[str, object], str]
|
|
710
|
-
|
|
711
|
-
overrides: EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfigurationOverrides
|
|
712
|
-
"""Execution override options for agentic applications"""
|
|
713
|
-
|
|
714
|
-
|
|
715
|
-
class EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest(TypedDict, total=False):
|
|
716
|
-
configuration: Required[
|
|
717
|
-
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequestConfiguration
|
|
718
|
-
]
|
|
719
|
-
|
|
720
|
-
alias: str
|
|
721
|
-
"""Alias to title the results column. Defaults to the `task_type`"""
|
|
722
|
-
|
|
723
|
-
task_type: Literal["application_variant"]
|
|
724
|
-
|
|
725
|
-
|
|
726
|
-
EvaluationWithDatasetCreateRequestTask: TypeAlias = Union[
|
|
727
|
-
EvaluationWithDatasetCreateRequestTaskChatCompletionEvaluationTaskRequest,
|
|
728
|
-
EvaluationWithDatasetCreateRequestTaskGenericInferenceEvaluationTaskRequest,
|
|
729
|
-
EvaluationWithDatasetCreateRequestTaskApplicationVariantV1EvaluationTaskRequest,
|
|
730
|
-
]
|
|
731
|
-
|
|
732
83
|
EvaluationCreateParams: TypeAlias = Union[
|
|
733
84
|
EvaluationStandaloneCreateRequest, EvaluationFromDatasetCreateRequest, EvaluationWithDatasetCreateRequest
|
|
734
85
|
]
|