@roarkanalytics/sdk 0.332.0 → 2.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +25 -0
- package/core.d.ts +2 -2
- package/core.d.ts.map +1 -1
- package/core.js +4 -2
- package/core.js.map +1 -1
- package/core.mjs +4 -2
- package/core.mjs.map +1 -1
- package/package.json +1 -1
- package/resources/evaluation.d.ts +831 -50
- package/resources/evaluation.d.ts.map +1 -1
- package/resources/evaluation.js.map +1 -1
- package/resources/evaluation.mjs.map +1 -1
- package/src/core.ts +5 -3
- package/src/resources/evaluation.ts +1085 -102
- package/src/version.ts +1 -1
- package/version.d.ts +1 -1
- package/version.d.ts.map +1 -1
- package/version.js +1 -1
- package/version.js.map +1 -1
- package/version.mjs +1 -1
- package/version.mjs.map +1 -1
|
@@ -8,13 +8,13 @@ export declare class Evaluation extends APIResource {
|
|
|
8
8
|
/**
|
|
9
9
|
* Returns a specific evaluator with its blocks and configuration.
|
|
10
10
|
*/
|
|
11
|
-
getEvaluatorById(evaluatorId: string, options?: Core.RequestOptions): Core.APIPromise<
|
|
11
|
+
getEvaluatorById(evaluatorId: string, options?: Core.RequestOptions): Core.APIPromise<EvaluationGetEvaluatorByIDResponse>;
|
|
12
12
|
/**
|
|
13
13
|
* Returns a list of evaluators with their blocks and configuration for the
|
|
14
14
|
* authenticated project.
|
|
15
15
|
*/
|
|
16
|
-
getEvaluators(query?: EvaluationGetEvaluatorsParams, options?: Core.RequestOptions): Core.APIPromise<
|
|
17
|
-
getEvaluators(options?: Core.RequestOptions): Core.APIPromise<
|
|
16
|
+
getEvaluators(query?: EvaluationGetEvaluatorsParams, options?: Core.RequestOptions): Core.APIPromise<EvaluationGetEvaluatorsResponse>;
|
|
17
|
+
getEvaluators(options?: Core.RequestOptions): Core.APIPromise<EvaluationGetEvaluatorsResponse>;
|
|
18
18
|
/**
|
|
19
19
|
* Retrieve details of a specific evaluation job
|
|
20
20
|
*/
|
|
@@ -40,8 +40,752 @@ export declare namespace EvaluationCreateJobResponse {
|
|
|
40
40
|
status: 'PENDING' | 'PROCESSING' | 'SUCCESS' | 'FAILURE';
|
|
41
41
|
}
|
|
42
42
|
}
|
|
43
|
-
|
|
44
|
-
|
|
43
|
+
/**
|
|
44
|
+
* Evaluator with its configured blocks
|
|
45
|
+
*/
|
|
46
|
+
export interface EvaluationGetEvaluatorByIDResponse {
|
|
47
|
+
/**
|
|
48
|
+
* Unique identifier for the evaluator
|
|
49
|
+
*/
|
|
50
|
+
id: string;
|
|
51
|
+
/**
|
|
52
|
+
* Array of evaluation blocks configured for this evaluator
|
|
53
|
+
*/
|
|
54
|
+
blocks: Array<EvaluationGetEvaluatorByIDResponse.UnionMember0 | EvaluationGetEvaluatorByIDResponse.UnionMember1 | EvaluationGetEvaluatorByIDResponse.UnionMember2 | EvaluationGetEvaluatorByIDResponse.UnionMember3 | EvaluationGetEvaluatorByIDResponse.UnionMember4 | EvaluationGetEvaluatorByIDResponse.UnionMember5 | EvaluationGetEvaluatorByIDResponse.UnionMember6 | EvaluationGetEvaluatorByIDResponse.UnionMember7 | EvaluationGetEvaluatorByIDResponse.UnionMember8>;
|
|
55
|
+
/**
|
|
56
|
+
* ISO timestamp when the evaluator was created
|
|
57
|
+
*/
|
|
58
|
+
createdAt: string;
|
|
59
|
+
/**
|
|
60
|
+
* Optional description of the evaluator
|
|
61
|
+
*/
|
|
62
|
+
description: string | null;
|
|
63
|
+
/**
|
|
64
|
+
* Name of the evaluator
|
|
65
|
+
*/
|
|
66
|
+
name: string;
|
|
67
|
+
/**
|
|
68
|
+
* Unique slug identifier for the evaluator
|
|
69
|
+
*/
|
|
70
|
+
slug: string;
|
|
71
|
+
/**
|
|
72
|
+
* ISO timestamp when the evaluator was last updated
|
|
73
|
+
*/
|
|
74
|
+
updatedAt: string;
|
|
75
|
+
}
|
|
76
|
+
export declare namespace EvaluationGetEvaluatorByIDResponse {
|
|
77
|
+
interface UnionMember0 {
|
|
78
|
+
/**
|
|
79
|
+
* Unique identifier for the block
|
|
80
|
+
*/
|
|
81
|
+
id: string;
|
|
82
|
+
/**
|
|
83
|
+
* Block type identifier
|
|
84
|
+
*/
|
|
85
|
+
blockType: 'CUSTOM_PROMPT';
|
|
86
|
+
/**
|
|
87
|
+
* Optional description of what this block evaluates
|
|
88
|
+
*/
|
|
89
|
+
description: string | null;
|
|
90
|
+
/**
|
|
91
|
+
* Name of the metric this prompt evaluates
|
|
92
|
+
*/
|
|
93
|
+
metricName: string;
|
|
94
|
+
/**
|
|
95
|
+
* Display name of the evaluation block
|
|
96
|
+
*/
|
|
97
|
+
name: string;
|
|
98
|
+
/**
|
|
99
|
+
* Order in which this block is executed
|
|
100
|
+
*/
|
|
101
|
+
orderIndex: number;
|
|
102
|
+
/**
|
|
103
|
+
* The prompt to evaluate the call against
|
|
104
|
+
*/
|
|
105
|
+
prompt: string;
|
|
106
|
+
/**
|
|
107
|
+
* Minimum score threshold to pass evaluation (0-1)
|
|
108
|
+
*/
|
|
109
|
+
threshold: number;
|
|
110
|
+
/**
|
|
111
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
112
|
+
*/
|
|
113
|
+
weight: number;
|
|
114
|
+
}
|
|
115
|
+
interface UnionMember1 {
|
|
116
|
+
/**
|
|
117
|
+
* Unique identifier for the block
|
|
118
|
+
*/
|
|
119
|
+
id: string;
|
|
120
|
+
/**
|
|
121
|
+
* Block type identifier
|
|
122
|
+
*/
|
|
123
|
+
blockType: 'DATAFIELD_CHECK';
|
|
124
|
+
/**
|
|
125
|
+
* Optional description of what this block evaluates
|
|
126
|
+
*/
|
|
127
|
+
description: string | null;
|
|
128
|
+
/**
|
|
129
|
+
* Criteria for evaluating the property
|
|
130
|
+
*/
|
|
131
|
+
evaluationCriteria: string;
|
|
132
|
+
/**
|
|
133
|
+
* Whether this property must be present
|
|
134
|
+
*/
|
|
135
|
+
isRequired: boolean;
|
|
136
|
+
/**
|
|
137
|
+
* Display name of the evaluation block
|
|
138
|
+
*/
|
|
139
|
+
name: string;
|
|
140
|
+
/**
|
|
141
|
+
* Order in which this block is executed
|
|
142
|
+
*/
|
|
143
|
+
orderIndex: number;
|
|
144
|
+
/**
|
|
145
|
+
* Name of the property to check
|
|
146
|
+
*/
|
|
147
|
+
propertyName: string;
|
|
148
|
+
/**
|
|
149
|
+
* Minimum score threshold to pass evaluation (0-1)
|
|
150
|
+
*/
|
|
151
|
+
threshold: number;
|
|
152
|
+
/**
|
|
153
|
+
* Expected type of the property value
|
|
154
|
+
*/
|
|
155
|
+
valueType: string;
|
|
156
|
+
/**
|
|
157
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
158
|
+
*/
|
|
159
|
+
weight: number;
|
|
160
|
+
}
|
|
161
|
+
interface UnionMember2 {
|
|
162
|
+
/**
|
|
163
|
+
* Unique identifier for the block
|
|
164
|
+
*/
|
|
165
|
+
id: string;
|
|
166
|
+
/**
|
|
167
|
+
* Block type identifier
|
|
168
|
+
*/
|
|
169
|
+
blockType: 'EMOTION';
|
|
170
|
+
/**
|
|
171
|
+
* Optional description of what this block evaluates
|
|
172
|
+
*/
|
|
173
|
+
description: string | null;
|
|
174
|
+
/**
|
|
175
|
+
* Display name of the evaluation block
|
|
176
|
+
*/
|
|
177
|
+
name: string;
|
|
178
|
+
/**
|
|
179
|
+
* Order in which this block is executed
|
|
180
|
+
*/
|
|
181
|
+
orderIndex: number;
|
|
182
|
+
/**
|
|
183
|
+
* The emotion to detect (e.g., "joy", "anger", "sadness")
|
|
184
|
+
*/
|
|
185
|
+
selectedEmotion: string;
|
|
186
|
+
/**
|
|
187
|
+
* Minimum confidence threshold for emotion detection (0-1)
|
|
188
|
+
*/
|
|
189
|
+
threshold: number;
|
|
190
|
+
/**
|
|
191
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
192
|
+
*/
|
|
193
|
+
weight: number;
|
|
194
|
+
}
|
|
195
|
+
interface UnionMember3 {
|
|
196
|
+
/**
|
|
197
|
+
* Unique identifier for the block
|
|
198
|
+
*/
|
|
199
|
+
id: string;
|
|
200
|
+
/**
|
|
201
|
+
* Block type identifier
|
|
202
|
+
*/
|
|
203
|
+
blockType: 'LATENCY';
|
|
204
|
+
/**
|
|
205
|
+
* Optional description of what this block evaluates
|
|
206
|
+
*/
|
|
207
|
+
description: string | null;
|
|
208
|
+
/**
|
|
209
|
+
* Maximum number of silence periods allowed
|
|
210
|
+
*/
|
|
211
|
+
maxAllowedSilences: number;
|
|
212
|
+
/**
|
|
213
|
+
* Minimum duration of silence in milliseconds to be considered
|
|
214
|
+
*/
|
|
215
|
+
minSilenceDuration: number;
|
|
216
|
+
/**
|
|
217
|
+
* Display name of the evaluation block
|
|
218
|
+
*/
|
|
219
|
+
name: string;
|
|
220
|
+
/**
|
|
221
|
+
* Order in which this block is executed
|
|
222
|
+
*/
|
|
223
|
+
orderIndex: number;
|
|
224
|
+
/**
|
|
225
|
+
* Maximum allowed latency score
|
|
226
|
+
*/
|
|
227
|
+
threshold: number;
|
|
228
|
+
/**
|
|
229
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
230
|
+
*/
|
|
231
|
+
weight: number;
|
|
232
|
+
}
|
|
233
|
+
interface UnionMember4 {
|
|
234
|
+
/**
|
|
235
|
+
* Unique identifier for the block
|
|
236
|
+
*/
|
|
237
|
+
id: string;
|
|
238
|
+
/**
|
|
239
|
+
* Block type identifier
|
|
240
|
+
*/
|
|
241
|
+
blockType: 'POLITENESS';
|
|
242
|
+
/**
|
|
243
|
+
* Optional description of what this block evaluates
|
|
244
|
+
*/
|
|
245
|
+
description: string | null;
|
|
246
|
+
/**
|
|
247
|
+
* Display name of the evaluation block
|
|
248
|
+
*/
|
|
249
|
+
name: string;
|
|
250
|
+
/**
|
|
251
|
+
* Order in which this block is executed
|
|
252
|
+
*/
|
|
253
|
+
orderIndex: number;
|
|
254
|
+
/**
|
|
255
|
+
* Minimum politeness score threshold (0-1)
|
|
256
|
+
*/
|
|
257
|
+
threshold: number;
|
|
258
|
+
/**
|
|
259
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
260
|
+
*/
|
|
261
|
+
weight: number;
|
|
262
|
+
}
|
|
263
|
+
interface UnionMember5 {
|
|
264
|
+
/**
|
|
265
|
+
* Unique identifier for the block
|
|
266
|
+
*/
|
|
267
|
+
id: string;
|
|
268
|
+
/**
|
|
269
|
+
* Block type identifier
|
|
270
|
+
*/
|
|
271
|
+
blockType: 'SENTIMENT';
|
|
272
|
+
/**
|
|
273
|
+
* Optional description of what this block evaluates
|
|
274
|
+
*/
|
|
275
|
+
description: string | null;
|
|
276
|
+
/**
|
|
277
|
+
* Display name of the evaluation block
|
|
278
|
+
*/
|
|
279
|
+
name: string;
|
|
280
|
+
/**
|
|
281
|
+
* Order in which this block is executed
|
|
282
|
+
*/
|
|
283
|
+
orderIndex: number;
|
|
284
|
+
/**
|
|
285
|
+
* Minimum sentiment score threshold (0-1)
|
|
286
|
+
*/
|
|
287
|
+
threshold: number;
|
|
288
|
+
/**
|
|
289
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
290
|
+
*/
|
|
291
|
+
weight: number;
|
|
292
|
+
}
|
|
293
|
+
interface UnionMember6 {
|
|
294
|
+
/**
|
|
295
|
+
* Unique identifier for the block
|
|
296
|
+
*/
|
|
297
|
+
id: string;
|
|
298
|
+
/**
|
|
299
|
+
* Block type identifier
|
|
300
|
+
*/
|
|
301
|
+
blockType: 'TOOL_CALLS';
|
|
302
|
+
/**
|
|
303
|
+
* Optional description of what this block evaluates
|
|
304
|
+
*/
|
|
305
|
+
description: string | null;
|
|
306
|
+
/**
|
|
307
|
+
* Condition that must be met for tool invocation
|
|
308
|
+
*/
|
|
309
|
+
invocationCondition: string | null;
|
|
310
|
+
/**
|
|
311
|
+
* Minimum number of times the tool should be invoked
|
|
312
|
+
*/
|
|
313
|
+
minInvocationCount: number | null;
|
|
314
|
+
/**
|
|
315
|
+
* Display name of the evaluation block
|
|
316
|
+
*/
|
|
317
|
+
name: string;
|
|
318
|
+
/**
|
|
319
|
+
* Order in which this block is executed
|
|
320
|
+
*/
|
|
321
|
+
orderIndex: number;
|
|
322
|
+
/**
|
|
323
|
+
* Whether the tool should be invoked
|
|
324
|
+
*/
|
|
325
|
+
shouldBeInvoked: boolean;
|
|
326
|
+
/**
|
|
327
|
+
* ID of the tool definition
|
|
328
|
+
*/
|
|
329
|
+
toolDefinitionId: string;
|
|
330
|
+
/**
|
|
331
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
332
|
+
*/
|
|
333
|
+
weight: number;
|
|
334
|
+
}
|
|
335
|
+
interface UnionMember7 {
|
|
336
|
+
/**
|
|
337
|
+
* Unique identifier for the block
|
|
338
|
+
*/
|
|
339
|
+
id: string;
|
|
340
|
+
/**
|
|
341
|
+
* Block type identifier
|
|
342
|
+
*/
|
|
343
|
+
blockType: 'TOXICITY';
|
|
344
|
+
/**
|
|
345
|
+
* Optional description of what this block evaluates
|
|
346
|
+
*/
|
|
347
|
+
description: string | null;
|
|
348
|
+
/**
|
|
349
|
+
* Display name of the evaluation block
|
|
350
|
+
*/
|
|
351
|
+
name: string;
|
|
352
|
+
/**
|
|
353
|
+
* Order in which this block is executed
|
|
354
|
+
*/
|
|
355
|
+
orderIndex: number;
|
|
356
|
+
/**
|
|
357
|
+
* Maximum allowed toxicity score (0-1)
|
|
358
|
+
*/
|
|
359
|
+
threshold: number;
|
|
360
|
+
/**
|
|
361
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
362
|
+
*/
|
|
363
|
+
weight: number;
|
|
364
|
+
}
|
|
365
|
+
interface UnionMember8 {
|
|
366
|
+
/**
|
|
367
|
+
* Unique identifier for the block
|
|
368
|
+
*/
|
|
369
|
+
id: string;
|
|
370
|
+
/**
|
|
371
|
+
* Block type identifier
|
|
372
|
+
*/
|
|
373
|
+
blockType: 'VOCAL_CUE';
|
|
374
|
+
/**
|
|
375
|
+
* Optional description of what this block evaluates
|
|
376
|
+
*/
|
|
377
|
+
description: string | null;
|
|
378
|
+
/**
|
|
379
|
+
* Display name of the evaluation block
|
|
380
|
+
*/
|
|
381
|
+
name: string;
|
|
382
|
+
/**
|
|
383
|
+
* Order in which this block is executed
|
|
384
|
+
*/
|
|
385
|
+
orderIndex: number;
|
|
386
|
+
/**
|
|
387
|
+
* The vocal cue to detect (e.g., "pace", "tone", "volume")
|
|
388
|
+
*/
|
|
389
|
+
selectedCue: string;
|
|
390
|
+
/**
|
|
391
|
+
* Minimum confidence threshold for vocal cue detection (0-1)
|
|
392
|
+
*/
|
|
393
|
+
threshold: number;
|
|
394
|
+
/**
|
|
395
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
396
|
+
*/
|
|
397
|
+
weight: number;
|
|
398
|
+
}
|
|
399
|
+
}
|
|
400
|
+
/**
|
|
401
|
+
* Response containing evaluators and pagination info
|
|
402
|
+
*/
|
|
403
|
+
export interface EvaluationGetEvaluatorsResponse {
|
|
404
|
+
/**
|
|
405
|
+
* Array of evaluators with their blocks
|
|
406
|
+
*/
|
|
407
|
+
data: Array<EvaluationGetEvaluatorsResponse.Data>;
|
|
408
|
+
/**
|
|
409
|
+
* Pagination information
|
|
410
|
+
*/
|
|
411
|
+
pagination: EvaluationGetEvaluatorsResponse.Pagination;
|
|
412
|
+
}
|
|
413
|
+
export declare namespace EvaluationGetEvaluatorsResponse {
|
|
414
|
+
/**
|
|
415
|
+
* Evaluator with its configured blocks
|
|
416
|
+
*/
|
|
417
|
+
interface Data {
|
|
418
|
+
/**
|
|
419
|
+
* Unique identifier for the evaluator
|
|
420
|
+
*/
|
|
421
|
+
id: string;
|
|
422
|
+
/**
|
|
423
|
+
* Array of evaluation blocks configured for this evaluator
|
|
424
|
+
*/
|
|
425
|
+
blocks: Array<Data.UnionMember0 | Data.UnionMember1 | Data.UnionMember2 | Data.UnionMember3 | Data.UnionMember4 | Data.UnionMember5 | Data.UnionMember6 | Data.UnionMember7 | Data.UnionMember8>;
|
|
426
|
+
/**
|
|
427
|
+
* ISO timestamp when the evaluator was created
|
|
428
|
+
*/
|
|
429
|
+
createdAt: string;
|
|
430
|
+
/**
|
|
431
|
+
* Optional description of the evaluator
|
|
432
|
+
*/
|
|
433
|
+
description: string | null;
|
|
434
|
+
/**
|
|
435
|
+
* Name of the evaluator
|
|
436
|
+
*/
|
|
437
|
+
name: string;
|
|
438
|
+
/**
|
|
439
|
+
* Unique slug identifier for the evaluator
|
|
440
|
+
*/
|
|
441
|
+
slug: string;
|
|
442
|
+
/**
|
|
443
|
+
* ISO timestamp when the evaluator was last updated
|
|
444
|
+
*/
|
|
445
|
+
updatedAt: string;
|
|
446
|
+
}
|
|
447
|
+
namespace Data {
|
|
448
|
+
interface UnionMember0 {
|
|
449
|
+
/**
|
|
450
|
+
* Unique identifier for the block
|
|
451
|
+
*/
|
|
452
|
+
id: string;
|
|
453
|
+
/**
|
|
454
|
+
* Block type identifier
|
|
455
|
+
*/
|
|
456
|
+
blockType: 'CUSTOM_PROMPT';
|
|
457
|
+
/**
|
|
458
|
+
* Optional description of what this block evaluates
|
|
459
|
+
*/
|
|
460
|
+
description: string | null;
|
|
461
|
+
/**
|
|
462
|
+
* Name of the metric this prompt evaluates
|
|
463
|
+
*/
|
|
464
|
+
metricName: string;
|
|
465
|
+
/**
|
|
466
|
+
* Display name of the evaluation block
|
|
467
|
+
*/
|
|
468
|
+
name: string;
|
|
469
|
+
/**
|
|
470
|
+
* Order in which this block is executed
|
|
471
|
+
*/
|
|
472
|
+
orderIndex: number;
|
|
473
|
+
/**
|
|
474
|
+
* The prompt to evaluate the call against
|
|
475
|
+
*/
|
|
476
|
+
prompt: string;
|
|
477
|
+
/**
|
|
478
|
+
* Minimum score threshold to pass evaluation (0-1)
|
|
479
|
+
*/
|
|
480
|
+
threshold: number;
|
|
481
|
+
/**
|
|
482
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
483
|
+
*/
|
|
484
|
+
weight: number;
|
|
485
|
+
}
|
|
486
|
+
interface UnionMember1 {
|
|
487
|
+
/**
|
|
488
|
+
* Unique identifier for the block
|
|
489
|
+
*/
|
|
490
|
+
id: string;
|
|
491
|
+
/**
|
|
492
|
+
* Block type identifier
|
|
493
|
+
*/
|
|
494
|
+
blockType: 'DATAFIELD_CHECK';
|
|
495
|
+
/**
|
|
496
|
+
* Optional description of what this block evaluates
|
|
497
|
+
*/
|
|
498
|
+
description: string | null;
|
|
499
|
+
/**
|
|
500
|
+
* Criteria for evaluating the property
|
|
501
|
+
*/
|
|
502
|
+
evaluationCriteria: string;
|
|
503
|
+
/**
|
|
504
|
+
* Whether this property must be present
|
|
505
|
+
*/
|
|
506
|
+
isRequired: boolean;
|
|
507
|
+
/**
|
|
508
|
+
* Display name of the evaluation block
|
|
509
|
+
*/
|
|
510
|
+
name: string;
|
|
511
|
+
/**
|
|
512
|
+
* Order in which this block is executed
|
|
513
|
+
*/
|
|
514
|
+
orderIndex: number;
|
|
515
|
+
/**
|
|
516
|
+
* Name of the property to check
|
|
517
|
+
*/
|
|
518
|
+
propertyName: string;
|
|
519
|
+
/**
|
|
520
|
+
* Minimum score threshold to pass evaluation (0-1)
|
|
521
|
+
*/
|
|
522
|
+
threshold: number;
|
|
523
|
+
/**
|
|
524
|
+
* Expected type of the property value
|
|
525
|
+
*/
|
|
526
|
+
valueType: string;
|
|
527
|
+
/**
|
|
528
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
529
|
+
*/
|
|
530
|
+
weight: number;
|
|
531
|
+
}
|
|
532
|
+
interface UnionMember2 {
|
|
533
|
+
/**
|
|
534
|
+
* Unique identifier for the block
|
|
535
|
+
*/
|
|
536
|
+
id: string;
|
|
537
|
+
/**
|
|
538
|
+
* Block type identifier
|
|
539
|
+
*/
|
|
540
|
+
blockType: 'EMOTION';
|
|
541
|
+
/**
|
|
542
|
+
* Optional description of what this block evaluates
|
|
543
|
+
*/
|
|
544
|
+
description: string | null;
|
|
545
|
+
/**
|
|
546
|
+
* Display name of the evaluation block
|
|
547
|
+
*/
|
|
548
|
+
name: string;
|
|
549
|
+
/**
|
|
550
|
+
* Order in which this block is executed
|
|
551
|
+
*/
|
|
552
|
+
orderIndex: number;
|
|
553
|
+
/**
|
|
554
|
+
* The emotion to detect (e.g., "joy", "anger", "sadness")
|
|
555
|
+
*/
|
|
556
|
+
selectedEmotion: string;
|
|
557
|
+
/**
|
|
558
|
+
* Minimum confidence threshold for emotion detection (0-1)
|
|
559
|
+
*/
|
|
560
|
+
threshold: number;
|
|
561
|
+
/**
|
|
562
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
563
|
+
*/
|
|
564
|
+
weight: number;
|
|
565
|
+
}
|
|
566
|
+
interface UnionMember3 {
|
|
567
|
+
/**
|
|
568
|
+
* Unique identifier for the block
|
|
569
|
+
*/
|
|
570
|
+
id: string;
|
|
571
|
+
/**
|
|
572
|
+
* Block type identifier
|
|
573
|
+
*/
|
|
574
|
+
blockType: 'LATENCY';
|
|
575
|
+
/**
|
|
576
|
+
* Optional description of what this block evaluates
|
|
577
|
+
*/
|
|
578
|
+
description: string | null;
|
|
579
|
+
/**
|
|
580
|
+
* Maximum number of silence periods allowed
|
|
581
|
+
*/
|
|
582
|
+
maxAllowedSilences: number;
|
|
583
|
+
/**
|
|
584
|
+
* Minimum duration of silence in milliseconds to be considered
|
|
585
|
+
*/
|
|
586
|
+
minSilenceDuration: number;
|
|
587
|
+
/**
|
|
588
|
+
* Display name of the evaluation block
|
|
589
|
+
*/
|
|
590
|
+
name: string;
|
|
591
|
+
/**
|
|
592
|
+
* Order in which this block is executed
|
|
593
|
+
*/
|
|
594
|
+
orderIndex: number;
|
|
595
|
+
/**
|
|
596
|
+
* Maximum allowed latency score
|
|
597
|
+
*/
|
|
598
|
+
threshold: number;
|
|
599
|
+
/**
|
|
600
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
601
|
+
*/
|
|
602
|
+
weight: number;
|
|
603
|
+
}
|
|
604
|
+
interface UnionMember4 {
|
|
605
|
+
/**
|
|
606
|
+
* Unique identifier for the block
|
|
607
|
+
*/
|
|
608
|
+
id: string;
|
|
609
|
+
/**
|
|
610
|
+
* Block type identifier
|
|
611
|
+
*/
|
|
612
|
+
blockType: 'POLITENESS';
|
|
613
|
+
/**
|
|
614
|
+
* Optional description of what this block evaluates
|
|
615
|
+
*/
|
|
616
|
+
description: string | null;
|
|
617
|
+
/**
|
|
618
|
+
* Display name of the evaluation block
|
|
619
|
+
*/
|
|
620
|
+
name: string;
|
|
621
|
+
/**
|
|
622
|
+
* Order in which this block is executed
|
|
623
|
+
*/
|
|
624
|
+
orderIndex: number;
|
|
625
|
+
/**
|
|
626
|
+
* Minimum politeness score threshold (0-1)
|
|
627
|
+
*/
|
|
628
|
+
threshold: number;
|
|
629
|
+
/**
|
|
630
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
631
|
+
*/
|
|
632
|
+
weight: number;
|
|
633
|
+
}
|
|
634
|
+
interface UnionMember5 {
|
|
635
|
+
/**
|
|
636
|
+
* Unique identifier for the block
|
|
637
|
+
*/
|
|
638
|
+
id: string;
|
|
639
|
+
/**
|
|
640
|
+
* Block type identifier
|
|
641
|
+
*/
|
|
642
|
+
blockType: 'SENTIMENT';
|
|
643
|
+
/**
|
|
644
|
+
* Optional description of what this block evaluates
|
|
645
|
+
*/
|
|
646
|
+
description: string | null;
|
|
647
|
+
/**
|
|
648
|
+
* Display name of the evaluation block
|
|
649
|
+
*/
|
|
650
|
+
name: string;
|
|
651
|
+
/**
|
|
652
|
+
* Order in which this block is executed
|
|
653
|
+
*/
|
|
654
|
+
orderIndex: number;
|
|
655
|
+
/**
|
|
656
|
+
* Minimum sentiment score threshold (0-1)
|
|
657
|
+
*/
|
|
658
|
+
threshold: number;
|
|
659
|
+
/**
|
|
660
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
661
|
+
*/
|
|
662
|
+
weight: number;
|
|
663
|
+
}
|
|
664
|
+
interface UnionMember6 {
|
|
665
|
+
/**
|
|
666
|
+
* Unique identifier for the block
|
|
667
|
+
*/
|
|
668
|
+
id: string;
|
|
669
|
+
/**
|
|
670
|
+
* Block type identifier
|
|
671
|
+
*/
|
|
672
|
+
blockType: 'TOOL_CALLS';
|
|
673
|
+
/**
|
|
674
|
+
* Optional description of what this block evaluates
|
|
675
|
+
*/
|
|
676
|
+
description: string | null;
|
|
677
|
+
/**
|
|
678
|
+
* Condition that must be met for tool invocation
|
|
679
|
+
*/
|
|
680
|
+
invocationCondition: string | null;
|
|
681
|
+
/**
|
|
682
|
+
* Minimum number of times the tool should be invoked
|
|
683
|
+
*/
|
|
684
|
+
minInvocationCount: number | null;
|
|
685
|
+
/**
|
|
686
|
+
* Display name of the evaluation block
|
|
687
|
+
*/
|
|
688
|
+
name: string;
|
|
689
|
+
/**
|
|
690
|
+
* Order in which this block is executed
|
|
691
|
+
*/
|
|
692
|
+
orderIndex: number;
|
|
693
|
+
/**
|
|
694
|
+
* Whether the tool should be invoked
|
|
695
|
+
*/
|
|
696
|
+
shouldBeInvoked: boolean;
|
|
697
|
+
/**
|
|
698
|
+
* ID of the tool definition
|
|
699
|
+
*/
|
|
700
|
+
toolDefinitionId: string;
|
|
701
|
+
/**
|
|
702
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
703
|
+
*/
|
|
704
|
+
weight: number;
|
|
705
|
+
}
|
|
706
|
+
interface UnionMember7 {
|
|
707
|
+
/**
|
|
708
|
+
* Unique identifier for the block
|
|
709
|
+
*/
|
|
710
|
+
id: string;
|
|
711
|
+
/**
|
|
712
|
+
* Block type identifier
|
|
713
|
+
*/
|
|
714
|
+
blockType: 'TOXICITY';
|
|
715
|
+
/**
|
|
716
|
+
* Optional description of what this block evaluates
|
|
717
|
+
*/
|
|
718
|
+
description: string | null;
|
|
719
|
+
/**
|
|
720
|
+
* Display name of the evaluation block
|
|
721
|
+
*/
|
|
722
|
+
name: string;
|
|
723
|
+
/**
|
|
724
|
+
* Order in which this block is executed
|
|
725
|
+
*/
|
|
726
|
+
orderIndex: number;
|
|
727
|
+
/**
|
|
728
|
+
* Maximum allowed toxicity score (0-1)
|
|
729
|
+
*/
|
|
730
|
+
threshold: number;
|
|
731
|
+
/**
|
|
732
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
733
|
+
*/
|
|
734
|
+
weight: number;
|
|
735
|
+
}
|
|
736
|
+
interface UnionMember8 {
|
|
737
|
+
/**
|
|
738
|
+
* Unique identifier for the block
|
|
739
|
+
*/
|
|
740
|
+
id: string;
|
|
741
|
+
/**
|
|
742
|
+
* Block type identifier
|
|
743
|
+
*/
|
|
744
|
+
blockType: 'VOCAL_CUE';
|
|
745
|
+
/**
|
|
746
|
+
* Optional description of what this block evaluates
|
|
747
|
+
*/
|
|
748
|
+
description: string | null;
|
|
749
|
+
/**
|
|
750
|
+
* Display name of the evaluation block
|
|
751
|
+
*/
|
|
752
|
+
name: string;
|
|
753
|
+
/**
|
|
754
|
+
* Order in which this block is executed
|
|
755
|
+
*/
|
|
756
|
+
orderIndex: number;
|
|
757
|
+
/**
|
|
758
|
+
* The vocal cue to detect (e.g., "pace", "tone", "volume")
|
|
759
|
+
*/
|
|
760
|
+
selectedCue: string;
|
|
761
|
+
/**
|
|
762
|
+
* Minimum confidence threshold for vocal cue detection (0-1)
|
|
763
|
+
*/
|
|
764
|
+
threshold: number;
|
|
765
|
+
/**
|
|
766
|
+
* Weight of this block in the overall evaluation score (0-100)
|
|
767
|
+
*/
|
|
768
|
+
weight: number;
|
|
769
|
+
}
|
|
770
|
+
}
|
|
771
|
+
/**
|
|
772
|
+
* Pagination information
|
|
773
|
+
*/
|
|
774
|
+
interface Pagination {
|
|
775
|
+
/**
|
|
776
|
+
* Whether there are more evaluators to fetch
|
|
777
|
+
*/
|
|
778
|
+
hasMore: boolean;
|
|
779
|
+
/**
|
|
780
|
+
* Cursor for the next page, null if no more pages
|
|
781
|
+
*/
|
|
782
|
+
nextCursor: string | null;
|
|
783
|
+
/**
|
|
784
|
+
* Total number of evaluators
|
|
785
|
+
*/
|
|
786
|
+
total: number;
|
|
787
|
+
}
|
|
788
|
+
}
|
|
45
789
|
export interface EvaluationGetJobResponse {
|
|
46
790
|
/**
|
|
47
791
|
* Evaluation job response payload
|
|
@@ -126,107 +870,138 @@ export declare namespace EvaluationGetJobRunsResponse {
|
|
|
126
870
|
namespace Data {
|
|
127
871
|
interface Data {
|
|
128
872
|
/**
|
|
129
|
-
*
|
|
873
|
+
* All block runs for this evaluator, including skipped ones
|
|
130
874
|
*/
|
|
131
|
-
|
|
875
|
+
blockRuns: Array<Data.BlockRun>;
|
|
876
|
+
evaluator: Data.Evaluator;
|
|
877
|
+
evidence: Array<Data.Evidence>;
|
|
878
|
+
metrics: Array<Data.Metric>;
|
|
132
879
|
/**
|
|
133
|
-
*
|
|
134
|
-
*/
|
|
135
|
-
completedAt: string | null;
|
|
136
|
-
/**
|
|
137
|
-
* Evaluator of the evaluator run
|
|
880
|
+
* Status of the evaluator run
|
|
138
881
|
*/
|
|
139
|
-
|
|
882
|
+
status: 'PENDING' | 'IN_PROGRESS' | 'COMPLETED' | 'FAILED';
|
|
140
883
|
/**
|
|
141
|
-
*
|
|
884
|
+
* ID of the evaluator run
|
|
142
885
|
*/
|
|
143
|
-
|
|
886
|
+
id?: string;
|
|
144
887
|
/**
|
|
145
|
-
*
|
|
888
|
+
* When the evaluator run completed
|
|
146
889
|
*/
|
|
147
|
-
|
|
890
|
+
completedAt?: string | null;
|
|
148
891
|
/**
|
|
149
|
-
* Score of the
|
|
892
|
+
* Score of the evaluation run (0-1)
|
|
150
893
|
*/
|
|
151
|
-
score
|
|
894
|
+
score?: number | null;
|
|
152
895
|
/**
|
|
153
|
-
* Score classification of the evaluator run
|
|
896
|
+
* Score classification of the evaluator run based on score threshold (IRRELEVANT
|
|
897
|
+
* is mapped to SKIPPED)
|
|
154
898
|
*/
|
|
155
|
-
scoreClassification
|
|
899
|
+
scoreClassification?: 'SUCCESS' | 'FAILURE' | 'SKIPPED' | null;
|
|
156
900
|
/**
|
|
157
901
|
* When the evaluator run started
|
|
158
902
|
*/
|
|
159
|
-
startedAt
|
|
903
|
+
startedAt?: string | null;
|
|
160
904
|
/**
|
|
161
|
-
*
|
|
905
|
+
* Summary of the evaluation run
|
|
162
906
|
*/
|
|
163
|
-
|
|
164
|
-
/**
|
|
165
|
-
* Summary of the evaluator run
|
|
166
|
-
*/
|
|
167
|
-
summary: string | null;
|
|
907
|
+
summary?: string | null;
|
|
168
908
|
}
|
|
169
909
|
namespace Data {
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
|
|
910
|
+
interface BlockRun {
|
|
911
|
+
/**
|
|
912
|
+
* ID of the block definition
|
|
913
|
+
*/
|
|
914
|
+
blockDefinitionId: string;
|
|
915
|
+
/**
|
|
916
|
+
* Name of the evaluation block
|
|
917
|
+
*/
|
|
918
|
+
blockName: string;
|
|
919
|
+
/**
|
|
920
|
+
* ID of the block run instance
|
|
921
|
+
*/
|
|
922
|
+
blockRunId: string;
|
|
923
|
+
/**
|
|
924
|
+
* When the block run was created
|
|
925
|
+
*/
|
|
926
|
+
createdAt: string;
|
|
927
|
+
/**
|
|
928
|
+
* Reason for the outcome (pass/fail explanation or skip reason)
|
|
929
|
+
*/
|
|
930
|
+
reason: string | null;
|
|
931
|
+
/**
|
|
932
|
+
* Result of the block run
|
|
933
|
+
*/
|
|
934
|
+
result: 'PASSED' | 'FAILED' | 'SKIPPED' | null;
|
|
935
|
+
/**
|
|
936
|
+
* Score of the block run (0-1)
|
|
937
|
+
*/
|
|
938
|
+
score: number | null;
|
|
939
|
+
/**
|
|
940
|
+
* Status of the block run
|
|
941
|
+
*/
|
|
942
|
+
status: 'PENDING' | 'RUNNING' | 'COMPLETED' | 'FAILED';
|
|
943
|
+
}
|
|
173
944
|
interface Evaluator {
|
|
174
945
|
/**
|
|
175
946
|
* ID of the evaluator
|
|
176
947
|
*/
|
|
177
|
-
id: string
|
|
948
|
+
id: string;
|
|
178
949
|
/**
|
|
179
950
|
* Name of the evaluator
|
|
180
951
|
*/
|
|
181
|
-
name: string
|
|
952
|
+
name: string;
|
|
953
|
+
/**
|
|
954
|
+
* Weight of the evaluator
|
|
955
|
+
*/
|
|
956
|
+
weight?: number;
|
|
182
957
|
}
|
|
183
958
|
interface Evidence {
|
|
184
959
|
/**
|
|
185
|
-
*
|
|
960
|
+
* Comment text of the evidence
|
|
186
961
|
*/
|
|
187
|
-
|
|
962
|
+
commentText: string | null;
|
|
188
963
|
/**
|
|
189
|
-
*
|
|
964
|
+
* Created at of the evidence
|
|
190
965
|
*/
|
|
191
|
-
|
|
966
|
+
createdAt: string;
|
|
192
967
|
/**
|
|
193
|
-
*
|
|
968
|
+
* Is positive of the evidence
|
|
194
969
|
*/
|
|
195
|
-
isPositive: boolean
|
|
970
|
+
isPositive: boolean;
|
|
196
971
|
/**
|
|
197
|
-
* Snippet of the evidence
|
|
972
|
+
* Snippet text of the evidence
|
|
198
973
|
*/
|
|
199
|
-
snippetText: string
|
|
974
|
+
snippetText: string;
|
|
200
975
|
}
|
|
201
976
|
interface Metric {
|
|
202
|
-
/**
|
|
203
|
-
* ID of the metric
|
|
204
|
-
*/
|
|
205
|
-
id: string | null;
|
|
206
977
|
/**
|
|
207
978
|
* Boolean value of the metric
|
|
208
979
|
*/
|
|
209
980
|
booleanValue: boolean | null;
|
|
210
981
|
/**
|
|
211
|
-
* Confidence of the metric
|
|
982
|
+
* Confidence level of the metric (0-1)
|
|
212
983
|
*/
|
|
213
984
|
confidence: number | null;
|
|
985
|
+
/**
|
|
986
|
+
* Created at of the metric
|
|
987
|
+
*/
|
|
988
|
+
createdAt: string;
|
|
214
989
|
/**
|
|
215
990
|
* Name of the metric
|
|
216
991
|
*/
|
|
217
|
-
name: string
|
|
992
|
+
name: string;
|
|
218
993
|
/**
|
|
219
994
|
* Numeric value of the metric
|
|
220
995
|
*/
|
|
221
996
|
numericValue: number | null;
|
|
222
997
|
/**
|
|
223
|
-
* Reasoning
|
|
998
|
+
* Reasoning of the metric
|
|
224
999
|
*/
|
|
225
1000
|
reasoning: string | null;
|
|
226
1001
|
/**
|
|
227
1002
|
* Role of the metric
|
|
228
1003
|
*/
|
|
229
|
-
role:
|
|
1004
|
+
role: string;
|
|
230
1005
|
/**
|
|
231
1006
|
* Text value of the metric
|
|
232
1007
|
*/
|
|
@@ -234,7 +1009,7 @@ export declare namespace EvaluationGetJobRunsResponse {
|
|
|
234
1009
|
/**
|
|
235
1010
|
* Value type of the metric
|
|
236
1011
|
*/
|
|
237
|
-
valueType:
|
|
1012
|
+
valueType: string;
|
|
238
1013
|
}
|
|
239
1014
|
}
|
|
240
1015
|
/**
|
|
@@ -498,7 +1273,13 @@ export declare namespace EvaluationCreateJobParams {
|
|
|
498
1273
|
}
|
|
499
1274
|
}
|
|
500
1275
|
export interface EvaluationGetEvaluatorsParams {
|
|
1276
|
+
/**
|
|
1277
|
+
* Cursor for pagination - evaluator ID to start after
|
|
1278
|
+
*/
|
|
501
1279
|
after?: string;
|
|
1280
|
+
/**
|
|
1281
|
+
* Maximum number of evaluators to return (default: 20, max: 50)
|
|
1282
|
+
*/
|
|
502
1283
|
limit?: string;
|
|
503
1284
|
}
|
|
504
1285
|
export interface EvaluationGetJobRunsParams {
|