@roarkanalytics/sdk 0.332.0 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -8,13 +8,13 @@ export declare class Evaluation extends APIResource {
8
8
  /**
9
9
  * Returns a specific evaluator with its blocks and configuration.
10
10
  */
11
- getEvaluatorById(evaluatorId: string, options?: Core.RequestOptions): Core.APIPromise<unknown>;
11
+ getEvaluatorById(evaluatorId: string, options?: Core.RequestOptions): Core.APIPromise<EvaluationGetEvaluatorByIDResponse>;
12
12
  /**
13
13
  * Returns a list of evaluators with their blocks and configuration for the
14
14
  * authenticated project.
15
15
  */
16
- getEvaluators(query?: EvaluationGetEvaluatorsParams, options?: Core.RequestOptions): Core.APIPromise<unknown>;
17
- getEvaluators(options?: Core.RequestOptions): Core.APIPromise<unknown>;
16
+ getEvaluators(query?: EvaluationGetEvaluatorsParams, options?: Core.RequestOptions): Core.APIPromise<EvaluationGetEvaluatorsResponse>;
17
+ getEvaluators(options?: Core.RequestOptions): Core.APIPromise<EvaluationGetEvaluatorsResponse>;
18
18
  /**
19
19
  * Retrieve details of a specific evaluation job
20
20
  */
@@ -40,8 +40,752 @@ export declare namespace EvaluationCreateJobResponse {
40
40
  status: 'PENDING' | 'PROCESSING' | 'SUCCESS' | 'FAILURE';
41
41
  }
42
42
  }
43
- export type EvaluationGetEvaluatorByIDResponse = unknown;
44
- export type EvaluationGetEvaluatorsResponse = unknown;
43
+ /**
44
+ * Evaluator with its configured blocks
45
+ */
46
+ export interface EvaluationGetEvaluatorByIDResponse {
47
+ /**
48
+ * Unique identifier for the evaluator
49
+ */
50
+ id: string;
51
+ /**
52
+ * Array of evaluation blocks configured for this evaluator
53
+ */
54
+ blocks: Array<EvaluationGetEvaluatorByIDResponse.UnionMember0 | EvaluationGetEvaluatorByIDResponse.UnionMember1 | EvaluationGetEvaluatorByIDResponse.UnionMember2 | EvaluationGetEvaluatorByIDResponse.UnionMember3 | EvaluationGetEvaluatorByIDResponse.UnionMember4 | EvaluationGetEvaluatorByIDResponse.UnionMember5 | EvaluationGetEvaluatorByIDResponse.UnionMember6 | EvaluationGetEvaluatorByIDResponse.UnionMember7 | EvaluationGetEvaluatorByIDResponse.UnionMember8>;
55
+ /**
56
+ * ISO timestamp when the evaluator was created
57
+ */
58
+ createdAt: string;
59
+ /**
60
+ * Optional description of the evaluator
61
+ */
62
+ description: string | null;
63
+ /**
64
+ * Name of the evaluator
65
+ */
66
+ name: string;
67
+ /**
68
+ * Unique slug identifier for the evaluator
69
+ */
70
+ slug: string;
71
+ /**
72
+ * ISO timestamp when the evaluator was last updated
73
+ */
74
+ updatedAt: string;
75
+ }
76
+ export declare namespace EvaluationGetEvaluatorByIDResponse {
77
+ interface UnionMember0 {
78
+ /**
79
+ * Unique identifier for the block
80
+ */
81
+ id: string;
82
+ /**
83
+ * Block type identifier
84
+ */
85
+ blockType: 'CUSTOM_PROMPT';
86
+ /**
87
+ * Optional description of what this block evaluates
88
+ */
89
+ description: string | null;
90
+ /**
91
+ * Name of the metric this prompt evaluates
92
+ */
93
+ metricName: string;
94
+ /**
95
+ * Display name of the evaluation block
96
+ */
97
+ name: string;
98
+ /**
99
+ * Order in which this block is executed
100
+ */
101
+ orderIndex: number;
102
+ /**
103
+ * The prompt to evaluate the call against
104
+ */
105
+ prompt: string;
106
+ /**
107
+ * Minimum score threshold to pass evaluation (0-1)
108
+ */
109
+ threshold: number;
110
+ /**
111
+ * Weight of this block in the overall evaluation score (0-100)
112
+ */
113
+ weight: number;
114
+ }
115
+ interface UnionMember1 {
116
+ /**
117
+ * Unique identifier for the block
118
+ */
119
+ id: string;
120
+ /**
121
+ * Block type identifier
122
+ */
123
+ blockType: 'DATAFIELD_CHECK';
124
+ /**
125
+ * Optional description of what this block evaluates
126
+ */
127
+ description: string | null;
128
+ /**
129
+ * Criteria for evaluating the property
130
+ */
131
+ evaluationCriteria: string;
132
+ /**
133
+ * Whether this property must be present
134
+ */
135
+ isRequired: boolean;
136
+ /**
137
+ * Display name of the evaluation block
138
+ */
139
+ name: string;
140
+ /**
141
+ * Order in which this block is executed
142
+ */
143
+ orderIndex: number;
144
+ /**
145
+ * Name of the property to check
146
+ */
147
+ propertyName: string;
148
+ /**
149
+ * Minimum score threshold to pass evaluation (0-1)
150
+ */
151
+ threshold: number;
152
+ /**
153
+ * Expected type of the property value
154
+ */
155
+ valueType: string;
156
+ /**
157
+ * Weight of this block in the overall evaluation score (0-100)
158
+ */
159
+ weight: number;
160
+ }
161
+ interface UnionMember2 {
162
+ /**
163
+ * Unique identifier for the block
164
+ */
165
+ id: string;
166
+ /**
167
+ * Block type identifier
168
+ */
169
+ blockType: 'EMOTION';
170
+ /**
171
+ * Optional description of what this block evaluates
172
+ */
173
+ description: string | null;
174
+ /**
175
+ * Display name of the evaluation block
176
+ */
177
+ name: string;
178
+ /**
179
+ * Order in which this block is executed
180
+ */
181
+ orderIndex: number;
182
+ /**
183
+ * The emotion to detect (e.g., "joy", "anger", "sadness")
184
+ */
185
+ selectedEmotion: string;
186
+ /**
187
+ * Minimum confidence threshold for emotion detection (0-1)
188
+ */
189
+ threshold: number;
190
+ /**
191
+ * Weight of this block in the overall evaluation score (0-100)
192
+ */
193
+ weight: number;
194
+ }
195
+ interface UnionMember3 {
196
+ /**
197
+ * Unique identifier for the block
198
+ */
199
+ id: string;
200
+ /**
201
+ * Block type identifier
202
+ */
203
+ blockType: 'LATENCY';
204
+ /**
205
+ * Optional description of what this block evaluates
206
+ */
207
+ description: string | null;
208
+ /**
209
+ * Maximum number of silence periods allowed
210
+ */
211
+ maxAllowedSilences: number;
212
+ /**
213
+ * Minimum duration of silence in milliseconds to be considered
214
+ */
215
+ minSilenceDuration: number;
216
+ /**
217
+ * Display name of the evaluation block
218
+ */
219
+ name: string;
220
+ /**
221
+ * Order in which this block is executed
222
+ */
223
+ orderIndex: number;
224
+ /**
225
+ * Maximum allowed latency score
226
+ */
227
+ threshold: number;
228
+ /**
229
+ * Weight of this block in the overall evaluation score (0-100)
230
+ */
231
+ weight: number;
232
+ }
233
+ interface UnionMember4 {
234
+ /**
235
+ * Unique identifier for the block
236
+ */
237
+ id: string;
238
+ /**
239
+ * Block type identifier
240
+ */
241
+ blockType: 'POLITENESS';
242
+ /**
243
+ * Optional description of what this block evaluates
244
+ */
245
+ description: string | null;
246
+ /**
247
+ * Display name of the evaluation block
248
+ */
249
+ name: string;
250
+ /**
251
+ * Order in which this block is executed
252
+ */
253
+ orderIndex: number;
254
+ /**
255
+ * Minimum politeness score threshold (0-1)
256
+ */
257
+ threshold: number;
258
+ /**
259
+ * Weight of this block in the overall evaluation score (0-100)
260
+ */
261
+ weight: number;
262
+ }
263
+ interface UnionMember5 {
264
+ /**
265
+ * Unique identifier for the block
266
+ */
267
+ id: string;
268
+ /**
269
+ * Block type identifier
270
+ */
271
+ blockType: 'SENTIMENT';
272
+ /**
273
+ * Optional description of what this block evaluates
274
+ */
275
+ description: string | null;
276
+ /**
277
+ * Display name of the evaluation block
278
+ */
279
+ name: string;
280
+ /**
281
+ * Order in which this block is executed
282
+ */
283
+ orderIndex: number;
284
+ /**
285
+ * Minimum sentiment score threshold (0-1)
286
+ */
287
+ threshold: number;
288
+ /**
289
+ * Weight of this block in the overall evaluation score (0-100)
290
+ */
291
+ weight: number;
292
+ }
293
+ interface UnionMember6 {
294
+ /**
295
+ * Unique identifier for the block
296
+ */
297
+ id: string;
298
+ /**
299
+ * Block type identifier
300
+ */
301
+ blockType: 'TOOL_CALLS';
302
+ /**
303
+ * Optional description of what this block evaluates
304
+ */
305
+ description: string | null;
306
+ /**
307
+ * Condition that must be met for tool invocation
308
+ */
309
+ invocationCondition: string | null;
310
+ /**
311
+ * Minimum number of times the tool should be invoked
312
+ */
313
+ minInvocationCount: number | null;
314
+ /**
315
+ * Display name of the evaluation block
316
+ */
317
+ name: string;
318
+ /**
319
+ * Order in which this block is executed
320
+ */
321
+ orderIndex: number;
322
+ /**
323
+ * Whether the tool should be invoked
324
+ */
325
+ shouldBeInvoked: boolean;
326
+ /**
327
+ * ID of the tool definition
328
+ */
329
+ toolDefinitionId: string;
330
+ /**
331
+ * Weight of this block in the overall evaluation score (0-100)
332
+ */
333
+ weight: number;
334
+ }
335
+ interface UnionMember7 {
336
+ /**
337
+ * Unique identifier for the block
338
+ */
339
+ id: string;
340
+ /**
341
+ * Block type identifier
342
+ */
343
+ blockType: 'TOXICITY';
344
+ /**
345
+ * Optional description of what this block evaluates
346
+ */
347
+ description: string | null;
348
+ /**
349
+ * Display name of the evaluation block
350
+ */
351
+ name: string;
352
+ /**
353
+ * Order in which this block is executed
354
+ */
355
+ orderIndex: number;
356
+ /**
357
+ * Maximum allowed toxicity score (0-1)
358
+ */
359
+ threshold: number;
360
+ /**
361
+ * Weight of this block in the overall evaluation score (0-100)
362
+ */
363
+ weight: number;
364
+ }
365
+ interface UnionMember8 {
366
+ /**
367
+ * Unique identifier for the block
368
+ */
369
+ id: string;
370
+ /**
371
+ * Block type identifier
372
+ */
373
+ blockType: 'VOCAL_CUE';
374
+ /**
375
+ * Optional description of what this block evaluates
376
+ */
377
+ description: string | null;
378
+ /**
379
+ * Display name of the evaluation block
380
+ */
381
+ name: string;
382
+ /**
383
+ * Order in which this block is executed
384
+ */
385
+ orderIndex: number;
386
+ /**
387
+ * The vocal cue to detect (e.g., "pace", "tone", "volume")
388
+ */
389
+ selectedCue: string;
390
+ /**
391
+ * Minimum confidence threshold for vocal cue detection (0-1)
392
+ */
393
+ threshold: number;
394
+ /**
395
+ * Weight of this block in the overall evaluation score (0-100)
396
+ */
397
+ weight: number;
398
+ }
399
+ }
400
+ /**
401
+ * Response containing evaluators and pagination info
402
+ */
403
+ export interface EvaluationGetEvaluatorsResponse {
404
+ /**
405
+ * Array of evaluators with their blocks
406
+ */
407
+ data: Array<EvaluationGetEvaluatorsResponse.Data>;
408
+ /**
409
+ * Pagination information
410
+ */
411
+ pagination: EvaluationGetEvaluatorsResponse.Pagination;
412
+ }
413
+ export declare namespace EvaluationGetEvaluatorsResponse {
414
+ /**
415
+ * Evaluator with its configured blocks
416
+ */
417
+ interface Data {
418
+ /**
419
+ * Unique identifier for the evaluator
420
+ */
421
+ id: string;
422
+ /**
423
+ * Array of evaluation blocks configured for this evaluator
424
+ */
425
+ blocks: Array<Data.UnionMember0 | Data.UnionMember1 | Data.UnionMember2 | Data.UnionMember3 | Data.UnionMember4 | Data.UnionMember5 | Data.UnionMember6 | Data.UnionMember7 | Data.UnionMember8>;
426
+ /**
427
+ * ISO timestamp when the evaluator was created
428
+ */
429
+ createdAt: string;
430
+ /**
431
+ * Optional description of the evaluator
432
+ */
433
+ description: string | null;
434
+ /**
435
+ * Name of the evaluator
436
+ */
437
+ name: string;
438
+ /**
439
+ * Unique slug identifier for the evaluator
440
+ */
441
+ slug: string;
442
+ /**
443
+ * ISO timestamp when the evaluator was last updated
444
+ */
445
+ updatedAt: string;
446
+ }
447
+ namespace Data {
448
+ interface UnionMember0 {
449
+ /**
450
+ * Unique identifier for the block
451
+ */
452
+ id: string;
453
+ /**
454
+ * Block type identifier
455
+ */
456
+ blockType: 'CUSTOM_PROMPT';
457
+ /**
458
+ * Optional description of what this block evaluates
459
+ */
460
+ description: string | null;
461
+ /**
462
+ * Name of the metric this prompt evaluates
463
+ */
464
+ metricName: string;
465
+ /**
466
+ * Display name of the evaluation block
467
+ */
468
+ name: string;
469
+ /**
470
+ * Order in which this block is executed
471
+ */
472
+ orderIndex: number;
473
+ /**
474
+ * The prompt to evaluate the call against
475
+ */
476
+ prompt: string;
477
+ /**
478
+ * Minimum score threshold to pass evaluation (0-1)
479
+ */
480
+ threshold: number;
481
+ /**
482
+ * Weight of this block in the overall evaluation score (0-100)
483
+ */
484
+ weight: number;
485
+ }
486
+ interface UnionMember1 {
487
+ /**
488
+ * Unique identifier for the block
489
+ */
490
+ id: string;
491
+ /**
492
+ * Block type identifier
493
+ */
494
+ blockType: 'DATAFIELD_CHECK';
495
+ /**
496
+ * Optional description of what this block evaluates
497
+ */
498
+ description: string | null;
499
+ /**
500
+ * Criteria for evaluating the property
501
+ */
502
+ evaluationCriteria: string;
503
+ /**
504
+ * Whether this property must be present
505
+ */
506
+ isRequired: boolean;
507
+ /**
508
+ * Display name of the evaluation block
509
+ */
510
+ name: string;
511
+ /**
512
+ * Order in which this block is executed
513
+ */
514
+ orderIndex: number;
515
+ /**
516
+ * Name of the property to check
517
+ */
518
+ propertyName: string;
519
+ /**
520
+ * Minimum score threshold to pass evaluation (0-1)
521
+ */
522
+ threshold: number;
523
+ /**
524
+ * Expected type of the property value
525
+ */
526
+ valueType: string;
527
+ /**
528
+ * Weight of this block in the overall evaluation score (0-100)
529
+ */
530
+ weight: number;
531
+ }
532
+ interface UnionMember2 {
533
+ /**
534
+ * Unique identifier for the block
535
+ */
536
+ id: string;
537
+ /**
538
+ * Block type identifier
539
+ */
540
+ blockType: 'EMOTION';
541
+ /**
542
+ * Optional description of what this block evaluates
543
+ */
544
+ description: string | null;
545
+ /**
546
+ * Display name of the evaluation block
547
+ */
548
+ name: string;
549
+ /**
550
+ * Order in which this block is executed
551
+ */
552
+ orderIndex: number;
553
+ /**
554
+ * The emotion to detect (e.g., "joy", "anger", "sadness")
555
+ */
556
+ selectedEmotion: string;
557
+ /**
558
+ * Minimum confidence threshold for emotion detection (0-1)
559
+ */
560
+ threshold: number;
561
+ /**
562
+ * Weight of this block in the overall evaluation score (0-100)
563
+ */
564
+ weight: number;
565
+ }
566
+ interface UnionMember3 {
567
+ /**
568
+ * Unique identifier for the block
569
+ */
570
+ id: string;
571
+ /**
572
+ * Block type identifier
573
+ */
574
+ blockType: 'LATENCY';
575
+ /**
576
+ * Optional description of what this block evaluates
577
+ */
578
+ description: string | null;
579
+ /**
580
+ * Maximum number of silence periods allowed
581
+ */
582
+ maxAllowedSilences: number;
583
+ /**
584
+ * Minimum duration of silence in milliseconds to be considered
585
+ */
586
+ minSilenceDuration: number;
587
+ /**
588
+ * Display name of the evaluation block
589
+ */
590
+ name: string;
591
+ /**
592
+ * Order in which this block is executed
593
+ */
594
+ orderIndex: number;
595
+ /**
596
+ * Maximum allowed latency score
597
+ */
598
+ threshold: number;
599
+ /**
600
+ * Weight of this block in the overall evaluation score (0-100)
601
+ */
602
+ weight: number;
603
+ }
604
+ interface UnionMember4 {
605
+ /**
606
+ * Unique identifier for the block
607
+ */
608
+ id: string;
609
+ /**
610
+ * Block type identifier
611
+ */
612
+ blockType: 'POLITENESS';
613
+ /**
614
+ * Optional description of what this block evaluates
615
+ */
616
+ description: string | null;
617
+ /**
618
+ * Display name of the evaluation block
619
+ */
620
+ name: string;
621
+ /**
622
+ * Order in which this block is executed
623
+ */
624
+ orderIndex: number;
625
+ /**
626
+ * Minimum politeness score threshold (0-1)
627
+ */
628
+ threshold: number;
629
+ /**
630
+ * Weight of this block in the overall evaluation score (0-100)
631
+ */
632
+ weight: number;
633
+ }
634
+ interface UnionMember5 {
635
+ /**
636
+ * Unique identifier for the block
637
+ */
638
+ id: string;
639
+ /**
640
+ * Block type identifier
641
+ */
642
+ blockType: 'SENTIMENT';
643
+ /**
644
+ * Optional description of what this block evaluates
645
+ */
646
+ description: string | null;
647
+ /**
648
+ * Display name of the evaluation block
649
+ */
650
+ name: string;
651
+ /**
652
+ * Order in which this block is executed
653
+ */
654
+ orderIndex: number;
655
+ /**
656
+ * Minimum sentiment score threshold (0-1)
657
+ */
658
+ threshold: number;
659
+ /**
660
+ * Weight of this block in the overall evaluation score (0-100)
661
+ */
662
+ weight: number;
663
+ }
664
+ interface UnionMember6 {
665
+ /**
666
+ * Unique identifier for the block
667
+ */
668
+ id: string;
669
+ /**
670
+ * Block type identifier
671
+ */
672
+ blockType: 'TOOL_CALLS';
673
+ /**
674
+ * Optional description of what this block evaluates
675
+ */
676
+ description: string | null;
677
+ /**
678
+ * Condition that must be met for tool invocation
679
+ */
680
+ invocationCondition: string | null;
681
+ /**
682
+ * Minimum number of times the tool should be invoked
683
+ */
684
+ minInvocationCount: number | null;
685
+ /**
686
+ * Display name of the evaluation block
687
+ */
688
+ name: string;
689
+ /**
690
+ * Order in which this block is executed
691
+ */
692
+ orderIndex: number;
693
+ /**
694
+ * Whether the tool should be invoked
695
+ */
696
+ shouldBeInvoked: boolean;
697
+ /**
698
+ * ID of the tool definition
699
+ */
700
+ toolDefinitionId: string;
701
+ /**
702
+ * Weight of this block in the overall evaluation score (0-100)
703
+ */
704
+ weight: number;
705
+ }
706
+ interface UnionMember7 {
707
+ /**
708
+ * Unique identifier for the block
709
+ */
710
+ id: string;
711
+ /**
712
+ * Block type identifier
713
+ */
714
+ blockType: 'TOXICITY';
715
+ /**
716
+ * Optional description of what this block evaluates
717
+ */
718
+ description: string | null;
719
+ /**
720
+ * Display name of the evaluation block
721
+ */
722
+ name: string;
723
+ /**
724
+ * Order in which this block is executed
725
+ */
726
+ orderIndex: number;
727
+ /**
728
+ * Maximum allowed toxicity score (0-1)
729
+ */
730
+ threshold: number;
731
+ /**
732
+ * Weight of this block in the overall evaluation score (0-100)
733
+ */
734
+ weight: number;
735
+ }
736
+ interface UnionMember8 {
737
+ /**
738
+ * Unique identifier for the block
739
+ */
740
+ id: string;
741
+ /**
742
+ * Block type identifier
743
+ */
744
+ blockType: 'VOCAL_CUE';
745
+ /**
746
+ * Optional description of what this block evaluates
747
+ */
748
+ description: string | null;
749
+ /**
750
+ * Display name of the evaluation block
751
+ */
752
+ name: string;
753
+ /**
754
+ * Order in which this block is executed
755
+ */
756
+ orderIndex: number;
757
+ /**
758
+ * The vocal cue to detect (e.g., "pace", "tone", "volume")
759
+ */
760
+ selectedCue: string;
761
+ /**
762
+ * Minimum confidence threshold for vocal cue detection (0-1)
763
+ */
764
+ threshold: number;
765
+ /**
766
+ * Weight of this block in the overall evaluation score (0-100)
767
+ */
768
+ weight: number;
769
+ }
770
+ }
771
+ /**
772
+ * Pagination information
773
+ */
774
+ interface Pagination {
775
+ /**
776
+ * Whether there are more evaluators to fetch
777
+ */
778
+ hasMore: boolean;
779
+ /**
780
+ * Cursor for the next page, null if no more pages
781
+ */
782
+ nextCursor: string | null;
783
+ /**
784
+ * Total number of evaluators
785
+ */
786
+ total: number;
787
+ }
788
+ }
45
789
  export interface EvaluationGetJobResponse {
46
790
  /**
47
791
  * Evaluation job response payload
@@ -126,107 +870,138 @@ export declare namespace EvaluationGetJobRunsResponse {
126
870
  namespace Data {
127
871
  interface Data {
128
872
  /**
129
- * ID of the evaluator run
873
+ * All block runs for this evaluator, including skipped ones
130
874
  */
131
- id: string;
875
+ blockRuns: Array<Data.BlockRun>;
876
+ evaluator: Data.Evaluator;
877
+ evidence: Array<Data.Evidence>;
878
+ metrics: Array<Data.Metric>;
132
879
  /**
133
- * When the evaluator run completed
134
- */
135
- completedAt: string | null;
136
- /**
137
- * Evaluator of the evaluator run
880
+ * Status of the evaluator run
138
881
  */
139
- evaluator: Data.Evaluator | null;
882
+ status: 'PENDING' | 'IN_PROGRESS' | 'COMPLETED' | 'FAILED';
140
883
  /**
141
- * Evidence of the evaluator run
884
+ * ID of the evaluator run
142
885
  */
143
- evidence: Array<Data.Evidence> | null;
886
+ id?: string;
144
887
  /**
145
- * Metrics of the evaluator run
888
+ * When the evaluator run completed
146
889
  */
147
- metrics: Array<Data.Metric> | null;
890
+ completedAt?: string | null;
148
891
  /**
149
- * Score of the evaluator run
892
+ * Score of the evaluation run (0-1)
150
893
  */
151
- score: number | null;
894
+ score?: number | null;
152
895
  /**
153
- * Score classification of the evaluator run
896
+ * Score classification of the evaluator run based on score threshold (IRRELEVANT
897
+ * is mapped to SKIPPED)
154
898
  */
155
- scoreClassification: 'SUCCESS' | 'FAILURE' | 'IRRELEVANT' | null;
899
+ scoreClassification?: 'SUCCESS' | 'FAILURE' | 'SKIPPED' | null;
156
900
  /**
157
901
  * When the evaluator run started
158
902
  */
159
- startedAt: string | null;
903
+ startedAt?: string | null;
160
904
  /**
161
- * Status of the evaluator run
905
+ * Summary of the evaluation run
162
906
  */
163
- status: 'PENDING' | 'IN_PROGRESS' | 'COMPLETED' | 'FAILED';
164
- /**
165
- * Summary of the evaluator run
166
- */
167
- summary: string | null;
907
+ summary?: string | null;
168
908
  }
169
909
  namespace Data {
170
- /**
171
- * Evaluator of the evaluator run
172
- */
910
+ interface BlockRun {
911
+ /**
912
+ * ID of the block definition
913
+ */
914
+ blockDefinitionId: string;
915
+ /**
916
+ * Name of the evaluation block
917
+ */
918
+ blockName: string;
919
+ /**
920
+ * ID of the block run instance
921
+ */
922
+ blockRunId: string;
923
+ /**
924
+ * When the block run was created
925
+ */
926
+ createdAt: string;
927
+ /**
928
+ * Reason for the outcome (pass/fail explanation or skip reason)
929
+ */
930
+ reason: string | null;
931
+ /**
932
+ * Result of the block run
933
+ */
934
+ result: 'PASSED' | 'FAILED' | 'SKIPPED' | null;
935
+ /**
936
+ * Score of the block run (0-1)
937
+ */
938
+ score: number | null;
939
+ /**
940
+ * Status of the block run
941
+ */
942
+ status: 'PENDING' | 'RUNNING' | 'COMPLETED' | 'FAILED';
943
+ }
173
944
  interface Evaluator {
174
945
  /**
175
946
  * ID of the evaluator
176
947
  */
177
- id: string | null;
948
+ id: string;
178
949
  /**
179
950
  * Name of the evaluator
180
951
  */
181
- name: string | null;
952
+ name: string;
953
+ /**
954
+ * Weight of the evaluator
955
+ */
956
+ weight?: number;
182
957
  }
183
958
  interface Evidence {
184
959
  /**
185
- * ID of the evidence
960
+ * Comment text of the evidence
186
961
  */
187
- id: string | null;
962
+ commentText: string | null;
188
963
  /**
189
- * Comment on the evidence
964
+ * Created at of the evidence
190
965
  */
191
- commentText: string | null;
966
+ createdAt: string;
192
967
  /**
193
- * Whether this is a positive example of the metric
968
+ * Is positive of the evidence
194
969
  */
195
- isPositive: boolean | null;
970
+ isPositive: boolean;
196
971
  /**
197
- * Snippet of the evidence
972
+ * Snippet text of the evidence
198
973
  */
199
- snippetText: string | null;
974
+ snippetText: string;
200
975
  }
201
976
  interface Metric {
202
- /**
203
- * ID of the metric
204
- */
205
- id: string | null;
206
977
  /**
207
978
  * Boolean value of the metric
208
979
  */
209
980
  booleanValue: boolean | null;
210
981
  /**
211
- * Confidence of the metric
982
+ * Confidence level of the metric (0-1)
212
983
  */
213
984
  confidence: number | null;
985
+ /**
986
+ * Created at of the metric
987
+ */
988
+ createdAt: string;
214
989
  /**
215
990
  * Name of the metric
216
991
  */
217
- name: string | null;
992
+ name: string;
218
993
  /**
219
994
  * Numeric value of the metric
220
995
  */
221
996
  numericValue: number | null;
222
997
  /**
223
- * Reasoning for the metric
998
+ * Reasoning of the metric
224
999
  */
225
1000
  reasoning: string | null;
226
1001
  /**
227
1002
  * Role of the metric
228
1003
  */
229
- role: 'PRIMARY' | 'SECONDARY' | null;
1004
+ role: string;
230
1005
  /**
231
1006
  * Text value of the metric
232
1007
  */
@@ -234,7 +1009,7 @@ export declare namespace EvaluationGetJobRunsResponse {
234
1009
  /**
235
1010
  * Value type of the metric
236
1011
  */
237
- valueType: 'NUMERIC' | 'BOOLEAN' | 'TEXT' | null;
1012
+ valueType: string;
238
1013
  }
239
1014
  }
240
1015
  /**
@@ -498,7 +1273,13 @@ export declare namespace EvaluationCreateJobParams {
498
1273
  }
499
1274
  }
500
1275
  export interface EvaluationGetEvaluatorsParams {
1276
+ /**
1277
+ * Cursor for pagination - evaluator ID to start after
1278
+ */
501
1279
  after?: string;
1280
+ /**
1281
+ * Maximum number of evaluators to return (default: 20, max: 50)
1282
+ */
502
1283
  limit?: string;
503
1284
  }
504
1285
  export interface EvaluationGetJobRunsParams {