@ls-stack/agent-eval 0.39.0 → 0.40.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-DD-8kx5H.mjs → app-0k8Y1OBk.mjs} +4 -4
- package/dist/apps/web/dist/assets/index-C4v6dWcv.js +140 -0
- package/dist/apps/web/dist/assets/index-C58_zLA9.css +1 -0
- package/dist/apps/web/dist/index.html +2 -2
- package/dist/bin.mjs +1 -1
- package/dist/{cli-BUX6tr9J.mjs → cli-Sg8UdOnm.mjs} +6 -4
- package/dist/index.d.mts +93 -88
- package/dist/index.mjs +4 -4
- package/dist/runChild.mjs +1 -1
- package/dist/{runOrchestration-BhUFWvq9.mjs → runOrchestration-CTzVNrDP.mjs} +28 -32
- package/dist/{runner-B1wfPKNH.mjs → runner-Bb9JdFkg.mjs} +2 -2
- package/dist/{runner-CoRf7Vef.mjs → runner-njK_CtXC.mjs} +1 -1
- package/dist/src-BZzPFS8r.mjs +3 -0
- package/package.json +2 -1
- package/skills/agent-eval/SKILL.md +8 -7
- package/dist/apps/web/dist/assets/index-C6PgBOfP.css +0 -1
- package/dist/apps/web/dist/assets/index-CO86PsY-.js +0 -140
- package/dist/src-BwJ5tod2.mjs +0 -3
package/dist/index.d.mts
CHANGED
|
@@ -1,4 +1,5 @@
|
|
|
1
1
|
import { z, z as z$1 } from "zod/v4";
|
|
2
|
+
import dayjs from "dayjs";
|
|
2
3
|
import { Blob, File } from "node:buffer";
|
|
3
4
|
|
|
4
5
|
//#region ../runner/dist/index.d.mts
|
|
@@ -2147,7 +2148,7 @@ type EvalDefinitionBase<TInput = unknown, TOutputs extends EvalOutputs = EvalOut
|
|
|
2147
2148
|
*/
|
|
2148
2149
|
startTime?: EvalStartTime;
|
|
2149
2150
|
/**
|
|
2150
|
-
* Freeze the eval Date clock at `startTime` until `advanceEvalTime(...)`
|
|
2151
|
+
* Freeze the eval Date clock at `startTime` until `evalTime.advance(...)`
|
|
2151
2152
|
* moves it manually. Defaults to `false`, so eval time advances with real
|
|
2152
2153
|
* elapsed time from the configured `startTime`.
|
|
2153
2154
|
*/
|
|
@@ -2510,8 +2511,6 @@ type EvalCaseScope = {
|
|
|
2510
2511
|
* modules imported while a run is being prepared.
|
|
2511
2512
|
*/
|
|
2512
2513
|
type EvalRuntimeScope = 'env' | 'cases' | 'eval' | 'derive' | 'outputsSchema' | 'scorer';
|
|
2513
|
-
/** Time unit accepted by `advanceEvalTime(unit, amount)`. */
|
|
2514
|
-
type EvalTimeUnit = 'millisecond' | 'milliseconds' | 'second' | 'seconds' | 'minute' | 'minutes' | 'hour' | 'hours' | 'day' | 'days';
|
|
2515
2514
|
type EvalLogLevelInput = RunLogLevel$1 | 'warning';
|
|
2516
2515
|
/** Error thrown when an eval assertion fails during case execution. */
|
|
2517
2516
|
declare class EvalAssertionError extends Error {
|
|
@@ -2519,21 +2518,27 @@ declare class EvalAssertionError extends Error {
|
|
|
2519
2518
|
}
|
|
2520
2519
|
/** Return the shifted wall-clock time for a stored eval clock state. */
|
|
2521
2520
|
/**
|
|
2522
|
-
*
|
|
2521
|
+
* Eval time helpers for reading and moving the active eval clock.
|
|
2523
2522
|
*
|
|
2524
|
-
*
|
|
2525
|
-
*
|
|
2523
|
+
* `startTime` is a Dayjs object for the wall-clock start captured for the
|
|
2524
|
+
* active eval. For `startTime: 'now'`, it reflects the real time captured when
|
|
2525
|
+
* the eval clock context was created. Dayjs objects are immutable, so
|
|
2526
|
+
* `evalTime.startTime.add(5, 'minutes')` computes a derived time without
|
|
2527
|
+
* moving the active eval clock.
|
|
2526
2528
|
*/
|
|
2527
|
-
declare
|
|
2529
|
+
declare const evalTime: {
|
|
2530
|
+
/** Create a Dayjs object with the same arguments as `dayjs(...)`. */dayjs: typeof dayjs; /** Dayjs wall-clock start captured for the active eval. */
|
|
2531
|
+
readonly startTime: dayjs.Dayjs;
|
|
2532
|
+
/**
|
|
2533
|
+
* Move the active shifted Date clock and return the new current eval time.
|
|
2534
|
+
*
|
|
2535
|
+
* Throws outside an active shifted eval clock. Evals that set
|
|
2536
|
+
* `startTime: 'now'` use the real current clock unless `freezeTime: true` is
|
|
2537
|
+
* also set.
|
|
2538
|
+
*/
|
|
2539
|
+
advance: (amount: number, unit: dayjs.ManipulateType) => dayjs.Dayjs;
|
|
2540
|
+
};
|
|
2528
2541
|
/** Execute a callback with the eval Date clock shifted from `startTime`. */
|
|
2529
|
-
/**
|
|
2530
|
-
* Advance the active eval's shifted Date clock and return the new time.
|
|
2531
|
-
*
|
|
2532
|
-
* Throws outside an active shifted eval clock. Evals that set
|
|
2533
|
-
* `startTime: 'now'` use the real current clock unless `freezeTime: true` is
|
|
2534
|
-
* also set.
|
|
2535
|
-
*/
|
|
2536
|
-
declare function advanceEvalTime(unit: EvalTimeUnit, amount: number): Date;
|
|
2537
2542
|
/** Return the current eval scope for the active async context, if any. */
|
|
2538
2543
|
declare function getCurrentScope(): EvalCaseScope | undefined;
|
|
2539
2544
|
/**
|
|
@@ -3036,9 +3041,9 @@ declare const traceAttributeDisplaySchema: z$1.ZodObject<{
|
|
|
3036
3041
|
subtree: "subtree";
|
|
3037
3042
|
}>>;
|
|
3038
3043
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3039
|
-
all: "all";
|
|
3040
|
-
last: "last";
|
|
3041
3044
|
sum: "sum";
|
|
3045
|
+
last: "last";
|
|
3046
|
+
all: "all";
|
|
3042
3047
|
}>>;
|
|
3043
3048
|
}, z$1.core.$strip>;
|
|
3044
3049
|
/**
|
|
@@ -3072,9 +3077,9 @@ declare const traceDisplayConfigSchema: z$1.ZodObject<{
|
|
|
3072
3077
|
subtree: "subtree";
|
|
3073
3078
|
}>>;
|
|
3074
3079
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3075
|
-
all: "all";
|
|
3076
|
-
last: "last";
|
|
3077
3080
|
sum: "sum";
|
|
3081
|
+
last: "last";
|
|
3082
|
+
all: "all";
|
|
3078
3083
|
}>>;
|
|
3079
3084
|
}, z$1.core.$strip>>>;
|
|
3080
3085
|
}, z$1.core.$strip>;
|
|
@@ -3112,9 +3117,9 @@ declare const traceAttributeDisplayInputSchema: z$1.ZodObject<{
|
|
|
3112
3117
|
subtree: "subtree";
|
|
3113
3118
|
}>>;
|
|
3114
3119
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3115
|
-
all: "all";
|
|
3116
|
-
last: "last";
|
|
3117
3120
|
sum: "sum";
|
|
3121
|
+
last: "last";
|
|
3122
|
+
all: "all";
|
|
3118
3123
|
}>>;
|
|
3119
3124
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3120
3125
|
}, z$1.core.$strip>;
|
|
@@ -3150,9 +3155,9 @@ declare const traceDisplayInputConfigSchema: z$1.ZodObject<{
|
|
|
3150
3155
|
subtree: "subtree";
|
|
3151
3156
|
}>>;
|
|
3152
3157
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3153
|
-
all: "all";
|
|
3154
|
-
last: "last";
|
|
3155
3158
|
sum: "sum";
|
|
3159
|
+
last: "last";
|
|
3160
|
+
all: "all";
|
|
3156
3161
|
}>>;
|
|
3157
3162
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3158
3163
|
}, z$1.core.$strip>>>;
|
|
@@ -3189,8 +3194,8 @@ declare const traceSpanSchema: z$1.ZodObject<{
|
|
|
3189
3194
|
status: z$1.ZodEnum<{
|
|
3190
3195
|
error: "error";
|
|
3191
3196
|
running: "running";
|
|
3192
|
-
ok: "ok";
|
|
3193
3197
|
cancelled: "cancelled";
|
|
3198
|
+
ok: "ok";
|
|
3194
3199
|
}>;
|
|
3195
3200
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3196
3201
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3231,11 +3236,11 @@ declare const evalFreshnessStatusSchema: z$1.ZodEnum<{
|
|
|
3231
3236
|
type EvalFreshnessStatus = z$1.infer<typeof evalFreshnessStatusSchema>;
|
|
3232
3237
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3233
3238
|
declare const evalStatAggregateSchema: z$1.ZodEnum<{
|
|
3234
|
-
last: "last";
|
|
3235
|
-
sum: "sum";
|
|
3236
3239
|
avg: "avg";
|
|
3237
3240
|
min: "min";
|
|
3238
3241
|
max: "max";
|
|
3242
|
+
sum: "sum";
|
|
3243
|
+
last: "last";
|
|
3239
3244
|
}>;
|
|
3240
3245
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3241
3246
|
type EvalStatAggregate = z$1.infer<typeof evalStatAggregateSchema>;
|
|
@@ -3259,11 +3264,11 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
3259
3264
|
key: z$1.ZodString;
|
|
3260
3265
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3261
3266
|
aggregate: z$1.ZodEnum<{
|
|
3262
|
-
last: "last";
|
|
3263
|
-
sum: "sum";
|
|
3264
3267
|
avg: "avg";
|
|
3265
3268
|
min: "min";
|
|
3266
3269
|
max: "max";
|
|
3270
|
+
sum: "sum";
|
|
3271
|
+
last: "last";
|
|
3267
3272
|
}>;
|
|
3268
3273
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3269
3274
|
number: "number";
|
|
@@ -3301,11 +3306,11 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
|
|
|
3301
3306
|
key: z$1.ZodString;
|
|
3302
3307
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3303
3308
|
aggregate: z$1.ZodEnum<{
|
|
3304
|
-
last: "last";
|
|
3305
|
-
sum: "sum";
|
|
3306
3309
|
avg: "avg";
|
|
3307
3310
|
min: "min";
|
|
3308
3311
|
max: "max";
|
|
3312
|
+
sum: "sum";
|
|
3313
|
+
last: "last";
|
|
3309
3314
|
}>;
|
|
3310
3315
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3311
3316
|
number: "number";
|
|
@@ -3381,10 +3386,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3381
3386
|
caseIds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
3382
3387
|
lastRunStatus: z$1.ZodNullable<z$1.ZodEnum<{
|
|
3383
3388
|
error: "error";
|
|
3384
|
-
running: "running";
|
|
3385
|
-
cancelled: "cancelled";
|
|
3386
3389
|
pass: "pass";
|
|
3387
3390
|
fail: "fail";
|
|
3391
|
+
running: "running";
|
|
3392
|
+
cancelled: "cancelled";
|
|
3388
3393
|
unscored: "unscored";
|
|
3389
3394
|
}>>;
|
|
3390
3395
|
stats: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
@@ -3403,11 +3408,11 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3403
3408
|
key: z$1.ZodString;
|
|
3404
3409
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3405
3410
|
aggregate: z$1.ZodEnum<{
|
|
3406
|
-
last: "last";
|
|
3407
|
-
sum: "sum";
|
|
3408
3411
|
avg: "avg";
|
|
3409
3412
|
min: "min";
|
|
3410
3413
|
max: "max";
|
|
3414
|
+
sum: "sum";
|
|
3415
|
+
last: "last";
|
|
3411
3416
|
}>;
|
|
3412
3417
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3413
3418
|
number: "number";
|
|
@@ -3445,9 +3450,9 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3445
3450
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3446
3451
|
success: "success";
|
|
3447
3452
|
error: "error";
|
|
3448
|
-
warning: "warning";
|
|
3449
3453
|
accent: "accent";
|
|
3450
3454
|
accentDim: "accentDim";
|
|
3455
|
+
warning: "warning";
|
|
3451
3456
|
textMuted: "textMuted";
|
|
3452
3457
|
}>>;
|
|
3453
3458
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3458,10 +3463,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3458
3463
|
source: z$1.ZodLiteral<"column">;
|
|
3459
3464
|
key: z$1.ZodString;
|
|
3460
3465
|
aggregate: z$1.ZodEnum<{
|
|
3461
|
-
sum: "sum";
|
|
3462
3466
|
avg: "avg";
|
|
3463
3467
|
min: "min";
|
|
3464
3468
|
max: "max";
|
|
3469
|
+
sum: "sum";
|
|
3465
3470
|
latest: "latest";
|
|
3466
3471
|
passThresholdRate: "passThresholdRate";
|
|
3467
3472
|
}>;
|
|
@@ -3469,9 +3474,9 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3469
3474
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3470
3475
|
success: "success";
|
|
3471
3476
|
error: "error";
|
|
3472
|
-
warning: "warning";
|
|
3473
3477
|
accent: "accent";
|
|
3474
3478
|
accentDim: "accentDim";
|
|
3479
|
+
warning: "warning";
|
|
3475
3480
|
textMuted: "textMuted";
|
|
3476
3481
|
}>>;
|
|
3477
3482
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3500,10 +3505,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3500
3505
|
source: z$1.ZodLiteral<"column">;
|
|
3501
3506
|
key: z$1.ZodString;
|
|
3502
3507
|
aggregate: z$1.ZodEnum<{
|
|
3503
|
-
sum: "sum";
|
|
3504
3508
|
avg: "avg";
|
|
3505
3509
|
min: "min";
|
|
3506
3510
|
max: "max";
|
|
3511
|
+
sum: "sum";
|
|
3507
3512
|
latest: "latest";
|
|
3508
3513
|
passThresholdRate: "passThresholdRate";
|
|
3509
3514
|
}>;
|
|
@@ -3599,11 +3604,11 @@ declare const caseRowSchema: z$1.ZodObject<{
|
|
|
3599
3604
|
evalId: z$1.ZodString;
|
|
3600
3605
|
status: z$1.ZodEnum<{
|
|
3601
3606
|
error: "error";
|
|
3607
|
+
pass: "pass";
|
|
3608
|
+
fail: "fail";
|
|
3602
3609
|
running: "running";
|
|
3603
3610
|
cancelled: "cancelled";
|
|
3604
3611
|
pending: "pending";
|
|
3605
|
-
pass: "pass";
|
|
3606
|
-
fail: "fail";
|
|
3607
3612
|
}>;
|
|
3608
3613
|
durationMs: z$1.ZodNullable<z$1.ZodNumber>;
|
|
3609
3614
|
costUsd: z$1.ZodOptional<z$1.ZodNullable<z$1.ZodNumber>>;
|
|
@@ -3695,8 +3700,8 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3695
3700
|
status: z$1.ZodEnum<{
|
|
3696
3701
|
error: "error";
|
|
3697
3702
|
running: "running";
|
|
3698
|
-
ok: "ok";
|
|
3699
3703
|
cancelled: "cancelled";
|
|
3704
|
+
ok: "ok";
|
|
3700
3705
|
}>;
|
|
3701
3706
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3702
3707
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3746,9 +3751,9 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3746
3751
|
subtree: "subtree";
|
|
3747
3752
|
}>>;
|
|
3748
3753
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3749
|
-
all: "all";
|
|
3750
|
-
last: "last";
|
|
3751
3754
|
sum: "sum";
|
|
3755
|
+
last: "last";
|
|
3756
|
+
all: "all";
|
|
3752
3757
|
}>>;
|
|
3753
3758
|
}, z$1.core.$strip>>>;
|
|
3754
3759
|
}, z$1.core.$strip>;
|
|
@@ -3763,11 +3768,11 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3763
3768
|
evalId: z$1.ZodString;
|
|
3764
3769
|
status: z$1.ZodEnum<{
|
|
3765
3770
|
error: "error";
|
|
3771
|
+
pass: "pass";
|
|
3772
|
+
fail: "fail";
|
|
3766
3773
|
running: "running";
|
|
3767
3774
|
cancelled: "cancelled";
|
|
3768
3775
|
pending: "pending";
|
|
3769
|
-
pass: "pass";
|
|
3770
|
-
fail: "fail";
|
|
3771
3776
|
}>;
|
|
3772
3777
|
input: z$1.ZodUnknown;
|
|
3773
3778
|
trace: z$1.ZodArray<z$1.ZodObject<{
|
|
@@ -3781,8 +3786,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3781
3786
|
status: z$1.ZodEnum<{
|
|
3782
3787
|
error: "error";
|
|
3783
3788
|
running: "running";
|
|
3784
|
-
ok: "ok";
|
|
3785
3789
|
cancelled: "cancelled";
|
|
3790
|
+
ok: "ok";
|
|
3786
3791
|
}>;
|
|
3787
3792
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3788
3793
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3832,9 +3837,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3832
3837
|
subtree: "subtree";
|
|
3833
3838
|
}>>;
|
|
3834
3839
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3835
|
-
all: "all";
|
|
3836
|
-
last: "last";
|
|
3837
3840
|
sum: "sum";
|
|
3841
|
+
last: "last";
|
|
3842
|
+
all: "all";
|
|
3838
3843
|
}>>;
|
|
3839
3844
|
}, z$1.core.$strip>>>;
|
|
3840
3845
|
}, z$1.core.$strip>;
|
|
@@ -3850,8 +3855,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3850
3855
|
status: z$1.ZodEnum<{
|
|
3851
3856
|
error: "error";
|
|
3852
3857
|
running: "running";
|
|
3853
|
-
ok: "ok";
|
|
3854
3858
|
cancelled: "cancelled";
|
|
3859
|
+
ok: "ok";
|
|
3855
3860
|
}>;
|
|
3856
3861
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3857
3862
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3901,9 +3906,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3901
3906
|
subtree: "subtree";
|
|
3902
3907
|
}>>;
|
|
3903
3908
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3904
|
-
all: "all";
|
|
3905
|
-
last: "last";
|
|
3906
3909
|
sum: "sum";
|
|
3910
|
+
last: "last";
|
|
3911
|
+
all: "all";
|
|
3907
3912
|
}>>;
|
|
3908
3913
|
}, z$1.core.$strip>>>;
|
|
3909
3914
|
}, z$1.core.$strip>;
|
|
@@ -3963,10 +3968,10 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3963
3968
|
namespace: z$1.ZodString;
|
|
3964
3969
|
key: z$1.ZodString;
|
|
3965
3970
|
status: z$1.ZodEnum<{
|
|
3966
|
-
bypass: "bypass";
|
|
3967
|
-
refresh: "refresh";
|
|
3968
3971
|
hit: "hit";
|
|
3969
3972
|
miss: "miss";
|
|
3973
|
+
refresh: "refresh";
|
|
3974
|
+
bypass: "bypass";
|
|
3970
3975
|
}>;
|
|
3971
3976
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
3972
3977
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -4037,10 +4042,10 @@ declare const evalChartBuiltinMetricSchema: z$1.ZodEnum<{
|
|
|
4037
4042
|
type EvalChartBuiltinMetric = z$1.infer<typeof evalChartBuiltinMetricSchema>;
|
|
4038
4043
|
/** Reducer applied to a numeric column across all cases of a single run. */
|
|
4039
4044
|
declare const evalChartAggregateSchema: z$1.ZodEnum<{
|
|
4040
|
-
sum: "sum";
|
|
4041
4045
|
avg: "avg";
|
|
4042
4046
|
min: "min";
|
|
4043
4047
|
max: "max";
|
|
4048
|
+
sum: "sum";
|
|
4044
4049
|
latest: "latest";
|
|
4045
4050
|
passThresholdRate: "passThresholdRate";
|
|
4046
4051
|
}>;
|
|
@@ -4053,9 +4058,9 @@ type EvalChartAggregate = z$1.infer<typeof evalChartAggregateSchema>;
|
|
|
4053
4058
|
declare const evalChartColorSchema: z$1.ZodEnum<{
|
|
4054
4059
|
success: "success";
|
|
4055
4060
|
error: "error";
|
|
4056
|
-
warning: "warning";
|
|
4057
4061
|
accent: "accent";
|
|
4058
4062
|
accentDim: "accentDim";
|
|
4063
|
+
warning: "warning";
|
|
4059
4064
|
textMuted: "textMuted";
|
|
4060
4065
|
}>;
|
|
4061
4066
|
/** Semantic color token resolved to a theme color by the web UI. */
|
|
@@ -4082,9 +4087,9 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4082
4087
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4083
4088
|
success: "success";
|
|
4084
4089
|
error: "error";
|
|
4085
|
-
warning: "warning";
|
|
4086
4090
|
accent: "accent";
|
|
4087
4091
|
accentDim: "accentDim";
|
|
4092
|
+
warning: "warning";
|
|
4088
4093
|
textMuted: "textMuted";
|
|
4089
4094
|
}>>;
|
|
4090
4095
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4095,10 +4100,10 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4095
4100
|
source: z$1.ZodLiteral<"column">;
|
|
4096
4101
|
key: z$1.ZodString;
|
|
4097
4102
|
aggregate: z$1.ZodEnum<{
|
|
4098
|
-
sum: "sum";
|
|
4099
4103
|
avg: "avg";
|
|
4100
4104
|
min: "min";
|
|
4101
4105
|
max: "max";
|
|
4106
|
+
sum: "sum";
|
|
4102
4107
|
latest: "latest";
|
|
4103
4108
|
passThresholdRate: "passThresholdRate";
|
|
4104
4109
|
}>;
|
|
@@ -4106,9 +4111,9 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4106
4111
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4107
4112
|
success: "success";
|
|
4108
4113
|
error: "error";
|
|
4109
|
-
warning: "warning";
|
|
4110
4114
|
accent: "accent";
|
|
4111
4115
|
accentDim: "accentDim";
|
|
4116
|
+
warning: "warning";
|
|
4112
4117
|
textMuted: "textMuted";
|
|
4113
4118
|
}>>;
|
|
4114
4119
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4130,10 +4135,10 @@ declare const evalChartTooltipExtraSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObj
|
|
|
4130
4135
|
source: z$1.ZodLiteral<"column">;
|
|
4131
4136
|
key: z$1.ZodString;
|
|
4132
4137
|
aggregate: z$1.ZodEnum<{
|
|
4133
|
-
sum: "sum";
|
|
4134
4138
|
avg: "avg";
|
|
4135
4139
|
min: "min";
|
|
4136
4140
|
max: "max";
|
|
4141
|
+
sum: "sum";
|
|
4137
4142
|
latest: "latest";
|
|
4138
4143
|
passThresholdRate: "passThresholdRate";
|
|
4139
4144
|
}>;
|
|
@@ -4165,9 +4170,9 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4165
4170
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4166
4171
|
success: "success";
|
|
4167
4172
|
error: "error";
|
|
4168
|
-
warning: "warning";
|
|
4169
4173
|
accent: "accent";
|
|
4170
4174
|
accentDim: "accentDim";
|
|
4175
|
+
warning: "warning";
|
|
4171
4176
|
textMuted: "textMuted";
|
|
4172
4177
|
}>>;
|
|
4173
4178
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4178,10 +4183,10 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4178
4183
|
source: z$1.ZodLiteral<"column">;
|
|
4179
4184
|
key: z$1.ZodString;
|
|
4180
4185
|
aggregate: z$1.ZodEnum<{
|
|
4181
|
-
sum: "sum";
|
|
4182
4186
|
avg: "avg";
|
|
4183
4187
|
min: "min";
|
|
4184
4188
|
max: "max";
|
|
4189
|
+
sum: "sum";
|
|
4185
4190
|
latest: "latest";
|
|
4186
4191
|
passThresholdRate: "passThresholdRate";
|
|
4187
4192
|
}>;
|
|
@@ -4189,9 +4194,9 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4189
4194
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4190
4195
|
success: "success";
|
|
4191
4196
|
error: "error";
|
|
4192
|
-
warning: "warning";
|
|
4193
4197
|
accent: "accent";
|
|
4194
4198
|
accentDim: "accentDim";
|
|
4199
|
+
warning: "warning";
|
|
4195
4200
|
textMuted: "textMuted";
|
|
4196
4201
|
}>>;
|
|
4197
4202
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4220,10 +4225,10 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4220
4225
|
source: z$1.ZodLiteral<"column">;
|
|
4221
4226
|
key: z$1.ZodString;
|
|
4222
4227
|
aggregate: z$1.ZodEnum<{
|
|
4223
|
-
sum: "sum";
|
|
4224
4228
|
avg: "avg";
|
|
4225
4229
|
min: "min";
|
|
4226
4230
|
max: "max";
|
|
4231
|
+
sum: "sum";
|
|
4227
4232
|
latest: "latest";
|
|
4228
4233
|
passThresholdRate: "passThresholdRate";
|
|
4229
4234
|
}>;
|
|
@@ -4255,9 +4260,9 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4255
4260
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4256
4261
|
success: "success";
|
|
4257
4262
|
error: "error";
|
|
4258
|
-
warning: "warning";
|
|
4259
4263
|
accent: "accent";
|
|
4260
4264
|
accentDim: "accentDim";
|
|
4265
|
+
warning: "warning";
|
|
4261
4266
|
textMuted: "textMuted";
|
|
4262
4267
|
}>>;
|
|
4263
4268
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4268,10 +4273,10 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4268
4273
|
source: z$1.ZodLiteral<"column">;
|
|
4269
4274
|
key: z$1.ZodString;
|
|
4270
4275
|
aggregate: z$1.ZodEnum<{
|
|
4271
|
-
sum: "sum";
|
|
4272
4276
|
avg: "avg";
|
|
4273
4277
|
min: "min";
|
|
4274
4278
|
max: "max";
|
|
4279
|
+
sum: "sum";
|
|
4275
4280
|
latest: "latest";
|
|
4276
4281
|
passThresholdRate: "passThresholdRate";
|
|
4277
4282
|
}>;
|
|
@@ -4279,9 +4284,9 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4279
4284
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4280
4285
|
success: "success";
|
|
4281
4286
|
error: "error";
|
|
4282
|
-
warning: "warning";
|
|
4283
4287
|
accent: "accent";
|
|
4284
4288
|
accentDim: "accentDim";
|
|
4289
|
+
warning: "warning";
|
|
4285
4290
|
textMuted: "textMuted";
|
|
4286
4291
|
}>>;
|
|
4287
4292
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4310,10 +4315,10 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4310
4315
|
source: z$1.ZodLiteral<"column">;
|
|
4311
4316
|
key: z$1.ZodString;
|
|
4312
4317
|
aggregate: z$1.ZodEnum<{
|
|
4313
|
-
sum: "sum";
|
|
4314
4318
|
avg: "avg";
|
|
4315
4319
|
min: "min";
|
|
4316
4320
|
max: "max";
|
|
4321
|
+
sum: "sum";
|
|
4317
4322
|
latest: "latest";
|
|
4318
4323
|
passThresholdRate: "passThresholdRate";
|
|
4319
4324
|
}>;
|
|
@@ -4341,9 +4346,9 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4341
4346
|
evalSourceFingerprints: z$1.ZodDefault<z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodString>>>;
|
|
4342
4347
|
target: z$1.ZodObject<{
|
|
4343
4348
|
mode: z$1.ZodEnum<{
|
|
4349
|
+
caseIds: "caseIds";
|
|
4344
4350
|
all: "all";
|
|
4345
4351
|
evalIds: "evalIds";
|
|
4346
|
-
caseIds: "caseIds";
|
|
4347
4352
|
}>;
|
|
4348
4353
|
evalKeys: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
4349
4354
|
files: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
@@ -4356,9 +4361,9 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4356
4361
|
median: "median";
|
|
4357
4362
|
}>>>;
|
|
4358
4363
|
cacheMode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4359
|
-
use: "use";
|
|
4360
|
-
bypass: "bypass";
|
|
4361
4364
|
refresh: "refresh";
|
|
4365
|
+
bypass: "bypass";
|
|
4366
|
+
use: "use";
|
|
4362
4367
|
}>>;
|
|
4363
4368
|
}, z$1.core.$strip>;
|
|
4364
4369
|
/** Persisted lifecycle metadata for a single eval run. */
|
|
@@ -5164,9 +5169,9 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5164
5169
|
subtree: "subtree";
|
|
5165
5170
|
}>>;
|
|
5166
5171
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5167
|
-
all: "all";
|
|
5168
|
-
last: "last";
|
|
5169
5172
|
sum: "sum";
|
|
5173
|
+
last: "last";
|
|
5174
|
+
all: "all";
|
|
5170
5175
|
}>>;
|
|
5171
5176
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
5172
5177
|
}, z$1.core.$strip>>>;
|
|
@@ -5189,11 +5194,11 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5189
5194
|
key: z$1.ZodString;
|
|
5190
5195
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
5191
5196
|
aggregate: z$1.ZodEnum<{
|
|
5192
|
-
last: "last";
|
|
5193
|
-
sum: "sum";
|
|
5194
5197
|
avg: "avg";
|
|
5195
5198
|
min: "min";
|
|
5196
5199
|
max: "max";
|
|
5200
|
+
sum: "sum";
|
|
5201
|
+
last: "last";
|
|
5197
5202
|
}>;
|
|
5198
5203
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5199
5204
|
number: "number";
|
|
@@ -5542,9 +5547,9 @@ declare function extractApiCalls(spans: EvalTraceSpan[], config: ResolvedApiCall
|
|
|
5542
5547
|
* - `refresh`: never read, always write (forces re-execution and overwrites).
|
|
5543
5548
|
*/
|
|
5544
5549
|
declare const cacheModeSchema: z$1.ZodEnum<{
|
|
5545
|
-
use: "use";
|
|
5546
|
-
bypass: "bypass";
|
|
5547
5550
|
refresh: "refresh";
|
|
5551
|
+
bypass: "bypass";
|
|
5552
|
+
use: "use";
|
|
5548
5553
|
}>;
|
|
5549
5554
|
/** Mode controlling how cached spans behave during a run. */
|
|
5550
5555
|
type CacheMode = z$1.infer<typeof cacheModeSchema>;
|
|
@@ -5565,10 +5570,10 @@ declare const cacheOperationTypeSchema: z$1.ZodEnum<{
|
|
|
5565
5570
|
type CacheOperationType = z$1.infer<typeof cacheOperationTypeSchema>;
|
|
5566
5571
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5567
5572
|
declare const cacheStatusSchema: z$1.ZodEnum<{
|
|
5568
|
-
bypass: "bypass";
|
|
5569
|
-
refresh: "refresh";
|
|
5570
5573
|
hit: "hit";
|
|
5571
5574
|
miss: "miss";
|
|
5575
|
+
refresh: "refresh";
|
|
5576
|
+
bypass: "bypass";
|
|
5572
5577
|
}>;
|
|
5573
5578
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5574
5579
|
type CacheStatus = z$1.infer<typeof cacheStatusSchema>;
|
|
@@ -5585,10 +5590,10 @@ declare const traceCacheRefSchema: z$1.ZodObject<{
|
|
|
5585
5590
|
namespace: z$1.ZodString;
|
|
5586
5591
|
key: z$1.ZodString;
|
|
5587
5592
|
status: z$1.ZodEnum<{
|
|
5588
|
-
bypass: "bypass";
|
|
5589
|
-
refresh: "refresh";
|
|
5590
5593
|
hit: "hit";
|
|
5591
5594
|
miss: "miss";
|
|
5595
|
+
refresh: "refresh";
|
|
5596
|
+
bypass: "bypass";
|
|
5592
5597
|
}>;
|
|
5593
5598
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
5594
5599
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -5666,8 +5671,8 @@ declare const cacheRecordingSchema: z$1.ZodObject<{
|
|
|
5666
5671
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5667
5672
|
error: "error";
|
|
5668
5673
|
running: "running";
|
|
5669
|
-
ok: "ok";
|
|
5670
5674
|
cancelled: "cancelled";
|
|
5675
|
+
ok: "ok";
|
|
5671
5676
|
}>>;
|
|
5672
5677
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5673
5678
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5739,8 +5744,8 @@ declare const cacheEntrySchema: z$1.ZodObject<{
|
|
|
5739
5744
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5740
5745
|
error: "error";
|
|
5741
5746
|
running: "running";
|
|
5742
|
-
ok: "ok";
|
|
5743
5747
|
cancelled: "cancelled";
|
|
5748
|
+
ok: "ok";
|
|
5744
5749
|
}>>;
|
|
5745
5750
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5746
5751
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5828,8 +5833,8 @@ declare const cacheEntryWithDebugKeySchema: z$1.ZodObject<{
|
|
|
5828
5833
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5829
5834
|
error: "error";
|
|
5830
5835
|
running: "running";
|
|
5831
|
-
ok: "ok";
|
|
5832
5836
|
cancelled: "cancelled";
|
|
5837
|
+
ok: "ok";
|
|
5833
5838
|
}>>;
|
|
5834
5839
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5835
5840
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5917,8 +5922,8 @@ declare const cacheFileSchema: z$1.ZodObject<{
|
|
|
5917
5922
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5918
5923
|
error: "error";
|
|
5919
5924
|
running: "running";
|
|
5920
|
-
ok: "ok";
|
|
5921
5925
|
cancelled: "cancelled";
|
|
5926
|
+
ok: "ok";
|
|
5922
5927
|
}>>;
|
|
5923
5928
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5924
5929
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -6092,9 +6097,9 @@ type ConfigReloadState = z$1.infer<typeof configReloadStateSchema>;
|
|
|
6092
6097
|
declare const createRunRequestSchema: z$1.ZodObject<{
|
|
6093
6098
|
target: z$1.ZodObject<{
|
|
6094
6099
|
mode: z$1.ZodEnum<{
|
|
6100
|
+
caseIds: "caseIds";
|
|
6095
6101
|
all: "all";
|
|
6096
6102
|
evalIds: "evalIds";
|
|
6097
|
-
caseIds: "caseIds";
|
|
6098
6103
|
}>;
|
|
6099
6104
|
evalKeys: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
6100
6105
|
files: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
@@ -6105,9 +6110,9 @@ declare const createRunRequestSchema: z$1.ZodObject<{
|
|
|
6105
6110
|
temporary: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
6106
6111
|
cache: z$1.ZodOptional<z$1.ZodObject<{
|
|
6107
6112
|
mode: z$1.ZodDefault<z$1.ZodEnum<{
|
|
6108
|
-
use: "use";
|
|
6109
|
-
bypass: "bypass";
|
|
6110
6113
|
refresh: "refresh";
|
|
6114
|
+
bypass: "bypass";
|
|
6115
|
+
use: "use";
|
|
6111
6116
|
}>>;
|
|
6112
6117
|
}, z$1.core.$strip>>;
|
|
6113
6118
|
manualInputs: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
@@ -6377,4 +6382,4 @@ type ManualInputDescriptor = z$1.infer<typeof manualInputDescriptorSchema>; //#e
|
|
|
6377
6382
|
*/
|
|
6378
6383
|
declare function runCli(argv: string[]): Promise<void>;
|
|
6379
6384
|
//#endregion
|
|
6380
|
-
export { type AgentEvalsConfig, type ApiCallEntry, type ApiCallMetric, type ApiCallMetricFormat, type ApiCallMetricPlacement, type ApiCallMetricValue, type ApiCallsConfigInput, type AssertionFailure, type CacheActivityEntry, type CacheAdapter, type CacheDebugKeyEntry, type CacheDebugKeyFile, type CacheDebugKeyWrite, type CacheEntry, type CacheEntryWithDebugKey, type CacheFile, type CacheHitEntry, type CacheKeyHashInput, type CacheKeyHashOptions, type CacheListItem, type CacheMode, type CacheOperationType, type CacheRecording, type CacheRecordingFrame, type CacheRecordingOp, type CacheScopeContext, type CacheSerializationOptions, type CacheStatus, type CallDerivedAttribute, type CallDerivedAttributeContext, type CallDerivedAttributesConfig, type CallDerivedAttributesFn, type CaptureEvalSpanErrorLevel, type CaptureEvalSpanErrorOptions, type CaseDetail, type CaseRow, type CellValue, type ColumnDef, type ColumnFormat, type ColumnKind, type ConfigReloadState, type ConfigReloadStatus, type CreateRunRequest, DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, type DefaultConfigKey, type DerivedStatus, type DiscoveryIssue, EvalAssertionError, type EvalCacheConfig, type EvalCase, type EvalCaseScope, type EvalChartAggregate, type EvalChartAxis, type EvalChartBuiltinMetric, type EvalChartColor, type EvalChartConfig, type EvalChartMetric, type EvalChartTooltipExtra, type EvalChartType, type EvalChartsConfig, type EvalColumnOverride, type EvalColumns, type EvalDefinition, type EvalDeriveConfig, type EvalDeriveContext, type EvalDeriveFn, type EvalDeriveMap, type EvalDeriveValueFn, type EvalDisplayStatus, type EvalExecuteContext, type EvalExpectation, type EvalFreshnessStatus, type EvalManualInputConfig, type EvalManualScoreDef, type EvalOutputs, type EvalOutputsSchema, type EvalRunner, type EvalRuntimeScope, type EvalScoreContext, type EvalScoreDef, type EvalScoreFn, type EvalSetOutput, type EvalStartTime, type EvalStatAggregate, type EvalStatItem, type EvalStatsConfig, type 
EvalSummary, type
|
|
6385
|
+
// Public export list of this declaration file.
// - Names prefixed with the inline `type` modifier are type-only exports.
// - Names without the modifier (e.g. `DEFAULT_API_CALLS_CONFIG`, `EvalAssertionError`,
//   the `*Schema` identifiers, `defineEval`, `runCli`) are exported as value declarations.
// - `z` is the binding imported from "zod/v4" at the top of this file and is re-exported here.
export { type AgentEvalsConfig, type ApiCallEntry, type ApiCallMetric, type ApiCallMetricFormat, type ApiCallMetricPlacement, type ApiCallMetricValue, type ApiCallsConfigInput, type AssertionFailure, type CacheActivityEntry, type CacheAdapter, type CacheDebugKeyEntry, type CacheDebugKeyFile, type CacheDebugKeyWrite, type CacheEntry, type CacheEntryWithDebugKey, type CacheFile, type CacheHitEntry, type CacheKeyHashInput, type CacheKeyHashOptions, type CacheListItem, type CacheMode, type CacheOperationType, type CacheRecording, type CacheRecordingFrame, type CacheRecordingOp, type CacheScopeContext, type CacheSerializationOptions, type CacheStatus, type CallDerivedAttribute, type CallDerivedAttributeContext, type CallDerivedAttributesConfig, type CallDerivedAttributesFn, type CaptureEvalSpanErrorLevel, type CaptureEvalSpanErrorOptions, type CaseDetail, type CaseRow, type CellValue, type ColumnDef, type ColumnFormat, type ColumnKind, type ConfigReloadState, type ConfigReloadStatus, type CreateRunRequest, DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, type DefaultConfigKey, type DerivedStatus, type DiscoveryIssue, EvalAssertionError, type EvalCacheConfig, type EvalCase, type EvalCaseScope, type EvalChartAggregate, type EvalChartAxis, type EvalChartBuiltinMetric, type EvalChartColor, type EvalChartConfig, type EvalChartMetric, type EvalChartTooltipExtra, type EvalChartType, type EvalChartsConfig, type EvalColumnOverride, type EvalColumns, type EvalDefinition, type EvalDeriveConfig, type EvalDeriveContext, type EvalDeriveFn, type EvalDeriveMap, type EvalDeriveValueFn, type EvalDisplayStatus, type EvalExecuteContext, type EvalExpectation, type EvalFreshnessStatus, type EvalManualInputConfig, type EvalManualScoreDef, type EvalOutputs, type EvalOutputsSchema, type EvalRunner, type EvalRuntimeScope, type EvalScoreContext, type EvalScoreDef, type EvalScoreFn, type EvalSetOutput, type EvalStartTime, type EvalStatAggregate, type EvalStatItem, type EvalStatsConfig, type 
EvalSummary, type EvalTraceSpan, type EvalTraceSpanError, type EvalTraceSpanWarning, type EvalTraceTree, type FileRef, type JsonCell, type LlmCallCostBreakdown, type LlmCallCostCurrency, type LlmCallEntry, type LlmCallMetric, type LlmCallMetricFormat, type LlmCallMetricPlacement, type LlmCallMetricValue, type LlmCallPricing, type LlmCallPricingRate, type LlmCallPricingRegistry, type LlmCallSimulatedTokens, type LlmCallsConfigInput, type LlmCostScenario, type ManualInputDescriptor, type ManualInputFieldDescriptor, type ManualInputFieldKind, type ManualInputFieldOverride, type ManualInputFieldsConfig, type ManualInputFileValue, type ManualInputSelectOption, type MaterializeManualInputFilesResult, type NumberDisplayOptions, type ReadManualInputFileResult, type RemoveDefaultConfig, type RepoFileRef, type ResolvedApiCallMetric, type ResolvedApiCallsConfig, type ResolvedCallDerivedAttribute, type ResolvedLlmCallCostCurrency, type ResolvedLlmCallMetric, type ResolvedLlmCallPricing, type ResolvedLlmCallsConfig, type RunArtifactRef, type RunInEvalScopeOptions, type RunLogEntry, type RunLogLevel, type RunLogLocation, type RunLogPhase, type RunLogsConfigInput, type RunManifest, type RunSummary, type ScalarCell, type ScopedCaseSummary, type ScoreTrace, type SerializedCacheSpan, type SerializedCacheValue, type SpanCacheOptions, type SseEnvelope, type SseEventType, type TraceActiveSpan, type TraceAttributeDisplay, type TraceAttributeDisplayFormat, type TraceAttributeDisplayInput, type TraceAttributeDisplayPlacement, type TraceAttributeTransform, type TraceAttributeTransformContext, type TraceCacheInfo, type TraceCacheRef, type TraceDisplayConfig, type TraceDisplayInputConfig, type TraceSpanInfo, type TrialSelectionMode, type UpdateManualScoreRequest, agentEvalsConfigSchema, apiCallMetricFormatSchema, apiCallMetricPlacementSchema, apiCallMetricSchema, apiCallsConfigSchema, appendToEvalOutput, applyDerivedCallAttributes, assertionFailureSchema, buildCaseKey, buildEvalKey, 
buildTraceTree, cacheDebugKeyEntrySchema, cacheDebugKeyFileSchema, cacheEntrySchema, cacheEntryWithDebugKeySchema, cacheFileSchema, cacheListItemSchema, cacheModeSchema, cacheOperationTypeSchema, cacheRecordingOpSchema, cacheRecordingSchema, cacheStatusSchema, captureEvalSpanError, caseDetailSchema, caseRowSchema, cellValueSchema, cleanupStagedManualInputFiles, columnDefSchema, columnFormatSchema, columnKindSchema, configReloadStateSchema, configReloadStatusSchema, createRunRequestSchema, createRunner, defaultConfigKeySchema, defineEval, deriveScopedSummaryFromCases, deriveStatusFromCaseRows, deriveStatusFromChildStatuses, deserializeCacheRecording, deserializeCacheValue, discoveryIssueSchema, evalAssert, evalChartAggregateSchema, evalChartAxisSchema, evalChartBuiltinMetricSchema, evalChartColorSchema, evalChartConfigSchema, evalChartMetricSchema, evalChartTooltipExtraSchema, evalChartTypeSchema, evalChartsConfigSchema, evalColumnOverrideSchema, evalColumnsSchema, evalDeriveConfigSchema, evalExpect, evalFreshnessStatusSchema, evalLog, evalSpan, evalStatAggregateSchema, evalStatItemSchema, evalStatsConfigSchema, evalSummarySchema, evalTime, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, fileRefSchema, getCaseRowCaseKey, getCaseRowEvalKey, getCurrentScope, getEvalCaseInput, getEvalDisplayStatus, getEvalRegistry, getEvalTitle, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, jsonCellSchema, llmCallCostCurrencySchema, llmCallMetricFormatSchema, llmCallMetricPlacementSchema, llmCallMetricSchema, llmCallPricingRateSchema, llmCallPricingSchema, llmCallsConfigSchema, manualInputBooleanFieldSchema, manualInputDescriptorSchema, manualInputFieldDescriptorSchema, manualInputFileValueSchema, manualInputJsonFieldSchema, manualInputMultilineFieldSchema, manualInputNumberFieldSchema, manualInputSelectFieldSchema, manualInputSelectOptionSchema, manualInputTextFieldSchema, 
materializeManualInputFiles, mergeEvalOutput, nextEvalId, numberDisplayOptionsSchema, readManualInputFile, removeDefaultConfigSchema, repoFile, repoFileRefSchema, resolveApiCallsConfig, resolveLlmCallsConfig, runArtifactRefSchema, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, runLogEntrySchema, runLogLevelSchema, runLogLocationSchema, runLogPhaseSchema, runLogsConfigSchema, runManifestSchema, runSummarySchema, scoreTraceSchema, serializeCacheRecording, serializeCacheValue, serializedCacheSpanSchema, setEvalOutput, setScopeCacheContext, simulateLlmCallCost, simulateTokenAllocation, spanCacheOptionsSchema, sseEnvelopeSchema, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, traceAttributeDisplayFormatSchema, traceAttributeDisplayInputSchema, traceAttributeDisplayPlacementSchema, traceAttributeDisplaySchema, traceCacheRefSchema, traceDisplayConfigSchema, traceDisplayInputConfigSchema, traceSpanErrorSchema, traceSpanKindSchema, traceSpanSchema, traceSpanWarningSchema, trialSelectionModeSchema, updateManualScoreRequestSchema, z };
|