@ls-stack/agent-eval 0.30.0 → 0.31.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-CbOZBHju.mjs → app-BrSMRTpy.mjs} +4 -4
- package/dist/apps/web/dist/assets/{index-DEikHy2a.js → index-CPcVyFRP.js} +42 -42
- package/dist/apps/web/dist/assets/index-ClPR-tfN.css +1 -0
- package/dist/apps/web/dist/index.html +2 -2
- package/dist/bin.mjs +1 -1
- package/dist/{cli-CiFOqMwS.mjs → cli-CMPmuY7W.mjs} +3 -3
- package/dist/index.d.mts +138 -93
- package/dist/index.mjs +4 -4
- package/dist/runChild.mjs +1 -1
- package/dist/{runOrchestration-CO3Vf0cQ.mjs → runOrchestration-CAyVXPFz.mjs} +34 -3
- package/dist/{runner-CXHkf7ih.mjs → runner-Bnm1nz0U.mjs} +2 -2
- package/dist/{runner-4pF_Qrc9.mjs → runner-CmpWwCe1.mjs} +1 -1
- package/dist/src-gZm9nyTp.mjs +3 -0
- package/package.json +1 -1
- package/skills/agent-eval/SKILL.md +4 -3
- package/dist/apps/web/dist/assets/index-DjUTm3M-.css +0 -1
- package/dist/src-BiPLv9ya.mjs +0 -3
package/dist/index.d.mts
CHANGED
|
@@ -754,6 +754,7 @@ type ResolvedLlmCallsConfig$1 = {
|
|
|
754
754
|
derivedAttributes: ResolvedCallDerivedAttribute$1[];
|
|
755
755
|
metrics: ResolvedLlmCallMetric$1[];
|
|
756
756
|
pricing: ResolvedLlmCallPricing$1[];
|
|
757
|
+
costCurrencies: ResolvedLlmCallCostCurrency$1[];
|
|
757
758
|
};
|
|
758
759
|
/** Resolved API-calls config sent to the UI with all defaults applied. */
|
|
759
760
|
type ResolvedApiCallsConfig$1 = {
|
|
@@ -801,6 +802,13 @@ type ResolvedLlmCallPricing$1 = {
|
|
|
801
802
|
cacheCreationInputUsdPerMillion?: number;
|
|
802
803
|
cacheCreationInput1hUsdPerMillion?: number;
|
|
803
804
|
reasoningUsdPerMillion?: number;
|
|
805
|
+
};
|
|
806
|
+
/** Fully-resolved extra currency used by the LLM calls tab. */
|
|
807
|
+
type ResolvedLlmCallCostCurrency$1 = {
|
|
808
|
+
code: string;
|
|
809
|
+
label?: string;
|
|
810
|
+
usdToCurrencyRate: number;
|
|
811
|
+
numberFormat?: NumberDisplayOptions$2;
|
|
804
812
|
}; //#endregion
|
|
805
813
|
//#region ../shared/src/schemas/cache.d.ts
|
|
806
814
|
/** Summary of a single persisted cache entry, used by list/delete endpoints. */
|
|
@@ -2900,13 +2908,13 @@ type ColumnKind = z$1.infer<typeof columnKindSchema>;
|
|
|
2900
2908
|
declare const columnFormatSchema: z$1.ZodEnum<{
|
|
2901
2909
|
number: "number";
|
|
2902
2910
|
boolean: "boolean";
|
|
2911
|
+
duration: "duration";
|
|
2912
|
+
json: "json";
|
|
2903
2913
|
file: "file";
|
|
2904
2914
|
markdown: "markdown";
|
|
2905
|
-
json: "json";
|
|
2906
2915
|
image: "image";
|
|
2907
2916
|
audio: "audio";
|
|
2908
2917
|
video: "video";
|
|
2909
|
-
duration: "duration";
|
|
2910
2918
|
percent: "percent";
|
|
2911
2919
|
passFail: "passFail";
|
|
2912
2920
|
stars: "stars";
|
|
@@ -2925,13 +2933,13 @@ declare const columnDefSchema: z$1.ZodObject<{
|
|
|
2925
2933
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
2926
2934
|
number: "number";
|
|
2927
2935
|
boolean: "boolean";
|
|
2936
|
+
duration: "duration";
|
|
2937
|
+
json: "json";
|
|
2928
2938
|
file: "file";
|
|
2929
2939
|
markdown: "markdown";
|
|
2930
|
-
json: "json";
|
|
2931
2940
|
image: "image";
|
|
2932
2941
|
audio: "audio";
|
|
2933
2942
|
video: "video";
|
|
2934
|
-
duration: "duration";
|
|
2935
2943
|
percent: "percent";
|
|
2936
2944
|
passFail: "passFail";
|
|
2937
2945
|
stars: "stars";
|
|
@@ -2976,8 +2984,8 @@ declare const traceSpanKindSchema: z$1.ZodString;
|
|
|
2976
2984
|
declare const traceAttributeDisplayFormatSchema: z$1.ZodEnum<{
|
|
2977
2985
|
string: "string";
|
|
2978
2986
|
number: "number";
|
|
2979
|
-
json: "json";
|
|
2980
2987
|
duration: "duration";
|
|
2988
|
+
json: "json";
|
|
2981
2989
|
}>;
|
|
2982
2990
|
/**
|
|
2983
2991
|
* Formatting hint for trace attribute values rendered by the UI.
|
|
@@ -3001,8 +3009,8 @@ declare const traceAttributeDisplaySchema: z$1.ZodObject<{
|
|
|
3001
3009
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3002
3010
|
string: "string";
|
|
3003
3011
|
number: "number";
|
|
3004
|
-
json: "json";
|
|
3005
3012
|
duration: "duration";
|
|
3013
|
+
json: "json";
|
|
3006
3014
|
}>>;
|
|
3007
3015
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3008
3016
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3037,8 +3045,8 @@ declare const traceDisplayConfigSchema: z$1.ZodObject<{
|
|
|
3037
3045
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3038
3046
|
string: "string";
|
|
3039
3047
|
number: "number";
|
|
3040
|
-
json: "json";
|
|
3041
3048
|
duration: "duration";
|
|
3049
|
+
json: "json";
|
|
3042
3050
|
}>>;
|
|
3043
3051
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3044
3052
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3077,8 +3085,8 @@ declare const traceAttributeDisplayInputSchema: z$1.ZodObject<{
|
|
|
3077
3085
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3078
3086
|
string: "string";
|
|
3079
3087
|
number: "number";
|
|
3080
|
-
json: "json";
|
|
3081
3088
|
duration: "duration";
|
|
3089
|
+
json: "json";
|
|
3082
3090
|
}>>;
|
|
3083
3091
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3084
3092
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3115,8 +3123,8 @@ declare const traceDisplayInputConfigSchema: z$1.ZodObject<{
|
|
|
3115
3123
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3116
3124
|
string: "string";
|
|
3117
3125
|
number: "number";
|
|
3118
|
-
json: "json";
|
|
3119
3126
|
duration: "duration";
|
|
3127
|
+
json: "json";
|
|
3120
3128
|
}>>;
|
|
3121
3129
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3122
3130
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3168,8 +3176,8 @@ declare const traceSpanSchema: z$1.ZodObject<{
|
|
|
3168
3176
|
status: z$1.ZodEnum<{
|
|
3169
3177
|
error: "error";
|
|
3170
3178
|
running: "running";
|
|
3171
|
-
cancelled: "cancelled";
|
|
3172
3179
|
ok: "ok";
|
|
3180
|
+
cancelled: "cancelled";
|
|
3173
3181
|
}>;
|
|
3174
3182
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3175
3183
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3212,9 +3220,9 @@ type EvalFreshnessStatus = z$1.infer<typeof evalFreshnessStatusSchema>;
|
|
|
3212
3220
|
declare const evalStatAggregateSchema: z$1.ZodEnum<{
|
|
3213
3221
|
last: "last";
|
|
3214
3222
|
sum: "sum";
|
|
3223
|
+
avg: "avg";
|
|
3215
3224
|
min: "min";
|
|
3216
3225
|
max: "max";
|
|
3217
|
-
avg: "avg";
|
|
3218
3226
|
}>;
|
|
3219
3227
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3220
3228
|
type EvalStatAggregate = z$1.infer<typeof evalStatAggregateSchema>;
|
|
@@ -3240,20 +3248,20 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
3240
3248
|
aggregate: z$1.ZodEnum<{
|
|
3241
3249
|
last: "last";
|
|
3242
3250
|
sum: "sum";
|
|
3251
|
+
avg: "avg";
|
|
3243
3252
|
min: "min";
|
|
3244
3253
|
max: "max";
|
|
3245
|
-
avg: "avg";
|
|
3246
3254
|
}>;
|
|
3247
3255
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3248
3256
|
number: "number";
|
|
3249
3257
|
boolean: "boolean";
|
|
3258
|
+
duration: "duration";
|
|
3259
|
+
json: "json";
|
|
3250
3260
|
file: "file";
|
|
3251
3261
|
markdown: "markdown";
|
|
3252
|
-
json: "json";
|
|
3253
3262
|
image: "image";
|
|
3254
3263
|
audio: "audio";
|
|
3255
3264
|
video: "video";
|
|
3256
|
-
duration: "duration";
|
|
3257
3265
|
percent: "percent";
|
|
3258
3266
|
passFail: "passFail";
|
|
3259
3267
|
stars: "stars";
|
|
@@ -3282,20 +3290,20 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
|
|
|
3282
3290
|
aggregate: z$1.ZodEnum<{
|
|
3283
3291
|
last: "last";
|
|
3284
3292
|
sum: "sum";
|
|
3293
|
+
avg: "avg";
|
|
3285
3294
|
min: "min";
|
|
3286
3295
|
max: "max";
|
|
3287
|
-
avg: "avg";
|
|
3288
3296
|
}>;
|
|
3289
3297
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3290
3298
|
number: "number";
|
|
3291
3299
|
boolean: "boolean";
|
|
3300
|
+
duration: "duration";
|
|
3301
|
+
json: "json";
|
|
3292
3302
|
file: "file";
|
|
3293
3303
|
markdown: "markdown";
|
|
3294
|
-
json: "json";
|
|
3295
3304
|
image: "image";
|
|
3296
3305
|
audio: "audio";
|
|
3297
3306
|
video: "video";
|
|
3298
|
-
duration: "duration";
|
|
3299
3307
|
percent: "percent";
|
|
3300
3308
|
passFail: "passFail";
|
|
3301
3309
|
stars: "stars";
|
|
@@ -3332,13 +3340,13 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3332
3340
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3333
3341
|
number: "number";
|
|
3334
3342
|
boolean: "boolean";
|
|
3343
|
+
duration: "duration";
|
|
3344
|
+
json: "json";
|
|
3335
3345
|
file: "file";
|
|
3336
3346
|
markdown: "markdown";
|
|
3337
|
-
json: "json";
|
|
3338
3347
|
image: "image";
|
|
3339
3348
|
audio: "audio";
|
|
3340
3349
|
video: "video";
|
|
3341
|
-
duration: "duration";
|
|
3342
3350
|
percent: "percent";
|
|
3343
3351
|
passFail: "passFail";
|
|
3344
3352
|
stars: "stars";
|
|
@@ -3383,20 +3391,20 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3383
3391
|
aggregate: z$1.ZodEnum<{
|
|
3384
3392
|
last: "last";
|
|
3385
3393
|
sum: "sum";
|
|
3394
|
+
avg: "avg";
|
|
3386
3395
|
min: "min";
|
|
3387
3396
|
max: "max";
|
|
3388
|
-
avg: "avg";
|
|
3389
3397
|
}>;
|
|
3390
3398
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3391
3399
|
number: "number";
|
|
3392
3400
|
boolean: "boolean";
|
|
3401
|
+
duration: "duration";
|
|
3402
|
+
json: "json";
|
|
3393
3403
|
file: "file";
|
|
3394
3404
|
markdown: "markdown";
|
|
3395
|
-
json: "json";
|
|
3396
3405
|
image: "image";
|
|
3397
3406
|
audio: "audio";
|
|
3398
3407
|
video: "video";
|
|
3399
|
-
duration: "duration";
|
|
3400
3408
|
percent: "percent";
|
|
3401
3409
|
passFail: "passFail";
|
|
3402
3410
|
stars: "stars";
|
|
@@ -3416,13 +3424,13 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3416
3424
|
metrics: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
3417
3425
|
source: z$1.ZodLiteral<"builtin">;
|
|
3418
3426
|
metric: z$1.ZodEnum<{
|
|
3419
|
-
durationMs: "durationMs";
|
|
3420
3427
|
passRate: "passRate";
|
|
3428
|
+
durationMs: "durationMs";
|
|
3421
3429
|
}>;
|
|
3422
3430
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3423
3431
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3424
|
-
success: "success";
|
|
3425
3432
|
error: "error";
|
|
3433
|
+
success: "success";
|
|
3426
3434
|
warning: "warning";
|
|
3427
3435
|
accent: "accent";
|
|
3428
3436
|
accentDim: "accentDim";
|
|
@@ -3437,16 +3445,16 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3437
3445
|
key: z$1.ZodString;
|
|
3438
3446
|
aggregate: z$1.ZodEnum<{
|
|
3439
3447
|
sum: "sum";
|
|
3448
|
+
avg: "avg";
|
|
3440
3449
|
min: "min";
|
|
3441
3450
|
max: "max";
|
|
3442
|
-
avg: "avg";
|
|
3443
3451
|
latest: "latest";
|
|
3444
3452
|
passThresholdRate: "passThresholdRate";
|
|
3445
3453
|
}>;
|
|
3446
3454
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3447
3455
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3448
|
-
success: "success";
|
|
3449
3456
|
error: "error";
|
|
3457
|
+
success: "success";
|
|
3450
3458
|
warning: "warning";
|
|
3451
3459
|
accent: "accent";
|
|
3452
3460
|
accentDim: "accentDim";
|
|
@@ -3470,8 +3478,8 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3470
3478
|
tooltipExtras: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
3471
3479
|
source: z$1.ZodLiteral<"builtin">;
|
|
3472
3480
|
metric: z$1.ZodEnum<{
|
|
3473
|
-
durationMs: "durationMs";
|
|
3474
3481
|
passRate: "passRate";
|
|
3482
|
+
durationMs: "durationMs";
|
|
3475
3483
|
}>;
|
|
3476
3484
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3477
3485
|
}, z$1.core.$strip>, z$1.ZodObject<{
|
|
@@ -3479,9 +3487,9 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3479
3487
|
key: z$1.ZodString;
|
|
3480
3488
|
aggregate: z$1.ZodEnum<{
|
|
3481
3489
|
sum: "sum";
|
|
3490
|
+
avg: "avg";
|
|
3482
3491
|
min: "min";
|
|
3483
3492
|
max: "max";
|
|
3484
|
-
avg: "avg";
|
|
3485
3493
|
latest: "latest";
|
|
3486
3494
|
passThresholdRate: "passThresholdRate";
|
|
3487
3495
|
}>;
|
|
@@ -3577,11 +3585,11 @@ declare const caseRowSchema: z$1.ZodObject<{
|
|
|
3577
3585
|
evalId: z$1.ZodString;
|
|
3578
3586
|
status: z$1.ZodEnum<{
|
|
3579
3587
|
error: "error";
|
|
3580
|
-
pending: "pending";
|
|
3581
3588
|
running: "running";
|
|
3582
3589
|
cancelled: "cancelled";
|
|
3583
3590
|
pass: "pass";
|
|
3584
3591
|
fail: "fail";
|
|
3592
|
+
pending: "pending";
|
|
3585
3593
|
}>;
|
|
3586
3594
|
durationMs: z$1.ZodNullable<z$1.ZodNumber>;
|
|
3587
3595
|
costUsd: z$1.ZodOptional<z$1.ZodNullable<z$1.ZodNumber>>;
|
|
@@ -3673,8 +3681,8 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3673
3681
|
status: z$1.ZodEnum<{
|
|
3674
3682
|
error: "error";
|
|
3675
3683
|
running: "running";
|
|
3676
|
-
cancelled: "cancelled";
|
|
3677
3684
|
ok: "ok";
|
|
3685
|
+
cancelled: "cancelled";
|
|
3678
3686
|
}>;
|
|
3679
3687
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3680
3688
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3710,8 +3718,8 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3710
3718
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3711
3719
|
string: "string";
|
|
3712
3720
|
number: "number";
|
|
3713
|
-
json: "json";
|
|
3714
3721
|
duration: "duration";
|
|
3722
|
+
json: "json";
|
|
3715
3723
|
}>>;
|
|
3716
3724
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3717
3725
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3741,11 +3749,11 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3741
3749
|
evalId: z$1.ZodString;
|
|
3742
3750
|
status: z$1.ZodEnum<{
|
|
3743
3751
|
error: "error";
|
|
3744
|
-
pending: "pending";
|
|
3745
3752
|
running: "running";
|
|
3746
3753
|
cancelled: "cancelled";
|
|
3747
3754
|
pass: "pass";
|
|
3748
3755
|
fail: "fail";
|
|
3756
|
+
pending: "pending";
|
|
3749
3757
|
}>;
|
|
3750
3758
|
input: z$1.ZodUnknown;
|
|
3751
3759
|
trace: z$1.ZodArray<z$1.ZodObject<{
|
|
@@ -3759,8 +3767,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3759
3767
|
status: z$1.ZodEnum<{
|
|
3760
3768
|
error: "error";
|
|
3761
3769
|
running: "running";
|
|
3762
|
-
cancelled: "cancelled";
|
|
3763
3770
|
ok: "ok";
|
|
3771
|
+
cancelled: "cancelled";
|
|
3764
3772
|
}>;
|
|
3765
3773
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3766
3774
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3796,8 +3804,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3796
3804
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3797
3805
|
string: "string";
|
|
3798
3806
|
number: "number";
|
|
3799
|
-
json: "json";
|
|
3800
3807
|
duration: "duration";
|
|
3808
|
+
json: "json";
|
|
3801
3809
|
}>>;
|
|
3802
3810
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3803
3811
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3828,8 +3836,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3828
3836
|
status: z$1.ZodEnum<{
|
|
3829
3837
|
error: "error";
|
|
3830
3838
|
running: "running";
|
|
3831
|
-
cancelled: "cancelled";
|
|
3832
3839
|
ok: "ok";
|
|
3840
|
+
cancelled: "cancelled";
|
|
3833
3841
|
}>;
|
|
3834
3842
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3835
3843
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3865,8 +3873,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3865
3873
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3866
3874
|
string: "string";
|
|
3867
3875
|
number: "number";
|
|
3868
|
-
json: "json";
|
|
3869
3876
|
duration: "duration";
|
|
3877
|
+
json: "json";
|
|
3870
3878
|
}>>;
|
|
3871
3879
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3872
3880
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3941,10 +3949,10 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3941
3949
|
namespace: z$1.ZodString;
|
|
3942
3950
|
key: z$1.ZodString;
|
|
3943
3951
|
status: z$1.ZodEnum<{
|
|
3944
|
-
bypass: "bypass";
|
|
3945
|
-
refresh: "refresh";
|
|
3946
3952
|
hit: "hit";
|
|
3947
3953
|
miss: "miss";
|
|
3954
|
+
refresh: "refresh";
|
|
3955
|
+
bypass: "bypass";
|
|
3948
3956
|
}>;
|
|
3949
3957
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
3950
3958
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -4005,8 +4013,8 @@ type EvalChartType = z$1.infer<typeof evalChartTypeSchema>;
|
|
|
4005
4013
|
* than from a per-case column.
|
|
4006
4014
|
*/
|
|
4007
4015
|
declare const evalChartBuiltinMetricSchema: z$1.ZodEnum<{
|
|
4008
|
-
durationMs: "durationMs";
|
|
4009
4016
|
passRate: "passRate";
|
|
4017
|
+
durationMs: "durationMs";
|
|
4010
4018
|
}>;
|
|
4011
4019
|
/**
|
|
4012
4020
|
* Run-level metric sourced from the aggregated `RunSummary` for a run, rather
|
|
@@ -4016,9 +4024,9 @@ type EvalChartBuiltinMetric = z$1.infer<typeof evalChartBuiltinMetricSchema>;
|
|
|
4016
4024
|
/** Reducer applied to a numeric column across all cases of a single run. */
|
|
4017
4025
|
declare const evalChartAggregateSchema: z$1.ZodEnum<{
|
|
4018
4026
|
sum: "sum";
|
|
4027
|
+
avg: "avg";
|
|
4019
4028
|
min: "min";
|
|
4020
4029
|
max: "max";
|
|
4021
|
-
avg: "avg";
|
|
4022
4030
|
latest: "latest";
|
|
4023
4031
|
passThresholdRate: "passThresholdRate";
|
|
4024
4032
|
}>;
|
|
@@ -4029,8 +4037,8 @@ type EvalChartAggregate = z$1.infer<typeof evalChartAggregateSchema>;
|
|
|
4029
4037
|
* not emit raw hex so authored evals stay decoupled from the web theme.
|
|
4030
4038
|
*/
|
|
4031
4039
|
declare const evalChartColorSchema: z$1.ZodEnum<{
|
|
4032
|
-
success: "success";
|
|
4033
4040
|
error: "error";
|
|
4041
|
+
success: "success";
|
|
4034
4042
|
warning: "warning";
|
|
4035
4043
|
accent: "accent";
|
|
4036
4044
|
accentDim: "accentDim";
|
|
@@ -4053,13 +4061,13 @@ type EvalChartAxis = z$1.infer<typeof evalChartAxisSchema>;
|
|
|
4053
4061
|
declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
4054
4062
|
source: z$1.ZodLiteral<"builtin">;
|
|
4055
4063
|
metric: z$1.ZodEnum<{
|
|
4056
|
-
durationMs: "durationMs";
|
|
4057
4064
|
passRate: "passRate";
|
|
4065
|
+
durationMs: "durationMs";
|
|
4058
4066
|
}>;
|
|
4059
4067
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4060
4068
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4061
|
-
success: "success";
|
|
4062
4069
|
error: "error";
|
|
4070
|
+
success: "success";
|
|
4063
4071
|
warning: "warning";
|
|
4064
4072
|
accent: "accent";
|
|
4065
4073
|
accentDim: "accentDim";
|
|
@@ -4074,16 +4082,16 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4074
4082
|
key: z$1.ZodString;
|
|
4075
4083
|
aggregate: z$1.ZodEnum<{
|
|
4076
4084
|
sum: "sum";
|
|
4085
|
+
avg: "avg";
|
|
4077
4086
|
min: "min";
|
|
4078
4087
|
max: "max";
|
|
4079
|
-
avg: "avg";
|
|
4080
4088
|
latest: "latest";
|
|
4081
4089
|
passThresholdRate: "passThresholdRate";
|
|
4082
4090
|
}>;
|
|
4083
4091
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4084
4092
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4085
|
-
success: "success";
|
|
4086
4093
|
error: "error";
|
|
4094
|
+
success: "success";
|
|
4087
4095
|
warning: "warning";
|
|
4088
4096
|
accent: "accent";
|
|
4089
4097
|
accentDim: "accentDim";
|
|
@@ -4100,8 +4108,8 @@ type EvalChartMetric = z$1.infer<typeof evalChartMetricSchema>;
|
|
|
4100
4108
|
declare const evalChartTooltipExtraSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
4101
4109
|
source: z$1.ZodLiteral<"builtin">;
|
|
4102
4110
|
metric: z$1.ZodEnum<{
|
|
4103
|
-
durationMs: "durationMs";
|
|
4104
4111
|
passRate: "passRate";
|
|
4112
|
+
durationMs: "durationMs";
|
|
4105
4113
|
}>;
|
|
4106
4114
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4107
4115
|
}, z$1.core.$strip>, z$1.ZodObject<{
|
|
@@ -4109,9 +4117,9 @@ declare const evalChartTooltipExtraSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObj
|
|
|
4109
4117
|
key: z$1.ZodString;
|
|
4110
4118
|
aggregate: z$1.ZodEnum<{
|
|
4111
4119
|
sum: "sum";
|
|
4120
|
+
avg: "avg";
|
|
4112
4121
|
min: "min";
|
|
4113
4122
|
max: "max";
|
|
4114
|
-
avg: "avg";
|
|
4115
4123
|
latest: "latest";
|
|
4116
4124
|
passThresholdRate: "passThresholdRate";
|
|
4117
4125
|
}>;
|
|
@@ -4136,13 +4144,13 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4136
4144
|
metrics: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
4137
4145
|
source: z$1.ZodLiteral<"builtin">;
|
|
4138
4146
|
metric: z$1.ZodEnum<{
|
|
4139
|
-
durationMs: "durationMs";
|
|
4140
4147
|
passRate: "passRate";
|
|
4148
|
+
durationMs: "durationMs";
|
|
4141
4149
|
}>;
|
|
4142
4150
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4143
4151
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4144
|
-
success: "success";
|
|
4145
4152
|
error: "error";
|
|
4153
|
+
success: "success";
|
|
4146
4154
|
warning: "warning";
|
|
4147
4155
|
accent: "accent";
|
|
4148
4156
|
accentDim: "accentDim";
|
|
@@ -4157,16 +4165,16 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4157
4165
|
key: z$1.ZodString;
|
|
4158
4166
|
aggregate: z$1.ZodEnum<{
|
|
4159
4167
|
sum: "sum";
|
|
4168
|
+
avg: "avg";
|
|
4160
4169
|
min: "min";
|
|
4161
4170
|
max: "max";
|
|
4162
|
-
avg: "avg";
|
|
4163
4171
|
latest: "latest";
|
|
4164
4172
|
passThresholdRate: "passThresholdRate";
|
|
4165
4173
|
}>;
|
|
4166
4174
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4167
4175
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4168
|
-
success: "success";
|
|
4169
4176
|
error: "error";
|
|
4177
|
+
success: "success";
|
|
4170
4178
|
warning: "warning";
|
|
4171
4179
|
accent: "accent";
|
|
4172
4180
|
accentDim: "accentDim";
|
|
@@ -4190,8 +4198,8 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4190
4198
|
tooltipExtras: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
4191
4199
|
source: z$1.ZodLiteral<"builtin">;
|
|
4192
4200
|
metric: z$1.ZodEnum<{
|
|
4193
|
-
durationMs: "durationMs";
|
|
4194
4201
|
passRate: "passRate";
|
|
4202
|
+
durationMs: "durationMs";
|
|
4195
4203
|
}>;
|
|
4196
4204
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4197
4205
|
}, z$1.core.$strip>, z$1.ZodObject<{
|
|
@@ -4199,9 +4207,9 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4199
4207
|
key: z$1.ZodString;
|
|
4200
4208
|
aggregate: z$1.ZodEnum<{
|
|
4201
4209
|
sum: "sum";
|
|
4210
|
+
avg: "avg";
|
|
4202
4211
|
min: "min";
|
|
4203
4212
|
max: "max";
|
|
4204
|
-
avg: "avg";
|
|
4205
4213
|
latest: "latest";
|
|
4206
4214
|
passThresholdRate: "passThresholdRate";
|
|
4207
4215
|
}>;
|
|
@@ -4226,13 +4234,13 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4226
4234
|
metrics: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
4227
4235
|
source: z$1.ZodLiteral<"builtin">;
|
|
4228
4236
|
metric: z$1.ZodEnum<{
|
|
4229
|
-
durationMs: "durationMs";
|
|
4230
4237
|
passRate: "passRate";
|
|
4238
|
+
durationMs: "durationMs";
|
|
4231
4239
|
}>;
|
|
4232
4240
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4233
4241
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4234
|
-
success: "success";
|
|
4235
4242
|
error: "error";
|
|
4243
|
+
success: "success";
|
|
4236
4244
|
warning: "warning";
|
|
4237
4245
|
accent: "accent";
|
|
4238
4246
|
accentDim: "accentDim";
|
|
@@ -4247,16 +4255,16 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4247
4255
|
key: z$1.ZodString;
|
|
4248
4256
|
aggregate: z$1.ZodEnum<{
|
|
4249
4257
|
sum: "sum";
|
|
4258
|
+
avg: "avg";
|
|
4250
4259
|
min: "min";
|
|
4251
4260
|
max: "max";
|
|
4252
|
-
avg: "avg";
|
|
4253
4261
|
latest: "latest";
|
|
4254
4262
|
passThresholdRate: "passThresholdRate";
|
|
4255
4263
|
}>;
|
|
4256
4264
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4257
4265
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4258
|
-
success: "success";
|
|
4259
4266
|
error: "error";
|
|
4267
|
+
success: "success";
|
|
4260
4268
|
warning: "warning";
|
|
4261
4269
|
accent: "accent";
|
|
4262
4270
|
accentDim: "accentDim";
|
|
@@ -4280,8 +4288,8 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4280
4288
|
tooltipExtras: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
4281
4289
|
source: z$1.ZodLiteral<"builtin">;
|
|
4282
4290
|
metric: z$1.ZodEnum<{
|
|
4283
|
-
durationMs: "durationMs";
|
|
4284
4291
|
passRate: "passRate";
|
|
4292
|
+
durationMs: "durationMs";
|
|
4285
4293
|
}>;
|
|
4286
4294
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4287
4295
|
}, z$1.core.$strip>, z$1.ZodObject<{
|
|
@@ -4289,9 +4297,9 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4289
4297
|
key: z$1.ZodString;
|
|
4290
4298
|
aggregate: z$1.ZodEnum<{
|
|
4291
4299
|
sum: "sum";
|
|
4300
|
+
avg: "avg";
|
|
4292
4301
|
min: "min";
|
|
4293
4302
|
max: "max";
|
|
4294
|
-
avg: "avg";
|
|
4295
4303
|
latest: "latest";
|
|
4296
4304
|
passThresholdRate: "passThresholdRate";
|
|
4297
4305
|
}>;
|
|
@@ -4307,10 +4315,10 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4307
4315
|
shortId: z$1.ZodString;
|
|
4308
4316
|
status: z$1.ZodEnum<{
|
|
4309
4317
|
error: "error";
|
|
4310
|
-
pending: "pending";
|
|
4311
4318
|
running: "running";
|
|
4312
|
-
completed: "completed";
|
|
4313
4319
|
cancelled: "cancelled";
|
|
4320
|
+
pending: "pending";
|
|
4321
|
+
completed: "completed";
|
|
4314
4322
|
}>;
|
|
4315
4323
|
startedAt: z$1.ZodString;
|
|
4316
4324
|
endedAt: z$1.ZodNullable<z$1.ZodString>;
|
|
@@ -4333,9 +4341,9 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4333
4341
|
median: "median";
|
|
4334
4342
|
}>>>;
|
|
4335
4343
|
cacheMode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4336
|
-
use: "use";
|
|
4337
|
-
bypass: "bypass";
|
|
4338
4344
|
refresh: "refresh";
|
|
4345
|
+
bypass: "bypass";
|
|
4346
|
+
use: "use";
|
|
4339
4347
|
}>>;
|
|
4340
4348
|
}, z$1.core.$strip>;
|
|
4341
4349
|
/** Persisted lifecycle metadata for a single eval run. */
|
|
@@ -4345,10 +4353,10 @@ declare const runSummarySchema: z$1.ZodObject<{
|
|
|
4345
4353
|
runId: z$1.ZodString;
|
|
4346
4354
|
status: z$1.ZodEnum<{
|
|
4347
4355
|
error: "error";
|
|
4348
|
-
pending: "pending";
|
|
4349
4356
|
running: "running";
|
|
4350
|
-
completed: "completed";
|
|
4351
4357
|
cancelled: "cancelled";
|
|
4358
|
+
pending: "pending";
|
|
4359
|
+
completed: "completed";
|
|
4352
4360
|
}>;
|
|
4353
4361
|
totalCases: z$1.ZodNumber;
|
|
4354
4362
|
passedCases: z$1.ZodNumber;
|
|
@@ -4458,8 +4466,8 @@ declare const trialSelectionModeSchema: z$1.ZodEnum<{
|
|
|
4458
4466
|
type TrialSelectionMode = z$1.infer<typeof trialSelectionModeSchema>;
|
|
4459
4467
|
/** Built-in eval-level output/column keys. */
|
|
4460
4468
|
declare const defaultConfigKeySchema: z$1.ZodEnum<{
|
|
4461
|
-
apiCalls: "apiCalls";
|
|
4462
4469
|
costUsd: "costUsd";
|
|
4470
|
+
apiCalls: "apiCalls";
|
|
4463
4471
|
llmTurns: "llmTurns";
|
|
4464
4472
|
inputTokens: "inputTokens";
|
|
4465
4473
|
outputTokens: "outputTokens";
|
|
@@ -4472,8 +4480,8 @@ declare const defaultConfigKeySchema: z$1.ZodEnum<{
|
|
|
4472
4480
|
/** Built-in eval-level output/column key. */
|
|
4473
4481
|
/** Removal config for built-in eval-level outputs and UI metadata. */
|
|
4474
4482
|
declare const removeDefaultConfigSchema: z$1.ZodUnion<readonly [z$1.ZodLiteral<true>, z$1.ZodArray<z$1.ZodEnum<{
|
|
4475
|
-
apiCalls: "apiCalls";
|
|
4476
4483
|
costUsd: "costUsd";
|
|
4484
|
+
apiCalls: "apiCalls";
|
|
4477
4485
|
llmTurns: "llmTurns";
|
|
4478
4486
|
inputTokens: "inputTokens";
|
|
4479
4487
|
outputTokens: "outputTokens";
|
|
@@ -4566,8 +4574,8 @@ declare const llmCallMetricFormatSchema: z$1.ZodEnum<{
|
|
|
4566
4574
|
string: "string";
|
|
4567
4575
|
number: "number";
|
|
4568
4576
|
boolean: "boolean";
|
|
4569
|
-
json: "json";
|
|
4570
4577
|
duration: "duration";
|
|
4578
|
+
json: "json";
|
|
4571
4579
|
}>;
|
|
4572
4580
|
/** Render format applied to an LLM-call metric value. */
|
|
4573
4581
|
type LlmCallMetricFormat = z$1.infer<typeof llmCallMetricFormatSchema>;
|
|
@@ -4576,8 +4584,8 @@ declare const apiCallMetricFormatSchema: z$1.ZodEnum<{
|
|
|
4576
4584
|
string: "string";
|
|
4577
4585
|
number: "number";
|
|
4578
4586
|
boolean: "boolean";
|
|
4579
|
-
json: "json";
|
|
4580
4587
|
duration: "duration";
|
|
4588
|
+
json: "json";
|
|
4581
4589
|
}>;
|
|
4582
4590
|
/** Render format applied to an API-call metric value. */
|
|
4583
4591
|
type ApiCallMetricFormat = z$1.infer<typeof apiCallMetricFormatSchema>;
|
|
@@ -4646,8 +4654,8 @@ declare const llmCallMetricSchema: z$1.ZodObject<{
|
|
|
4646
4654
|
string: "string";
|
|
4647
4655
|
number: "number";
|
|
4648
4656
|
boolean: "boolean";
|
|
4649
|
-
json: "json";
|
|
4650
4657
|
duration: "duration";
|
|
4658
|
+
json: "json";
|
|
4651
4659
|
}>>;
|
|
4652
4660
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4653
4661
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4675,8 +4683,8 @@ declare const apiCallMetricSchema: z$1.ZodObject<{
|
|
|
4675
4683
|
string: "string";
|
|
4676
4684
|
number: "number";
|
|
4677
4685
|
boolean: "boolean";
|
|
4678
|
-
json: "json";
|
|
4679
4686
|
duration: "duration";
|
|
4687
|
+
json: "json";
|
|
4680
4688
|
}>>;
|
|
4681
4689
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4682
4690
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4725,6 +4733,18 @@ declare const llmCallPricingSchema: z$1.ZodObject<{
|
|
|
4725
4733
|
type LlmCallPricing = z$1.infer<typeof llmCallPricingSchema>;
|
|
4726
4734
|
/** Model-keyed pricing registry authored in `agent-evals.config.ts`. */
|
|
4727
4735
|
type LlmCallPricingRegistry = Record<string, LlmCallPricing>;
|
|
4736
|
+
/**
|
|
4737
|
+
* Schema for extra currencies displayed in the LLM calls breakdown table.
|
|
4738
|
+
* Costs are still derived in USD, then multiplied by `usdToCurrencyRate`.
|
|
4739
|
+
*/
|
|
4740
|
+
declare const llmCallCostCurrencySchema: z$1.ZodObject<{
|
|
4741
|
+
code: z$1.ZodString;
|
|
4742
|
+
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4743
|
+
usdToCurrencyRate: z$1.ZodNumber;
|
|
4744
|
+
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4745
|
+
}, z$1.core.$strip>;
|
|
4746
|
+
/** Extra LLM-call cost currency authored in `agent-evals.config.ts`. */
|
|
4747
|
+
type LlmCallCostCurrency = z$1.infer<typeof llmCallCostCurrencySchema>;
|
|
4728
4748
|
/** Schema for the global LLM calls config block in `agent-evals.config.ts`. */
|
|
4729
4749
|
declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
4730
4750
|
kinds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
@@ -4763,6 +4783,12 @@ declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
|
4763
4783
|
reasoningUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
4764
4784
|
}, z$1.core.$strip>>>;
|
|
4765
4785
|
}, z$1.core.$strip>>>;
|
|
4786
|
+
costCurrencies: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
4787
|
+
code: z$1.ZodString;
|
|
4788
|
+
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4789
|
+
usdToCurrencyRate: z$1.ZodNumber;
|
|
4790
|
+
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4791
|
+
}, z$1.core.$strip>>>;
|
|
4766
4792
|
metrics: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
4767
4793
|
label: z$1.ZodString;
|
|
4768
4794
|
tooltip: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -4771,8 +4797,8 @@ declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
|
4771
4797
|
string: "string";
|
|
4772
4798
|
number: "number";
|
|
4773
4799
|
boolean: "boolean";
|
|
4774
|
-
json: "json";
|
|
4775
4800
|
duration: "duration";
|
|
4801
|
+
json: "json";
|
|
4776
4802
|
}>>;
|
|
4777
4803
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4778
4804
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4807,8 +4833,8 @@ declare const apiCallsConfigSchema: z$1.ZodObject<{
|
|
|
4807
4833
|
string: "string";
|
|
4808
4834
|
number: "number";
|
|
4809
4835
|
boolean: "boolean";
|
|
4810
|
-
json: "json";
|
|
4811
4836
|
duration: "duration";
|
|
4837
|
+
json: "json";
|
|
4812
4838
|
}>>;
|
|
4813
4839
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4814
4840
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4848,6 +4874,7 @@ type ResolvedLlmCallsConfig = {
|
|
|
4848
4874
|
derivedAttributes: ResolvedCallDerivedAttribute[];
|
|
4849
4875
|
metrics: ResolvedLlmCallMetric[];
|
|
4850
4876
|
pricing: ResolvedLlmCallPricing[];
|
|
4877
|
+
costCurrencies: ResolvedLlmCallCostCurrency[];
|
|
4851
4878
|
};
|
|
4852
4879
|
/** Resolved API-calls config sent to the UI with all defaults applied. */
|
|
4853
4880
|
type ResolvedApiCallsConfig = {
|
|
@@ -4896,6 +4923,13 @@ type ResolvedLlmCallPricing = {
|
|
|
4896
4923
|
cacheCreationInput1hUsdPerMillion?: number;
|
|
4897
4924
|
reasoningUsdPerMillion?: number;
|
|
4898
4925
|
};
|
|
4926
|
+
/** Fully-resolved extra currency used by the LLM calls tab. */
|
|
4927
|
+
type ResolvedLlmCallCostCurrency = {
|
|
4928
|
+
code: string;
|
|
4929
|
+
label?: string;
|
|
4930
|
+
usdToCurrencyRate: number;
|
|
4931
|
+
numberFormat?: NumberDisplayOptions;
|
|
4932
|
+
};
|
|
4899
4933
|
/** Default LLM-calls config the UI uses before the workspace fetch resolves. */
|
|
4900
4934
|
declare const DEFAULT_LLM_CALLS_CONFIG: ResolvedLlmCallsConfig;
|
|
4901
4935
|
/** Default API-calls config the UI uses before the workspace fetch resolves. */
|
|
@@ -4911,6 +4945,8 @@ declare const DEFAULT_API_CALLS_CONFIG: ResolvedApiCallsConfig;
|
|
|
4911
4945
|
* - Missing `metrics[].placements` defaults to `['body']`.
|
|
4912
4946
|
* - Missing `pricing` defaults to an empty registry; built-in costs are only
|
|
4913
4947
|
* derived from configured model-keyed pricing and token counts.
|
|
4948
|
+
* - Missing `costCurrencies` defaults to an empty list; extra currencies only
|
|
4949
|
+
* affect the expanded LLM calls breakdown table.
|
|
4914
4950
|
*/
|
|
4915
4951
|
declare function resolveLlmCallsConfig(input: LlmCallsConfigInput | undefined): ResolvedLlmCallsConfig;
|
|
4916
4952
|
/**
|
|
@@ -5009,6 +5045,9 @@ type AgentEvalsConfig = {
|
|
|
5009
5045
|
* outputUsdPerMillion: 0.6,
|
|
5010
5046
|
* },
|
|
5011
5047
|
* },
|
|
5048
|
+
* costCurrencies: [
|
|
5049
|
+
* { code: 'BRL', usdToCurrencyRate: 5.7, numberFormat: { prefix: 'R$ ' } },
|
|
5050
|
+
* ],
|
|
5012
5051
|
* }
|
|
5013
5052
|
* ```
|
|
5014
5053
|
*/
|
|
@@ -5096,8 +5135,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5096
5135
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5097
5136
|
string: "string";
|
|
5098
5137
|
number: "number";
|
|
5099
|
-
json: "json";
|
|
5100
5138
|
duration: "duration";
|
|
5139
|
+
json: "json";
|
|
5101
5140
|
}>>;
|
|
5102
5141
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5103
5142
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5137,20 +5176,20 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5137
5176
|
aggregate: z$1.ZodEnum<{
|
|
5138
5177
|
last: "last";
|
|
5139
5178
|
sum: "sum";
|
|
5179
|
+
avg: "avg";
|
|
5140
5180
|
min: "min";
|
|
5141
5181
|
max: "max";
|
|
5142
|
-
avg: "avg";
|
|
5143
5182
|
}>;
|
|
5144
5183
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5145
5184
|
number: "number";
|
|
5146
5185
|
boolean: "boolean";
|
|
5186
|
+
duration: "duration";
|
|
5187
|
+
json: "json";
|
|
5147
5188
|
file: "file";
|
|
5148
5189
|
markdown: "markdown";
|
|
5149
|
-
json: "json";
|
|
5150
5190
|
image: "image";
|
|
5151
5191
|
audio: "audio";
|
|
5152
5192
|
video: "video";
|
|
5153
|
-
duration: "duration";
|
|
5154
5193
|
percent: "percent";
|
|
5155
5194
|
passFail: "passFail";
|
|
5156
5195
|
stars: "stars";
|
|
@@ -5195,6 +5234,12 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5195
5234
|
reasoningUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
5196
5235
|
}, z$1.core.$strip>>>;
|
|
5197
5236
|
}, z$1.core.$strip>>>;
|
|
5237
|
+
costCurrencies: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
5238
|
+
code: z$1.ZodString;
|
|
5239
|
+
label: z$1.ZodOptional<z$1.ZodString>;
|
|
5240
|
+
usdToCurrencyRate: z$1.ZodNumber;
|
|
5241
|
+
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5242
|
+
}, z$1.core.$strip>>>;
|
|
5198
5243
|
metrics: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
5199
5244
|
label: z$1.ZodString;
|
|
5200
5245
|
tooltip: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5203,8 +5248,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5203
5248
|
string: "string";
|
|
5204
5249
|
number: "number";
|
|
5205
5250
|
boolean: "boolean";
|
|
5206
|
-
json: "json";
|
|
5207
5251
|
duration: "duration";
|
|
5252
|
+
json: "json";
|
|
5208
5253
|
}>>;
|
|
5209
5254
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5210
5255
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5214,8 +5259,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5214
5259
|
}, z$1.core.$strip>>>;
|
|
5215
5260
|
}, z$1.core.$strip>>;
|
|
5216
5261
|
removeDefaultConfig: z$1.ZodOptional<z$1.ZodUnion<readonly [z$1.ZodLiteral<true>, z$1.ZodArray<z$1.ZodEnum<{
|
|
5217
|
-
apiCalls: "apiCalls";
|
|
5218
5262
|
costUsd: "costUsd";
|
|
5263
|
+
apiCalls: "apiCalls";
|
|
5219
5264
|
llmTurns: "llmTurns";
|
|
5220
5265
|
inputTokens: "inputTokens";
|
|
5221
5266
|
outputTokens: "outputTokens";
|
|
@@ -5248,8 +5293,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5248
5293
|
string: "string";
|
|
5249
5294
|
number: "number";
|
|
5250
5295
|
boolean: "boolean";
|
|
5251
|
-
json: "json";
|
|
5252
5296
|
duration: "duration";
|
|
5297
|
+
json: "json";
|
|
5253
5298
|
}>>;
|
|
5254
5299
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5255
5300
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5404,9 +5449,9 @@ declare function extractApiCalls(spans: EvalTraceSpan[], config: ResolvedApiCall
|
|
|
5404
5449
|
* - `refresh`: never read, always write (forces re-execution and overwrites).
|
|
5405
5450
|
*/
|
|
5406
5451
|
declare const cacheModeSchema: z$1.ZodEnum<{
|
|
5407
|
-
use: "use";
|
|
5408
|
-
bypass: "bypass";
|
|
5409
5452
|
refresh: "refresh";
|
|
5453
|
+
bypass: "bypass";
|
|
5454
|
+
use: "use";
|
|
5410
5455
|
}>;
|
|
5411
5456
|
/** Mode controlling how cached spans behave during a run. */
|
|
5412
5457
|
type CacheMode = z$1.infer<typeof cacheModeSchema>;
|
|
@@ -5427,10 +5472,10 @@ declare const cacheOperationTypeSchema: z$1.ZodEnum<{
|
|
|
5427
5472
|
type CacheOperationType = z$1.infer<typeof cacheOperationTypeSchema>;
|
|
5428
5473
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5429
5474
|
declare const cacheStatusSchema: z$1.ZodEnum<{
|
|
5430
|
-
bypass: "bypass";
|
|
5431
|
-
refresh: "refresh";
|
|
5432
5475
|
hit: "hit";
|
|
5433
5476
|
miss: "miss";
|
|
5477
|
+
refresh: "refresh";
|
|
5478
|
+
bypass: "bypass";
|
|
5434
5479
|
}>;
|
|
5435
5480
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5436
5481
|
type CacheStatus = z$1.infer<typeof cacheStatusSchema>;
|
|
@@ -5447,10 +5492,10 @@ declare const traceCacheRefSchema: z$1.ZodObject<{
|
|
|
5447
5492
|
namespace: z$1.ZodString;
|
|
5448
5493
|
key: z$1.ZodString;
|
|
5449
5494
|
status: z$1.ZodEnum<{
|
|
5450
|
-
bypass: "bypass";
|
|
5451
|
-
refresh: "refresh";
|
|
5452
5495
|
hit: "hit";
|
|
5453
5496
|
miss: "miss";
|
|
5497
|
+
refresh: "refresh";
|
|
5498
|
+
bypass: "bypass";
|
|
5454
5499
|
}>;
|
|
5455
5500
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
5456
5501
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -5528,8 +5573,8 @@ declare const cacheRecordingSchema: z$1.ZodObject<{
|
|
|
5528
5573
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5529
5574
|
error: "error";
|
|
5530
5575
|
running: "running";
|
|
5531
|
-
cancelled: "cancelled";
|
|
5532
5576
|
ok: "ok";
|
|
5577
|
+
cancelled: "cancelled";
|
|
5533
5578
|
}>>;
|
|
5534
5579
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5535
5580
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5601,8 +5646,8 @@ declare const cacheEntrySchema: z$1.ZodObject<{
|
|
|
5601
5646
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5602
5647
|
error: "error";
|
|
5603
5648
|
running: "running";
|
|
5604
|
-
cancelled: "cancelled";
|
|
5605
5649
|
ok: "ok";
|
|
5650
|
+
cancelled: "cancelled";
|
|
5606
5651
|
}>>;
|
|
5607
5652
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5608
5653
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5690,8 +5735,8 @@ declare const cacheEntryWithDebugKeySchema: z$1.ZodObject<{
|
|
|
5690
5735
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5691
5736
|
error: "error";
|
|
5692
5737
|
running: "running";
|
|
5693
|
-
cancelled: "cancelled";
|
|
5694
5738
|
ok: "ok";
|
|
5739
|
+
cancelled: "cancelled";
|
|
5695
5740
|
}>>;
|
|
5696
5741
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5697
5742
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5779,8 +5824,8 @@ declare const cacheFileSchema: z$1.ZodObject<{
|
|
|
5779
5824
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5780
5825
|
error: "error";
|
|
5781
5826
|
running: "running";
|
|
5782
|
-
cancelled: "cancelled";
|
|
5783
5827
|
ok: "ok";
|
|
5828
|
+
cancelled: "cancelled";
|
|
5784
5829
|
}>>;
|
|
5785
5830
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5786
5831
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5966,9 +6011,9 @@ declare const createRunRequestSchema: z$1.ZodObject<{
|
|
|
5966
6011
|
trials: z$1.ZodNumber;
|
|
5967
6012
|
cache: z$1.ZodOptional<z$1.ZodObject<{
|
|
5968
6013
|
mode: z$1.ZodDefault<z$1.ZodEnum<{
|
|
5969
|
-
use: "use";
|
|
5970
|
-
bypass: "bypass";
|
|
5971
6014
|
refresh: "refresh";
|
|
6015
|
+
bypass: "bypass";
|
|
6016
|
+
use: "use";
|
|
5972
6017
|
}>>;
|
|
5973
6018
|
}, z$1.core.$strip>>;
|
|
5974
6019
|
manualInputs: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
@@ -6238,4 +6283,4 @@ type ManualInputDescriptor = z$1.infer<typeof manualInputDescriptorSchema>; //#e
|
|
|
6238
6283
|
*/
|
|
6239
6284
|
declare function runCli(argv: string[]): Promise<void>;
|
|
6240
6285
|
//#endregion
|
|
6241
|
-
export { type AgentEvalsConfig, type ApiCallEntry, type ApiCallMetric, type ApiCallMetricFormat, type ApiCallMetricPlacement, type ApiCallMetricValue, type ApiCallsConfigInput, type AssertionFailure, type CacheActivityEntry, type CacheAdapter, type CacheDebugKeyEntry, type CacheDebugKeyFile, type CacheDebugKeyWrite, type CacheEntry, type CacheEntryWithDebugKey, type CacheFile, type CacheHitEntry, type CacheKeyHashInput, type CacheKeyHashOptions, type CacheListItem, type CacheMode, type CacheOperationType, type CacheRecording, type CacheRecordingFrame, type CacheRecordingOp, type CacheScopeContext, type CacheSerializationOptions, type CacheStatus, type CallDerivedAttribute, type CallDerivedAttributeContext, type CallDerivedAttributesConfig, type CallDerivedAttributesFn, type CaptureEvalSpanErrorLevel, type CaptureEvalSpanErrorOptions, type CaseDetail, type CaseRow, type CellValue, type ColumnDef, type ColumnFormat, type ColumnKind, type ConfigReloadState, type ConfigReloadStatus, type CreateRunRequest, DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, type DefaultConfigKey, type DerivedStatus, type DiscoveryIssue, EvalAssertionError, type EvalCacheConfig, type EvalCase, type EvalCaseScope, type EvalChartAggregate, type EvalChartAxis, type EvalChartBuiltinMetric, type EvalChartColor, type EvalChartConfig, type EvalChartMetric, type EvalChartTooltipExtra, type EvalChartType, type EvalChartsConfig, type EvalColumnOverride, type EvalColumns, type EvalDefinition, type EvalDeriveConfig, type EvalDeriveContext, type EvalDeriveFn, type EvalDeriveMap, type EvalDeriveValueFn, type EvalDisplayStatus, type EvalExecuteContext, type EvalExpectation, type EvalFreshnessStatus, type EvalManualInputConfig, type EvalManualScoreDef, type EvalOutputs, type EvalOutputsSchema, type EvalRunner, type EvalRuntimeScope, type EvalScoreContext, type EvalScoreDef, type EvalScoreFn, type EvalSetOutput, type EvalStartTime, type EvalStatAggregate, type EvalStatItem, type EvalStatsConfig, type EvalSummary, type EvalTimeUnit, type EvalTraceSpan, type EvalTraceSpanError, type EvalTraceSpanWarning, type EvalTraceTree, type FileRef, type JsonCell, type LlmCallEntry, type LlmCallMetric, type LlmCallMetricFormat, type LlmCallMetricPlacement, type LlmCallMetricValue, type LlmCallPricing, type LlmCallPricingRate, type LlmCallPricingRegistry, type LlmCallsConfigInput, type ManualInputDescriptor, type ManualInputFieldDescriptor, type ManualInputFieldKind, type ManualInputFieldOverride, type ManualInputFieldsConfig, type ManualInputFileValue, type ManualInputSelectOption, type MaterializeManualInputFilesResult, type NumberDisplayOptions, type ReadManualInputFileResult, type RemoveDefaultConfig, type RepoFileRef, type ResolvedApiCallMetric, type ResolvedApiCallsConfig, type ResolvedCallDerivedAttribute, type ResolvedLlmCallMetric, type ResolvedLlmCallPricing, type ResolvedLlmCallsConfig, type RunArtifactRef, type RunInEvalScopeOptions, type RunLogEntry, type RunLogLevel, type RunLogLocation, type RunLogPhase, type RunLogsConfigInput, type RunManifest, type RunSummary, type ScalarCell, type ScopedCaseSummary, type ScoreTrace, type SerializedCacheSpan, type SerializedCacheValue, type SpanCacheOptions, type SseEnvelope, type SseEventType, type TraceActiveSpan, type TraceAttributeDisplay, type TraceAttributeDisplayFormat, type TraceAttributeDisplayInput, type TraceAttributeDisplayPlacement, type TraceAttributeTransform, type TraceAttributeTransformContext, type TraceCacheInfo, type TraceCacheRef, type TraceDisplayConfig, type TraceDisplayInputConfig, type TraceSpanInfo, type TrialSelectionMode, type UpdateManualScoreRequest, advanceEvalTime, agentEvalsConfigSchema, apiCallMetricFormatSchema, apiCallMetricPlacementSchema, apiCallMetricSchema, apiCallsConfigSchema, appendToEvalOutput, applyDerivedCallAttributes, assertionFailureSchema, buildCaseKey, buildEvalKey, buildTraceTree, cacheDebugKeyEntrySchema, cacheDebugKeyFileSchema, cacheEntrySchema, cacheEntryWithDebugKeySchema, cacheFileSchema, cacheListItemSchema, cacheModeSchema, cacheOperationTypeSchema, cacheRecordingOpSchema, cacheRecordingSchema, cacheStatusSchema, captureEvalSpanError, caseDetailSchema, caseRowSchema, cellValueSchema, cleanupStagedManualInputFiles, columnDefSchema, columnFormatSchema, columnKindSchema, configReloadStateSchema, configReloadStatusSchema, createRunRequestSchema, createRunner, defaultConfigKeySchema, defineEval, deriveScopedSummaryFromCases, deriveStatusFromCaseRows, deriveStatusFromChildStatuses, deserializeCacheRecording, deserializeCacheValue, discoveryIssueSchema, evalAssert, evalChartAggregateSchema, evalChartAxisSchema, evalChartBuiltinMetricSchema, evalChartColorSchema, evalChartConfigSchema, evalChartMetricSchema, evalChartTooltipExtraSchema, evalChartTypeSchema, evalChartsConfigSchema, evalColumnOverrideSchema, evalColumnsSchema, evalDeriveConfigSchema, evalExpect, evalFreshnessStatusSchema, evalLog, evalSpan, evalStatAggregateSchema, evalStatItemSchema, evalStatsConfigSchema, evalSummarySchema, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, fileRefSchema, getCaseRowCaseKey, getCaseRowEvalKey, getCurrentScope, getEvalCaseInput, getEvalDisplayStatus, getEvalRegistry, getEvalStartTime, getEvalTitle, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, jsonCellSchema, llmCallMetricFormatSchema, llmCallMetricPlacementSchema, llmCallMetricSchema, llmCallPricingRateSchema, llmCallPricingSchema, llmCallsConfigSchema, manualInputBooleanFieldSchema, manualInputDescriptorSchema, manualInputFieldDescriptorSchema, manualInputFileValueSchema, manualInputJsonFieldSchema, manualInputMultilineFieldSchema, manualInputNumberFieldSchema, manualInputSelectFieldSchema, manualInputSelectOptionSchema, manualInputTextFieldSchema, materializeManualInputFiles, mergeEvalOutput, nextEvalId, numberDisplayOptionsSchema, readManualInputFile, removeDefaultConfigSchema, repoFile, repoFileRefSchema, resolveApiCallsConfig, resolveLlmCallsConfig, runArtifactRefSchema, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, runLogEntrySchema, runLogLevelSchema, runLogLocationSchema, runLogPhaseSchema, runLogsConfigSchema, runManifestSchema, runSummarySchema, scoreTraceSchema, serializeCacheRecording, serializeCacheValue, serializedCacheSpanSchema, setEvalOutput, setScopeCacheContext, spanCacheOptionsSchema, sseEnvelopeSchema, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, traceAttributeDisplayFormatSchema, traceAttributeDisplayInputSchema, traceAttributeDisplayPlacementSchema, traceAttributeDisplaySchema, traceCacheRefSchema, traceDisplayConfigSchema, traceDisplayInputConfigSchema, traceSpanErrorSchema, traceSpanKindSchema, traceSpanSchema, traceSpanWarningSchema, trialSelectionModeSchema, updateManualScoreRequestSchema, z };
|
|
6286
|
+
export { type AgentEvalsConfig, type ApiCallEntry, type ApiCallMetric, type ApiCallMetricFormat, type ApiCallMetricPlacement, type ApiCallMetricValue, type ApiCallsConfigInput, type AssertionFailure, type CacheActivityEntry, type CacheAdapter, type CacheDebugKeyEntry, type CacheDebugKeyFile, type CacheDebugKeyWrite, type CacheEntry, type CacheEntryWithDebugKey, type CacheFile, type CacheHitEntry, type CacheKeyHashInput, type CacheKeyHashOptions, type CacheListItem, type CacheMode, type CacheOperationType, type CacheRecording, type CacheRecordingFrame, type CacheRecordingOp, type CacheScopeContext, type CacheSerializationOptions, type CacheStatus, type CallDerivedAttribute, type CallDerivedAttributeContext, type CallDerivedAttributesConfig, type CallDerivedAttributesFn, type CaptureEvalSpanErrorLevel, type CaptureEvalSpanErrorOptions, type CaseDetail, type CaseRow, type CellValue, type ColumnDef, type ColumnFormat, type ColumnKind, type ConfigReloadState, type ConfigReloadStatus, type CreateRunRequest, DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, type DefaultConfigKey, type DerivedStatus, type DiscoveryIssue, EvalAssertionError, type EvalCacheConfig, type EvalCase, type EvalCaseScope, type EvalChartAggregate, type EvalChartAxis, type EvalChartBuiltinMetric, type EvalChartColor, type EvalChartConfig, type EvalChartMetric, type EvalChartTooltipExtra, type EvalChartType, type EvalChartsConfig, type EvalColumnOverride, type EvalColumns, type EvalDefinition, type EvalDeriveConfig, type EvalDeriveContext, type EvalDeriveFn, type EvalDeriveMap, type EvalDeriveValueFn, type EvalDisplayStatus, type EvalExecuteContext, type EvalExpectation, type EvalFreshnessStatus, type EvalManualInputConfig, type EvalManualScoreDef, type EvalOutputs, type EvalOutputsSchema, type EvalRunner, type EvalRuntimeScope, type EvalScoreContext, type EvalScoreDef, type EvalScoreFn, type EvalSetOutput, type EvalStartTime, type EvalStatAggregate, type EvalStatItem, type EvalStatsConfig, type EvalSummary, type EvalTimeUnit, type EvalTraceSpan, type EvalTraceSpanError, type EvalTraceSpanWarning, type EvalTraceTree, type FileRef, type JsonCell, type LlmCallCostCurrency, type LlmCallEntry, type LlmCallMetric, type LlmCallMetricFormat, type LlmCallMetricPlacement, type LlmCallMetricValue, type LlmCallPricing, type LlmCallPricingRate, type LlmCallPricingRegistry, type LlmCallsConfigInput, type ManualInputDescriptor, type ManualInputFieldDescriptor, type ManualInputFieldKind, type ManualInputFieldOverride, type ManualInputFieldsConfig, type ManualInputFileValue, type ManualInputSelectOption, type MaterializeManualInputFilesResult, type NumberDisplayOptions, type ReadManualInputFileResult, type RemoveDefaultConfig, type RepoFileRef, type ResolvedApiCallMetric, type ResolvedApiCallsConfig, type ResolvedCallDerivedAttribute, type ResolvedLlmCallCostCurrency, type ResolvedLlmCallMetric, type ResolvedLlmCallPricing, type ResolvedLlmCallsConfig, type RunArtifactRef, type RunInEvalScopeOptions, type RunLogEntry, type RunLogLevel, type RunLogLocation, type RunLogPhase, type RunLogsConfigInput, type RunManifest, type RunSummary, type ScalarCell, type ScopedCaseSummary, type ScoreTrace, type SerializedCacheSpan, type SerializedCacheValue, type SpanCacheOptions, type SseEnvelope, type SseEventType, type TraceActiveSpan, type TraceAttributeDisplay, type TraceAttributeDisplayFormat, type TraceAttributeDisplayInput, type TraceAttributeDisplayPlacement, type TraceAttributeTransform, type TraceAttributeTransformContext, type TraceCacheInfo, type TraceCacheRef, type TraceDisplayConfig, type TraceDisplayInputConfig, type TraceSpanInfo, type TrialSelectionMode, type UpdateManualScoreRequest, advanceEvalTime, agentEvalsConfigSchema, apiCallMetricFormatSchema, apiCallMetricPlacementSchema, apiCallMetricSchema, apiCallsConfigSchema, appendToEvalOutput, applyDerivedCallAttributes, assertionFailureSchema, buildCaseKey, buildEvalKey, buildTraceTree, cacheDebugKeyEntrySchema, cacheDebugKeyFileSchema, cacheEntrySchema, cacheEntryWithDebugKeySchema, cacheFileSchema, cacheListItemSchema, cacheModeSchema, cacheOperationTypeSchema, cacheRecordingOpSchema, cacheRecordingSchema, cacheStatusSchema, captureEvalSpanError, caseDetailSchema, caseRowSchema, cellValueSchema, cleanupStagedManualInputFiles, columnDefSchema, columnFormatSchema, columnKindSchema, configReloadStateSchema, configReloadStatusSchema, createRunRequestSchema, createRunner, defaultConfigKeySchema, defineEval, deriveScopedSummaryFromCases, deriveStatusFromCaseRows, deriveStatusFromChildStatuses, deserializeCacheRecording, deserializeCacheValue, discoveryIssueSchema, evalAssert, evalChartAggregateSchema, evalChartAxisSchema, evalChartBuiltinMetricSchema, evalChartColorSchema, evalChartConfigSchema, evalChartMetricSchema, evalChartTooltipExtraSchema, evalChartTypeSchema, evalChartsConfigSchema, evalColumnOverrideSchema, evalColumnsSchema, evalDeriveConfigSchema, evalExpect, evalFreshnessStatusSchema, evalLog, evalSpan, evalStatAggregateSchema, evalStatItemSchema, evalStatsConfigSchema, evalSummarySchema, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, fileRefSchema, getCaseRowCaseKey, getCaseRowEvalKey, getCurrentScope, getEvalCaseInput, getEvalDisplayStatus, getEvalRegistry, getEvalStartTime, getEvalTitle, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, jsonCellSchema, llmCallCostCurrencySchema, llmCallMetricFormatSchema, llmCallMetricPlacementSchema, llmCallMetricSchema, llmCallPricingRateSchema, llmCallPricingSchema, llmCallsConfigSchema, manualInputBooleanFieldSchema, manualInputDescriptorSchema, manualInputFieldDescriptorSchema, manualInputFileValueSchema, manualInputJsonFieldSchema, manualInputMultilineFieldSchema, manualInputNumberFieldSchema, manualInputSelectFieldSchema, manualInputSelectOptionSchema, manualInputTextFieldSchema, materializeManualInputFiles, mergeEvalOutput, nextEvalId, numberDisplayOptionsSchema, readManualInputFile, removeDefaultConfigSchema, repoFile, repoFileRefSchema, resolveApiCallsConfig, resolveLlmCallsConfig, runArtifactRefSchema, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, runLogEntrySchema, runLogLevelSchema, runLogLocationSchema, runLogPhaseSchema, runLogsConfigSchema, runManifestSchema, runSummarySchema, scoreTraceSchema, serializeCacheRecording, serializeCacheValue, serializedCacheSpanSchema, setEvalOutput, setScopeCacheContext, spanCacheOptionsSchema, sseEnvelopeSchema, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, traceAttributeDisplayFormatSchema, traceAttributeDisplayInputSchema, traceAttributeDisplayPlacementSchema, traceAttributeDisplaySchema, traceCacheRefSchema, traceDisplayConfigSchema, traceDisplayInputConfigSchema, traceSpanErrorSchema, traceSpanKindSchema, traceSpanSchema, traceSpanWarningSchema, trialSelectionModeSchema, updateManualScoreRequestSchema, z };
|