@ls-stack/agent-eval 0.29.0 → 0.31.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-D6-msfKP.mjs → app-BrSMRTpy.mjs} +4 -4
- package/dist/apps/web/dist/assets/index-CPcVyFRP.js +118 -0
- package/dist/apps/web/dist/assets/index-ClPR-tfN.css +1 -0
- package/dist/apps/web/dist/index.html +2 -2
- package/dist/bin.mjs +1 -1
- package/dist/{cli-CIc_gBNM.mjs → cli-CMPmuY7W.mjs} +3 -3
- package/dist/index.d.mts +182 -113
- package/dist/index.mjs +4 -4
- package/dist/runChild.mjs +1 -1
- package/dist/{runOrchestration-CIARrLs6.mjs → runOrchestration-CAyVXPFz.mjs} +69 -12
- package/dist/{runner-1F8MeY5V.mjs → runner-Bnm1nz0U.mjs} +2 -2
- package/dist/{runner-Bq1f9B9d.mjs → runner-CmpWwCe1.mjs} +1 -1
- package/dist/src-gZm9nyTp.mjs +3 -0
- package/package.json +1 -1
- package/skills/agent-eval/SKILL.md +12 -8
- package/dist/apps/web/dist/assets/index-BCr6J8Uj.js +0 -118
- package/dist/apps/web/dist/assets/index-DjUTm3M-.css +0 -1
- package/dist/src-CkWT1iSu.mjs +0 -3
package/dist/index.d.mts
CHANGED
|
@@ -700,10 +700,10 @@ declare const apiCallMetricPlacementSchema$1: z$1.ZodEnum<{
|
|
|
700
700
|
}>;
|
|
701
701
|
/** Placement option for an API-call metric. */
|
|
702
702
|
type ApiCallMetricPlacement$1 = z$1.infer<typeof apiCallMetricPlacementSchema$1>;
|
|
703
|
-
/** Context passed to
|
|
703
|
+
/** Context passed to LLM/API-call derived attribute functions. */
|
|
704
704
|
type CallDerivedAttributeContext$1 = {
|
|
705
|
-
/**
|
|
706
|
-
span: EvalTraceSpan$2; /** Dot-path helper for reading from
|
|
705
|
+
/** Current attributes from the matching trace span. */attributes: Record<string, unknown> | undefined; /** Matching trace span. */
|
|
706
|
+
span: EvalTraceSpan$2; /** Dot-path helper for reading from the current span attributes. */
|
|
707
707
|
get: (path: string) => unknown;
|
|
708
708
|
};
|
|
709
709
|
/**
|
|
@@ -711,14 +711,25 @@ type CallDerivedAttributeContext$1 = {
|
|
|
711
711
|
* LLM/API-call span. Return `undefined` to omit the attribute for that span.
|
|
712
712
|
*/
|
|
713
713
|
type CallDerivedAttribute$1 = (ctx: CallDerivedAttributeContext$1) => unknown;
|
|
714
|
+
/**
|
|
715
|
+
* Runner-side function used to derive multiple span attributes from a matching
|
|
716
|
+
* LLM/API-call span. Returned object keys are dot-paths under
|
|
717
|
+
* `span.attributes`; `undefined` values are skipped.
|
|
718
|
+
*/
|
|
719
|
+
type CallDerivedAttributesFn$1 = (ctx: CallDerivedAttributeContext$1) => Record<string, unknown> | undefined;
|
|
714
720
|
/** One resolved derived span attribute rule. */
|
|
715
721
|
type ResolvedCallDerivedAttribute$1 = {
|
|
716
|
-
/** Dot-path where
|
|
722
|
+
/** Dot-path where one derived value is persisted on `span.attributes`. */path?: string;
|
|
717
723
|
/**
|
|
718
|
-
* Function that derives
|
|
724
|
+
* Function that derives one persisted value for each matching span. Omitted
|
|
719
725
|
* after this config is serialized to the browser.
|
|
720
726
|
*/
|
|
721
727
|
compute?: CallDerivedAttribute$1;
|
|
728
|
+
/**
|
|
729
|
+
* Function that derives multiple persisted values for each matching span.
|
|
730
|
+
* Omitted after this config is serialized to the browser.
|
|
731
|
+
*/
|
|
732
|
+
computeMany?: CallDerivedAttributesFn$1;
|
|
722
733
|
};
|
|
723
734
|
/** Resolved LLM-calls config sent to the UI with all defaults applied. */
|
|
724
735
|
type ResolvedLlmCallsConfig$1 = {
|
|
@@ -743,6 +754,7 @@ type ResolvedLlmCallsConfig$1 = {
|
|
|
743
754
|
derivedAttributes: ResolvedCallDerivedAttribute$1[];
|
|
744
755
|
metrics: ResolvedLlmCallMetric$1[];
|
|
745
756
|
pricing: ResolvedLlmCallPricing$1[];
|
|
757
|
+
costCurrencies: ResolvedLlmCallCostCurrency$1[];
|
|
746
758
|
};
|
|
747
759
|
/** Resolved API-calls config sent to the UI with all defaults applied. */
|
|
748
760
|
type ResolvedApiCallsConfig$1 = {
|
|
@@ -790,6 +802,13 @@ type ResolvedLlmCallPricing$1 = {
|
|
|
790
802
|
cacheCreationInputUsdPerMillion?: number;
|
|
791
803
|
cacheCreationInput1hUsdPerMillion?: number;
|
|
792
804
|
reasoningUsdPerMillion?: number;
|
|
805
|
+
};
|
|
806
|
+
/** Fully-resolved extra currency used by the LLM calls tab. */
|
|
807
|
+
type ResolvedLlmCallCostCurrency$1 = {
|
|
808
|
+
code: string;
|
|
809
|
+
label?: string;
|
|
810
|
+
usdToCurrencyRate: number;
|
|
811
|
+
numberFormat?: NumberDisplayOptions$2;
|
|
793
812
|
}; //#endregion
|
|
794
813
|
//#region ../shared/src/schemas/cache.d.ts
|
|
795
814
|
/** Summary of a single persisted cache entry, used by list/delete endpoints. */
|
|
@@ -2889,13 +2908,13 @@ type ColumnKind = z$1.infer<typeof columnKindSchema>;
|
|
|
2889
2908
|
declare const columnFormatSchema: z$1.ZodEnum<{
|
|
2890
2909
|
number: "number";
|
|
2891
2910
|
boolean: "boolean";
|
|
2911
|
+
duration: "duration";
|
|
2912
|
+
json: "json";
|
|
2892
2913
|
file: "file";
|
|
2893
2914
|
markdown: "markdown";
|
|
2894
|
-
json: "json";
|
|
2895
2915
|
image: "image";
|
|
2896
2916
|
audio: "audio";
|
|
2897
2917
|
video: "video";
|
|
2898
|
-
duration: "duration";
|
|
2899
2918
|
percent: "percent";
|
|
2900
2919
|
passFail: "passFail";
|
|
2901
2920
|
stars: "stars";
|
|
@@ -2914,13 +2933,13 @@ declare const columnDefSchema: z$1.ZodObject<{
|
|
|
2914
2933
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
2915
2934
|
number: "number";
|
|
2916
2935
|
boolean: "boolean";
|
|
2936
|
+
duration: "duration";
|
|
2937
|
+
json: "json";
|
|
2917
2938
|
file: "file";
|
|
2918
2939
|
markdown: "markdown";
|
|
2919
|
-
json: "json";
|
|
2920
2940
|
image: "image";
|
|
2921
2941
|
audio: "audio";
|
|
2922
2942
|
video: "video";
|
|
2923
|
-
duration: "duration";
|
|
2924
2943
|
percent: "percent";
|
|
2925
2944
|
passFail: "passFail";
|
|
2926
2945
|
stars: "stars";
|
|
@@ -2965,8 +2984,8 @@ declare const traceSpanKindSchema: z$1.ZodString;
|
|
|
2965
2984
|
declare const traceAttributeDisplayFormatSchema: z$1.ZodEnum<{
|
|
2966
2985
|
string: "string";
|
|
2967
2986
|
number: "number";
|
|
2968
|
-
json: "json";
|
|
2969
2987
|
duration: "duration";
|
|
2988
|
+
json: "json";
|
|
2970
2989
|
}>;
|
|
2971
2990
|
/**
|
|
2972
2991
|
* Formatting hint for trace attribute values rendered by the UI.
|
|
@@ -2990,8 +3009,8 @@ declare const traceAttributeDisplaySchema: z$1.ZodObject<{
|
|
|
2990
3009
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
2991
3010
|
string: "string";
|
|
2992
3011
|
number: "number";
|
|
2993
|
-
json: "json";
|
|
2994
3012
|
duration: "duration";
|
|
3013
|
+
json: "json";
|
|
2995
3014
|
}>>;
|
|
2996
3015
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
2997
3016
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3004,9 +3023,9 @@ declare const traceAttributeDisplaySchema: z$1.ZodObject<{
|
|
|
3004
3023
|
subtree: "subtree";
|
|
3005
3024
|
}>>;
|
|
3006
3025
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3007
|
-
sum: "sum";
|
|
3008
|
-
last: "last";
|
|
3009
3026
|
all: "all";
|
|
3027
|
+
last: "last";
|
|
3028
|
+
sum: "sum";
|
|
3010
3029
|
}>>;
|
|
3011
3030
|
}, z$1.core.$strip>;
|
|
3012
3031
|
/**
|
|
@@ -3026,8 +3045,8 @@ declare const traceDisplayConfigSchema: z$1.ZodObject<{
|
|
|
3026
3045
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3027
3046
|
string: "string";
|
|
3028
3047
|
number: "number";
|
|
3029
|
-
json: "json";
|
|
3030
3048
|
duration: "duration";
|
|
3049
|
+
json: "json";
|
|
3031
3050
|
}>>;
|
|
3032
3051
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3033
3052
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3040,9 +3059,9 @@ declare const traceDisplayConfigSchema: z$1.ZodObject<{
|
|
|
3040
3059
|
subtree: "subtree";
|
|
3041
3060
|
}>>;
|
|
3042
3061
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3043
|
-
sum: "sum";
|
|
3044
|
-
last: "last";
|
|
3045
3062
|
all: "all";
|
|
3063
|
+
last: "last";
|
|
3064
|
+
sum: "sum";
|
|
3046
3065
|
}>>;
|
|
3047
3066
|
}, z$1.core.$strip>>>;
|
|
3048
3067
|
}, z$1.core.$strip>;
|
|
@@ -3066,8 +3085,8 @@ declare const traceAttributeDisplayInputSchema: z$1.ZodObject<{
|
|
|
3066
3085
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3067
3086
|
string: "string";
|
|
3068
3087
|
number: "number";
|
|
3069
|
-
json: "json";
|
|
3070
3088
|
duration: "duration";
|
|
3089
|
+
json: "json";
|
|
3071
3090
|
}>>;
|
|
3072
3091
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3073
3092
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3080,9 +3099,9 @@ declare const traceAttributeDisplayInputSchema: z$1.ZodObject<{
|
|
|
3080
3099
|
subtree: "subtree";
|
|
3081
3100
|
}>>;
|
|
3082
3101
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3083
|
-
sum: "sum";
|
|
3084
|
-
last: "last";
|
|
3085
3102
|
all: "all";
|
|
3103
|
+
last: "last";
|
|
3104
|
+
sum: "sum";
|
|
3086
3105
|
}>>;
|
|
3087
3106
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3088
3107
|
}, z$1.core.$strip>;
|
|
@@ -3104,8 +3123,8 @@ declare const traceDisplayInputConfigSchema: z$1.ZodObject<{
|
|
|
3104
3123
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3105
3124
|
string: "string";
|
|
3106
3125
|
number: "number";
|
|
3107
|
-
json: "json";
|
|
3108
3126
|
duration: "duration";
|
|
3127
|
+
json: "json";
|
|
3109
3128
|
}>>;
|
|
3110
3129
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3111
3130
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3118,9 +3137,9 @@ declare const traceDisplayInputConfigSchema: z$1.ZodObject<{
|
|
|
3118
3137
|
subtree: "subtree";
|
|
3119
3138
|
}>>;
|
|
3120
3139
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3121
|
-
sum: "sum";
|
|
3122
|
-
last: "last";
|
|
3123
3140
|
all: "all";
|
|
3141
|
+
last: "last";
|
|
3142
|
+
sum: "sum";
|
|
3124
3143
|
}>>;
|
|
3125
3144
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3126
3145
|
}, z$1.core.$strip>>>;
|
|
@@ -3157,8 +3176,8 @@ declare const traceSpanSchema: z$1.ZodObject<{
|
|
|
3157
3176
|
status: z$1.ZodEnum<{
|
|
3158
3177
|
error: "error";
|
|
3159
3178
|
running: "running";
|
|
3160
|
-
cancelled: "cancelled";
|
|
3161
3179
|
ok: "ok";
|
|
3180
|
+
cancelled: "cancelled";
|
|
3162
3181
|
}>;
|
|
3163
3182
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3164
3183
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3199,11 +3218,11 @@ declare const evalFreshnessStatusSchema: z$1.ZodEnum<{
|
|
|
3199
3218
|
type EvalFreshnessStatus = z$1.infer<typeof evalFreshnessStatusSchema>;
|
|
3200
3219
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3201
3220
|
declare const evalStatAggregateSchema: z$1.ZodEnum<{
|
|
3221
|
+
last: "last";
|
|
3222
|
+
sum: "sum";
|
|
3202
3223
|
avg: "avg";
|
|
3203
3224
|
min: "min";
|
|
3204
3225
|
max: "max";
|
|
3205
|
-
sum: "sum";
|
|
3206
|
-
last: "last";
|
|
3207
3226
|
}>;
|
|
3208
3227
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3209
3228
|
type EvalStatAggregate = z$1.infer<typeof evalStatAggregateSchema>;
|
|
@@ -3227,22 +3246,22 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
3227
3246
|
key: z$1.ZodString;
|
|
3228
3247
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3229
3248
|
aggregate: z$1.ZodEnum<{
|
|
3249
|
+
last: "last";
|
|
3250
|
+
sum: "sum";
|
|
3230
3251
|
avg: "avg";
|
|
3231
3252
|
min: "min";
|
|
3232
3253
|
max: "max";
|
|
3233
|
-
sum: "sum";
|
|
3234
|
-
last: "last";
|
|
3235
3254
|
}>;
|
|
3236
3255
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3237
3256
|
number: "number";
|
|
3238
3257
|
boolean: "boolean";
|
|
3258
|
+
duration: "duration";
|
|
3259
|
+
json: "json";
|
|
3239
3260
|
file: "file";
|
|
3240
3261
|
markdown: "markdown";
|
|
3241
|
-
json: "json";
|
|
3242
3262
|
image: "image";
|
|
3243
3263
|
audio: "audio";
|
|
3244
3264
|
video: "video";
|
|
3245
|
-
duration: "duration";
|
|
3246
3265
|
percent: "percent";
|
|
3247
3266
|
passFail: "passFail";
|
|
3248
3267
|
stars: "stars";
|
|
@@ -3269,22 +3288,22 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
|
|
|
3269
3288
|
key: z$1.ZodString;
|
|
3270
3289
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3271
3290
|
aggregate: z$1.ZodEnum<{
|
|
3291
|
+
last: "last";
|
|
3292
|
+
sum: "sum";
|
|
3272
3293
|
avg: "avg";
|
|
3273
3294
|
min: "min";
|
|
3274
3295
|
max: "max";
|
|
3275
|
-
sum: "sum";
|
|
3276
|
-
last: "last";
|
|
3277
3296
|
}>;
|
|
3278
3297
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3279
3298
|
number: "number";
|
|
3280
3299
|
boolean: "boolean";
|
|
3300
|
+
duration: "duration";
|
|
3301
|
+
json: "json";
|
|
3281
3302
|
file: "file";
|
|
3282
3303
|
markdown: "markdown";
|
|
3283
|
-
json: "json";
|
|
3284
3304
|
image: "image";
|
|
3285
3305
|
audio: "audio";
|
|
3286
3306
|
video: "video";
|
|
3287
|
-
duration: "duration";
|
|
3288
3307
|
percent: "percent";
|
|
3289
3308
|
passFail: "passFail";
|
|
3290
3309
|
stars: "stars";
|
|
@@ -3321,13 +3340,13 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3321
3340
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3322
3341
|
number: "number";
|
|
3323
3342
|
boolean: "boolean";
|
|
3343
|
+
duration: "duration";
|
|
3344
|
+
json: "json";
|
|
3324
3345
|
file: "file";
|
|
3325
3346
|
markdown: "markdown";
|
|
3326
|
-
json: "json";
|
|
3327
3347
|
image: "image";
|
|
3328
3348
|
audio: "audio";
|
|
3329
3349
|
video: "video";
|
|
3330
|
-
duration: "duration";
|
|
3331
3350
|
percent: "percent";
|
|
3332
3351
|
passFail: "passFail";
|
|
3333
3352
|
stars: "stars";
|
|
@@ -3348,10 +3367,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3348
3367
|
caseCount: z$1.ZodNullable<z$1.ZodNumber>;
|
|
3349
3368
|
lastRunStatus: z$1.ZodNullable<z$1.ZodEnum<{
|
|
3350
3369
|
error: "error";
|
|
3351
|
-
pass: "pass";
|
|
3352
|
-
fail: "fail";
|
|
3353
3370
|
running: "running";
|
|
3354
3371
|
cancelled: "cancelled";
|
|
3372
|
+
pass: "pass";
|
|
3373
|
+
fail: "fail";
|
|
3355
3374
|
unscored: "unscored";
|
|
3356
3375
|
}>>;
|
|
3357
3376
|
stats: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
@@ -3370,22 +3389,22 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3370
3389
|
key: z$1.ZodString;
|
|
3371
3390
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3372
3391
|
aggregate: z$1.ZodEnum<{
|
|
3392
|
+
last: "last";
|
|
3393
|
+
sum: "sum";
|
|
3373
3394
|
avg: "avg";
|
|
3374
3395
|
min: "min";
|
|
3375
3396
|
max: "max";
|
|
3376
|
-
sum: "sum";
|
|
3377
|
-
last: "last";
|
|
3378
3397
|
}>;
|
|
3379
3398
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3380
3399
|
number: "number";
|
|
3381
3400
|
boolean: "boolean";
|
|
3401
|
+
duration: "duration";
|
|
3402
|
+
json: "json";
|
|
3382
3403
|
file: "file";
|
|
3383
3404
|
markdown: "markdown";
|
|
3384
|
-
json: "json";
|
|
3385
3405
|
image: "image";
|
|
3386
3406
|
audio: "audio";
|
|
3387
3407
|
video: "video";
|
|
3388
|
-
duration: "duration";
|
|
3389
3408
|
percent: "percent";
|
|
3390
3409
|
passFail: "passFail";
|
|
3391
3410
|
stars: "stars";
|
|
@@ -3410,11 +3429,11 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3410
3429
|
}>;
|
|
3411
3430
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3412
3431
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3413
|
-
success: "success";
|
|
3414
3432
|
error: "error";
|
|
3433
|
+
success: "success";
|
|
3434
|
+
warning: "warning";
|
|
3415
3435
|
accent: "accent";
|
|
3416
3436
|
accentDim: "accentDim";
|
|
3417
|
-
warning: "warning";
|
|
3418
3437
|
textMuted: "textMuted";
|
|
3419
3438
|
}>>;
|
|
3420
3439
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3425,20 +3444,20 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3425
3444
|
source: z$1.ZodLiteral<"column">;
|
|
3426
3445
|
key: z$1.ZodString;
|
|
3427
3446
|
aggregate: z$1.ZodEnum<{
|
|
3447
|
+
sum: "sum";
|
|
3428
3448
|
avg: "avg";
|
|
3429
3449
|
min: "min";
|
|
3430
3450
|
max: "max";
|
|
3431
|
-
sum: "sum";
|
|
3432
3451
|
latest: "latest";
|
|
3433
3452
|
passThresholdRate: "passThresholdRate";
|
|
3434
3453
|
}>;
|
|
3435
3454
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3436
3455
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3437
|
-
success: "success";
|
|
3438
3456
|
error: "error";
|
|
3457
|
+
success: "success";
|
|
3458
|
+
warning: "warning";
|
|
3439
3459
|
accent: "accent";
|
|
3440
3460
|
accentDim: "accentDim";
|
|
3441
|
-
warning: "warning";
|
|
3442
3461
|
textMuted: "textMuted";
|
|
3443
3462
|
}>>;
|
|
3444
3463
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3467,10 +3486,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3467
3486
|
source: z$1.ZodLiteral<"column">;
|
|
3468
3487
|
key: z$1.ZodString;
|
|
3469
3488
|
aggregate: z$1.ZodEnum<{
|
|
3489
|
+
sum: "sum";
|
|
3470
3490
|
avg: "avg";
|
|
3471
3491
|
min: "min";
|
|
3472
3492
|
max: "max";
|
|
3473
|
-
sum: "sum";
|
|
3474
3493
|
latest: "latest";
|
|
3475
3494
|
passThresholdRate: "passThresholdRate";
|
|
3476
3495
|
}>;
|
|
@@ -3566,10 +3585,10 @@ declare const caseRowSchema: z$1.ZodObject<{
|
|
|
3566
3585
|
evalId: z$1.ZodString;
|
|
3567
3586
|
status: z$1.ZodEnum<{
|
|
3568
3587
|
error: "error";
|
|
3569
|
-
pass: "pass";
|
|
3570
|
-
fail: "fail";
|
|
3571
3588
|
running: "running";
|
|
3572
3589
|
cancelled: "cancelled";
|
|
3590
|
+
pass: "pass";
|
|
3591
|
+
fail: "fail";
|
|
3573
3592
|
pending: "pending";
|
|
3574
3593
|
}>;
|
|
3575
3594
|
durationMs: z$1.ZodNullable<z$1.ZodNumber>;
|
|
@@ -3662,8 +3681,8 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3662
3681
|
status: z$1.ZodEnum<{
|
|
3663
3682
|
error: "error";
|
|
3664
3683
|
running: "running";
|
|
3665
|
-
cancelled: "cancelled";
|
|
3666
3684
|
ok: "ok";
|
|
3685
|
+
cancelled: "cancelled";
|
|
3667
3686
|
}>;
|
|
3668
3687
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3669
3688
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3699,8 +3718,8 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3699
3718
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3700
3719
|
string: "string";
|
|
3701
3720
|
number: "number";
|
|
3702
|
-
json: "json";
|
|
3703
3721
|
duration: "duration";
|
|
3722
|
+
json: "json";
|
|
3704
3723
|
}>>;
|
|
3705
3724
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3706
3725
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3713,9 +3732,9 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3713
3732
|
subtree: "subtree";
|
|
3714
3733
|
}>>;
|
|
3715
3734
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3716
|
-
sum: "sum";
|
|
3717
|
-
last: "last";
|
|
3718
3735
|
all: "all";
|
|
3736
|
+
last: "last";
|
|
3737
|
+
sum: "sum";
|
|
3719
3738
|
}>>;
|
|
3720
3739
|
}, z$1.core.$strip>>>;
|
|
3721
3740
|
}, z$1.core.$strip>;
|
|
@@ -3730,10 +3749,10 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3730
3749
|
evalId: z$1.ZodString;
|
|
3731
3750
|
status: z$1.ZodEnum<{
|
|
3732
3751
|
error: "error";
|
|
3733
|
-
pass: "pass";
|
|
3734
|
-
fail: "fail";
|
|
3735
3752
|
running: "running";
|
|
3736
3753
|
cancelled: "cancelled";
|
|
3754
|
+
pass: "pass";
|
|
3755
|
+
fail: "fail";
|
|
3737
3756
|
pending: "pending";
|
|
3738
3757
|
}>;
|
|
3739
3758
|
input: z$1.ZodUnknown;
|
|
@@ -3748,8 +3767,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3748
3767
|
status: z$1.ZodEnum<{
|
|
3749
3768
|
error: "error";
|
|
3750
3769
|
running: "running";
|
|
3751
|
-
cancelled: "cancelled";
|
|
3752
3770
|
ok: "ok";
|
|
3771
|
+
cancelled: "cancelled";
|
|
3753
3772
|
}>;
|
|
3754
3773
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3755
3774
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3785,8 +3804,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3785
3804
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3786
3805
|
string: "string";
|
|
3787
3806
|
number: "number";
|
|
3788
|
-
json: "json";
|
|
3789
3807
|
duration: "duration";
|
|
3808
|
+
json: "json";
|
|
3790
3809
|
}>>;
|
|
3791
3810
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3792
3811
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3799,9 +3818,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3799
3818
|
subtree: "subtree";
|
|
3800
3819
|
}>>;
|
|
3801
3820
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3802
|
-
sum: "sum";
|
|
3803
|
-
last: "last";
|
|
3804
3821
|
all: "all";
|
|
3822
|
+
last: "last";
|
|
3823
|
+
sum: "sum";
|
|
3805
3824
|
}>>;
|
|
3806
3825
|
}, z$1.core.$strip>>>;
|
|
3807
3826
|
}, z$1.core.$strip>;
|
|
@@ -3817,8 +3836,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3817
3836
|
status: z$1.ZodEnum<{
|
|
3818
3837
|
error: "error";
|
|
3819
3838
|
running: "running";
|
|
3820
|
-
cancelled: "cancelled";
|
|
3821
3839
|
ok: "ok";
|
|
3840
|
+
cancelled: "cancelled";
|
|
3822
3841
|
}>;
|
|
3823
3842
|
attributes: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
|
3824
3843
|
error: z$1.ZodOptional<z$1.ZodObject<{
|
|
@@ -3854,8 +3873,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3854
3873
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3855
3874
|
string: "string";
|
|
3856
3875
|
number: "number";
|
|
3857
|
-
json: "json";
|
|
3858
3876
|
duration: "duration";
|
|
3877
|
+
json: "json";
|
|
3859
3878
|
}>>;
|
|
3860
3879
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3861
3880
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3868,9 +3887,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3868
3887
|
subtree: "subtree";
|
|
3869
3888
|
}>>;
|
|
3870
3889
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3871
|
-
sum: "sum";
|
|
3872
|
-
last: "last";
|
|
3873
3890
|
all: "all";
|
|
3891
|
+
last: "last";
|
|
3892
|
+
sum: "sum";
|
|
3874
3893
|
}>>;
|
|
3875
3894
|
}, z$1.core.$strip>>>;
|
|
3876
3895
|
}, z$1.core.$strip>;
|
|
@@ -4004,10 +4023,10 @@ declare const evalChartBuiltinMetricSchema: z$1.ZodEnum<{
|
|
|
4004
4023
|
type EvalChartBuiltinMetric = z$1.infer<typeof evalChartBuiltinMetricSchema>;
|
|
4005
4024
|
/** Reducer applied to a numeric column across all cases of a single run. */
|
|
4006
4025
|
declare const evalChartAggregateSchema: z$1.ZodEnum<{
|
|
4026
|
+
sum: "sum";
|
|
4007
4027
|
avg: "avg";
|
|
4008
4028
|
min: "min";
|
|
4009
4029
|
max: "max";
|
|
4010
|
-
sum: "sum";
|
|
4011
4030
|
latest: "latest";
|
|
4012
4031
|
passThresholdRate: "passThresholdRate";
|
|
4013
4032
|
}>;
|
|
@@ -4018,11 +4037,11 @@ type EvalChartAggregate = z$1.infer<typeof evalChartAggregateSchema>;
|
|
|
4018
4037
|
* not emit raw hex so authored evals stay decoupled from the web theme.
|
|
4019
4038
|
*/
|
|
4020
4039
|
declare const evalChartColorSchema: z$1.ZodEnum<{
|
|
4021
|
-
success: "success";
|
|
4022
4040
|
error: "error";
|
|
4041
|
+
success: "success";
|
|
4042
|
+
warning: "warning";
|
|
4023
4043
|
accent: "accent";
|
|
4024
4044
|
accentDim: "accentDim";
|
|
4025
|
-
warning: "warning";
|
|
4026
4045
|
textMuted: "textMuted";
|
|
4027
4046
|
}>;
|
|
4028
4047
|
/** Semantic color token resolved to a theme color by the web UI. */
|
|
@@ -4047,11 +4066,11 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4047
4066
|
}>;
|
|
4048
4067
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4049
4068
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4050
|
-
success: "success";
|
|
4051
4069
|
error: "error";
|
|
4070
|
+
success: "success";
|
|
4071
|
+
warning: "warning";
|
|
4052
4072
|
accent: "accent";
|
|
4053
4073
|
accentDim: "accentDim";
|
|
4054
|
-
warning: "warning";
|
|
4055
4074
|
textMuted: "textMuted";
|
|
4056
4075
|
}>>;
|
|
4057
4076
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4062,20 +4081,20 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4062
4081
|
source: z$1.ZodLiteral<"column">;
|
|
4063
4082
|
key: z$1.ZodString;
|
|
4064
4083
|
aggregate: z$1.ZodEnum<{
|
|
4084
|
+
sum: "sum";
|
|
4065
4085
|
avg: "avg";
|
|
4066
4086
|
min: "min";
|
|
4067
4087
|
max: "max";
|
|
4068
|
-
sum: "sum";
|
|
4069
4088
|
latest: "latest";
|
|
4070
4089
|
passThresholdRate: "passThresholdRate";
|
|
4071
4090
|
}>;
|
|
4072
4091
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4073
4092
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4074
|
-
success: "success";
|
|
4075
4093
|
error: "error";
|
|
4094
|
+
success: "success";
|
|
4095
|
+
warning: "warning";
|
|
4076
4096
|
accent: "accent";
|
|
4077
4097
|
accentDim: "accentDim";
|
|
4078
|
-
warning: "warning";
|
|
4079
4098
|
textMuted: "textMuted";
|
|
4080
4099
|
}>>;
|
|
4081
4100
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4097,10 +4116,10 @@ declare const evalChartTooltipExtraSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObj
|
|
|
4097
4116
|
source: z$1.ZodLiteral<"column">;
|
|
4098
4117
|
key: z$1.ZodString;
|
|
4099
4118
|
aggregate: z$1.ZodEnum<{
|
|
4119
|
+
sum: "sum";
|
|
4100
4120
|
avg: "avg";
|
|
4101
4121
|
min: "min";
|
|
4102
4122
|
max: "max";
|
|
4103
|
-
sum: "sum";
|
|
4104
4123
|
latest: "latest";
|
|
4105
4124
|
passThresholdRate: "passThresholdRate";
|
|
4106
4125
|
}>;
|
|
@@ -4130,11 +4149,11 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4130
4149
|
}>;
|
|
4131
4150
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4132
4151
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4133
|
-
success: "success";
|
|
4134
4152
|
error: "error";
|
|
4153
|
+
success: "success";
|
|
4154
|
+
warning: "warning";
|
|
4135
4155
|
accent: "accent";
|
|
4136
4156
|
accentDim: "accentDim";
|
|
4137
|
-
warning: "warning";
|
|
4138
4157
|
textMuted: "textMuted";
|
|
4139
4158
|
}>>;
|
|
4140
4159
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4145,20 +4164,20 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4145
4164
|
source: z$1.ZodLiteral<"column">;
|
|
4146
4165
|
key: z$1.ZodString;
|
|
4147
4166
|
aggregate: z$1.ZodEnum<{
|
|
4167
|
+
sum: "sum";
|
|
4148
4168
|
avg: "avg";
|
|
4149
4169
|
min: "min";
|
|
4150
4170
|
max: "max";
|
|
4151
|
-
sum: "sum";
|
|
4152
4171
|
latest: "latest";
|
|
4153
4172
|
passThresholdRate: "passThresholdRate";
|
|
4154
4173
|
}>;
|
|
4155
4174
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4156
4175
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4157
|
-
success: "success";
|
|
4158
4176
|
error: "error";
|
|
4177
|
+
success: "success";
|
|
4178
|
+
warning: "warning";
|
|
4159
4179
|
accent: "accent";
|
|
4160
4180
|
accentDim: "accentDim";
|
|
4161
|
-
warning: "warning";
|
|
4162
4181
|
textMuted: "textMuted";
|
|
4163
4182
|
}>>;
|
|
4164
4183
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4187,10 +4206,10 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4187
4206
|
source: z$1.ZodLiteral<"column">;
|
|
4188
4207
|
key: z$1.ZodString;
|
|
4189
4208
|
aggregate: z$1.ZodEnum<{
|
|
4209
|
+
sum: "sum";
|
|
4190
4210
|
avg: "avg";
|
|
4191
4211
|
min: "min";
|
|
4192
4212
|
max: "max";
|
|
4193
|
-
sum: "sum";
|
|
4194
4213
|
latest: "latest";
|
|
4195
4214
|
passThresholdRate: "passThresholdRate";
|
|
4196
4215
|
}>;
|
|
@@ -4220,11 +4239,11 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4220
4239
|
}>;
|
|
4221
4240
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4222
4241
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4223
|
-
success: "success";
|
|
4224
4242
|
error: "error";
|
|
4243
|
+
success: "success";
|
|
4244
|
+
warning: "warning";
|
|
4225
4245
|
accent: "accent";
|
|
4226
4246
|
accentDim: "accentDim";
|
|
4227
|
-
warning: "warning";
|
|
4228
4247
|
textMuted: "textMuted";
|
|
4229
4248
|
}>>;
|
|
4230
4249
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4235,20 +4254,20 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4235
4254
|
source: z$1.ZodLiteral<"column">;
|
|
4236
4255
|
key: z$1.ZodString;
|
|
4237
4256
|
aggregate: z$1.ZodEnum<{
|
|
4257
|
+
sum: "sum";
|
|
4238
4258
|
avg: "avg";
|
|
4239
4259
|
min: "min";
|
|
4240
4260
|
max: "max";
|
|
4241
|
-
sum: "sum";
|
|
4242
4261
|
latest: "latest";
|
|
4243
4262
|
passThresholdRate: "passThresholdRate";
|
|
4244
4263
|
}>;
|
|
4245
4264
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4246
4265
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4247
|
-
success: "success";
|
|
4248
4266
|
error: "error";
|
|
4267
|
+
success: "success";
|
|
4268
|
+
warning: "warning";
|
|
4249
4269
|
accent: "accent";
|
|
4250
4270
|
accentDim: "accentDim";
|
|
4251
|
-
warning: "warning";
|
|
4252
4271
|
textMuted: "textMuted";
|
|
4253
4272
|
}>>;
|
|
4254
4273
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4277,10 +4296,10 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4277
4296
|
source: z$1.ZodLiteral<"column">;
|
|
4278
4297
|
key: z$1.ZodString;
|
|
4279
4298
|
aggregate: z$1.ZodEnum<{
|
|
4299
|
+
sum: "sum";
|
|
4280
4300
|
avg: "avg";
|
|
4281
4301
|
min: "min";
|
|
4282
4302
|
max: "max";
|
|
4283
|
-
sum: "sum";
|
|
4284
4303
|
latest: "latest";
|
|
4285
4304
|
passThresholdRate: "passThresholdRate";
|
|
4286
4305
|
}>;
|
|
@@ -4555,8 +4574,8 @@ declare const llmCallMetricFormatSchema: z$1.ZodEnum<{
|
|
|
4555
4574
|
string: "string";
|
|
4556
4575
|
number: "number";
|
|
4557
4576
|
boolean: "boolean";
|
|
4558
|
-
json: "json";
|
|
4559
4577
|
duration: "duration";
|
|
4578
|
+
json: "json";
|
|
4560
4579
|
}>;
|
|
4561
4580
|
/** Render format applied to an LLM-call metric value. */
|
|
4562
4581
|
type LlmCallMetricFormat = z$1.infer<typeof llmCallMetricFormatSchema>;
|
|
@@ -4565,8 +4584,8 @@ declare const apiCallMetricFormatSchema: z$1.ZodEnum<{
|
|
|
4565
4584
|
string: "string";
|
|
4566
4585
|
number: "number";
|
|
4567
4586
|
boolean: "boolean";
|
|
4568
|
-
json: "json";
|
|
4569
4587
|
duration: "duration";
|
|
4588
|
+
json: "json";
|
|
4570
4589
|
}>;
|
|
4571
4590
|
/** Render format applied to an API-call metric value. */
|
|
4572
4591
|
type ApiCallMetricFormat = z$1.infer<typeof apiCallMetricFormatSchema>;
|
|
@@ -4584,10 +4603,10 @@ declare const apiCallMetricPlacementSchema: z$1.ZodEnum<{
|
|
|
4584
4603
|
}>;
|
|
4585
4604
|
/** Placement option for an API-call metric. */
|
|
4586
4605
|
type ApiCallMetricPlacement = z$1.infer<typeof apiCallMetricPlacementSchema>;
|
|
4587
|
-
/** Context passed to
|
|
4606
|
+
/** Context passed to LLM/API-call derived attribute functions. */
|
|
4588
4607
|
type CallDerivedAttributeContext = {
|
|
4589
|
-
/**
|
|
4590
|
-
span: EvalTraceSpan; /** Dot-path helper for reading from
|
|
4608
|
+
/** Current attributes from the matching trace span. */attributes: Record<string, unknown> | undefined; /** Matching trace span. */
|
|
4609
|
+
span: EvalTraceSpan; /** Dot-path helper for reading from the current span attributes. */
|
|
4591
4610
|
get: (path: string) => unknown;
|
|
4592
4611
|
};
|
|
4593
4612
|
/**
|
|
@@ -4595,14 +4614,27 @@ type CallDerivedAttributeContext = {
|
|
|
4595
4614
|
* LLM/API-call span. Return `undefined` to omit the attribute for that span.
|
|
4596
4615
|
*/
|
|
4597
4616
|
type CallDerivedAttribute = (ctx: CallDerivedAttributeContext) => unknown;
|
|
4617
|
+
/**
|
|
4618
|
+
* Runner-side function used to derive multiple span attributes from a matching
|
|
4619
|
+
* LLM/API-call span. Returned object keys are dot-paths under
|
|
4620
|
+
* `span.attributes`; `undefined` values are skipped.
|
|
4621
|
+
*/
|
|
4622
|
+
type CallDerivedAttributesFn = (ctx: CallDerivedAttributeContext) => Record<string, unknown> | undefined;
|
|
4623
|
+
/** Authored LLM/API-call derived-attributes config. */
|
|
4624
|
+
type CallDerivedAttributesConfig = Record<string, CallDerivedAttribute> | CallDerivedAttributesFn;
|
|
4598
4625
|
/** One resolved derived span attribute rule. */
|
|
4599
4626
|
type ResolvedCallDerivedAttribute = {
|
|
4600
|
-
/** Dot-path where
|
|
4627
|
+
/** Dot-path where one derived value is persisted on `span.attributes`. */path?: string;
|
|
4601
4628
|
/**
|
|
4602
|
-
* Function that derives
|
|
4629
|
+
* Function that derives one persisted value for each matching span. Omitted
|
|
4603
4630
|
* after this config is serialized to the browser.
|
|
4604
4631
|
*/
|
|
4605
4632
|
compute?: CallDerivedAttribute;
|
|
4633
|
+
/**
|
|
4634
|
+
* Function that derives multiple persisted values for each matching span.
|
|
4635
|
+
* Omitted after this config is serialized to the browser.
|
|
4636
|
+
*/
|
|
4637
|
+
computeMany?: CallDerivedAttributesFn;
|
|
4606
4638
|
};
|
|
4607
4639
|
/**
|
|
4608
4640
|
* Schema for a single user-defined metric attached to LLM call rows.
|
|
@@ -4622,8 +4654,8 @@ declare const llmCallMetricSchema: z$1.ZodObject<{
|
|
|
4622
4654
|
string: "string";
|
|
4623
4655
|
number: "number";
|
|
4624
4656
|
boolean: "boolean";
|
|
4625
|
-
json: "json";
|
|
4626
4657
|
duration: "duration";
|
|
4658
|
+
json: "json";
|
|
4627
4659
|
}>>;
|
|
4628
4660
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4629
4661
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4651,8 +4683,8 @@ declare const apiCallMetricSchema: z$1.ZodObject<{
|
|
|
4651
4683
|
string: "string";
|
|
4652
4684
|
number: "number";
|
|
4653
4685
|
boolean: "boolean";
|
|
4654
|
-
json: "json";
|
|
4655
4686
|
duration: "duration";
|
|
4687
|
+
json: "json";
|
|
4656
4688
|
}>>;
|
|
4657
4689
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4658
4690
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4701,6 +4733,18 @@ declare const llmCallPricingSchema: z$1.ZodObject<{
|
|
|
4701
4733
|
type LlmCallPricing = z$1.infer<typeof llmCallPricingSchema>;
|
|
4702
4734
|
/** Model-keyed pricing registry authored in `agent-evals.config.ts`. */
|
|
4703
4735
|
type LlmCallPricingRegistry = Record<string, LlmCallPricing>;
|
|
4736
|
+
/**
|
|
4737
|
+
* Schema for extra currencies displayed in the LLM calls breakdown table.
|
|
4738
|
+
* Costs are still derived in USD, then multiplied by `usdToCurrencyRate`.
|
|
4739
|
+
*/
|
|
4740
|
+
declare const llmCallCostCurrencySchema: z$1.ZodObject<{
|
|
4741
|
+
code: z$1.ZodString;
|
|
4742
|
+
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4743
|
+
usdToCurrencyRate: z$1.ZodNumber;
|
|
4744
|
+
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4745
|
+
}, z$1.core.$strip>;
|
|
4746
|
+
/** Extra LLM-call cost currency authored in `agent-evals.config.ts`. */
|
|
4747
|
+
type LlmCallCostCurrency = z$1.infer<typeof llmCallCostCurrencySchema>;
|
|
4704
4748
|
/** Schema for the global LLM calls config block in `agent-evals.config.ts`. */
|
|
4705
4749
|
declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
4706
4750
|
kinds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
@@ -4721,7 +4765,7 @@ declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
|
4721
4765
|
reasoning: z$1.ZodOptional<z$1.ZodString>;
|
|
4722
4766
|
toolCalls: z$1.ZodOptional<z$1.ZodString>;
|
|
4723
4767
|
}, z$1.core.$strip>>;
|
|
4724
|
-
derivedAttributes: z$1.ZodOptional<z$1.
|
|
4768
|
+
derivedAttributes: z$1.ZodOptional<z$1.ZodType<CallDerivedAttributesConfig, unknown, z$1.core.$ZodTypeInternals<CallDerivedAttributesConfig, unknown>>>;
|
|
4725
4769
|
pricing: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodObject<{
|
|
4726
4770
|
inputUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
4727
4771
|
outputUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
@@ -4739,6 +4783,12 @@ declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
|
4739
4783
|
reasoningUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
4740
4784
|
}, z$1.core.$strip>>>;
|
|
4741
4785
|
}, z$1.core.$strip>>>;
|
|
4786
|
+
costCurrencies: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
4787
|
+
code: z$1.ZodString;
|
|
4788
|
+
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4789
|
+
usdToCurrencyRate: z$1.ZodNumber;
|
|
4790
|
+
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4791
|
+
}, z$1.core.$strip>>>;
|
|
4742
4792
|
metrics: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
4743
4793
|
label: z$1.ZodString;
|
|
4744
4794
|
tooltip: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -4747,8 +4797,8 @@ declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
|
4747
4797
|
string: "string";
|
|
4748
4798
|
number: "number";
|
|
4749
4799
|
boolean: "boolean";
|
|
4750
|
-
json: "json";
|
|
4751
4800
|
duration: "duration";
|
|
4801
|
+
json: "json";
|
|
4752
4802
|
}>>;
|
|
4753
4803
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4754
4804
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4774,7 +4824,7 @@ declare const apiCallsConfigSchema: z$1.ZodObject<{
|
|
|
4774
4824
|
durationMs: z$1.ZodOptional<z$1.ZodString>;
|
|
4775
4825
|
error: z$1.ZodOptional<z$1.ZodString>;
|
|
4776
4826
|
}, z$1.core.$strip>>;
|
|
4777
|
-
derivedAttributes: z$1.ZodOptional<z$1.
|
|
4827
|
+
derivedAttributes: z$1.ZodOptional<z$1.ZodType<CallDerivedAttributesConfig, unknown, z$1.core.$ZodTypeInternals<CallDerivedAttributesConfig, unknown>>>;
|
|
4778
4828
|
metrics: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
4779
4829
|
label: z$1.ZodString;
|
|
4780
4830
|
tooltip: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -4783,8 +4833,8 @@ declare const apiCallsConfigSchema: z$1.ZodObject<{
|
|
|
4783
4833
|
string: "string";
|
|
4784
4834
|
number: "number";
|
|
4785
4835
|
boolean: "boolean";
|
|
4786
|
-
json: "json";
|
|
4787
4836
|
duration: "duration";
|
|
4837
|
+
json: "json";
|
|
4788
4838
|
}>>;
|
|
4789
4839
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4790
4840
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4824,6 +4874,7 @@ type ResolvedLlmCallsConfig = {
|
|
|
4824
4874
|
derivedAttributes: ResolvedCallDerivedAttribute[];
|
|
4825
4875
|
metrics: ResolvedLlmCallMetric[];
|
|
4826
4876
|
pricing: ResolvedLlmCallPricing[];
|
|
4877
|
+
costCurrencies: ResolvedLlmCallCostCurrency[];
|
|
4827
4878
|
};
|
|
4828
4879
|
/** Resolved API-calls config sent to the UI with all defaults applied. */
|
|
4829
4880
|
type ResolvedApiCallsConfig = {
|
|
@@ -4872,6 +4923,13 @@ type ResolvedLlmCallPricing = {
|
|
|
4872
4923
|
cacheCreationInput1hUsdPerMillion?: number;
|
|
4873
4924
|
reasoningUsdPerMillion?: number;
|
|
4874
4925
|
};
|
|
4926
|
+
/** Fully-resolved extra currency used by the LLM calls tab. */
|
|
4927
|
+
type ResolvedLlmCallCostCurrency = {
|
|
4928
|
+
code: string;
|
|
4929
|
+
label?: string;
|
|
4930
|
+
usdToCurrencyRate: number;
|
|
4931
|
+
numberFormat?: NumberDisplayOptions;
|
|
4932
|
+
};
|
|
4875
4933
|
/** Default LLM-calls config the UI uses before the workspace fetch resolves. */
|
|
4876
4934
|
declare const DEFAULT_LLM_CALLS_CONFIG: ResolvedLlmCallsConfig;
|
|
4877
4935
|
/** Default API-calls config the UI uses before the workspace fetch resolves. */
|
|
@@ -4887,6 +4945,8 @@ declare const DEFAULT_API_CALLS_CONFIG: ResolvedApiCallsConfig;
|
|
|
4887
4945
|
* - Missing `metrics[].placements` defaults to `['body']`.
|
|
4888
4946
|
* - Missing `pricing` defaults to an empty registry; built-in costs are only
|
|
4889
4947
|
* derived from configured model-keyed pricing and token counts.
|
|
4948
|
+
* - Missing `costCurrencies` defaults to an empty list; extra currencies only
|
|
4949
|
+
* affect the expanded LLM calls breakdown table.
|
|
4890
4950
|
*/
|
|
4891
4951
|
declare function resolveLlmCallsConfig(input: LlmCallsConfigInput | undefined): ResolvedLlmCallsConfig;
|
|
4892
4952
|
/**
|
|
@@ -4985,6 +5045,9 @@ type AgentEvalsConfig = {
|
|
|
4985
5045
|
* outputUsdPerMillion: 0.6,
|
|
4986
5046
|
* },
|
|
4987
5047
|
* },
|
|
5048
|
+
* costCurrencies: [
|
|
5049
|
+
* { code: 'BRL', usdToCurrencyRate: 5.7, numberFormat: { prefix: 'R$ ' } },
|
|
5050
|
+
* ],
|
|
4988
5051
|
* }
|
|
4989
5052
|
* ```
|
|
4990
5053
|
*/
|
|
@@ -5072,8 +5135,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5072
5135
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5073
5136
|
string: "string";
|
|
5074
5137
|
number: "number";
|
|
5075
|
-
json: "json";
|
|
5076
5138
|
duration: "duration";
|
|
5139
|
+
json: "json";
|
|
5077
5140
|
}>>;
|
|
5078
5141
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5079
5142
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5086,9 +5149,9 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5086
5149
|
subtree: "subtree";
|
|
5087
5150
|
}>>;
|
|
5088
5151
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5089
|
-
sum: "sum";
|
|
5090
|
-
last: "last";
|
|
5091
5152
|
all: "all";
|
|
5153
|
+
last: "last";
|
|
5154
|
+
sum: "sum";
|
|
5092
5155
|
}>>;
|
|
5093
5156
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
5094
5157
|
}, z$1.core.$strip>>>;
|
|
@@ -5111,22 +5174,22 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5111
5174
|
key: z$1.ZodString;
|
|
5112
5175
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
5113
5176
|
aggregate: z$1.ZodEnum<{
|
|
5177
|
+
last: "last";
|
|
5178
|
+
sum: "sum";
|
|
5114
5179
|
avg: "avg";
|
|
5115
5180
|
min: "min";
|
|
5116
5181
|
max: "max";
|
|
5117
|
-
sum: "sum";
|
|
5118
|
-
last: "last";
|
|
5119
5182
|
}>;
|
|
5120
5183
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5121
5184
|
number: "number";
|
|
5122
5185
|
boolean: "boolean";
|
|
5186
|
+
duration: "duration";
|
|
5187
|
+
json: "json";
|
|
5123
5188
|
file: "file";
|
|
5124
5189
|
markdown: "markdown";
|
|
5125
|
-
json: "json";
|
|
5126
5190
|
image: "image";
|
|
5127
5191
|
audio: "audio";
|
|
5128
5192
|
video: "video";
|
|
5129
|
-
duration: "duration";
|
|
5130
5193
|
percent: "percent";
|
|
5131
5194
|
passFail: "passFail";
|
|
5132
5195
|
stars: "stars";
|
|
@@ -5153,7 +5216,7 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5153
5216
|
reasoning: z$1.ZodOptional<z$1.ZodString>;
|
|
5154
5217
|
toolCalls: z$1.ZodOptional<z$1.ZodString>;
|
|
5155
5218
|
}, z$1.core.$strip>>;
|
|
5156
|
-
derivedAttributes: z$1.ZodOptional<z$1.
|
|
5219
|
+
derivedAttributes: z$1.ZodOptional<z$1.ZodType<CallDerivedAttributesConfig, unknown, z$1.core.$ZodTypeInternals<CallDerivedAttributesConfig, unknown>>>;
|
|
5157
5220
|
pricing: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodObject<{
|
|
5158
5221
|
inputUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
5159
5222
|
outputUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
@@ -5171,6 +5234,12 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5171
5234
|
reasoningUsdPerMillion: z$1.ZodOptional<z$1.ZodNumber>;
|
|
5172
5235
|
}, z$1.core.$strip>>>;
|
|
5173
5236
|
}, z$1.core.$strip>>>;
|
|
5237
|
+
costCurrencies: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
5238
|
+
code: z$1.ZodString;
|
|
5239
|
+
label: z$1.ZodOptional<z$1.ZodString>;
|
|
5240
|
+
usdToCurrencyRate: z$1.ZodNumber;
|
|
5241
|
+
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5242
|
+
}, z$1.core.$strip>>>;
|
|
5174
5243
|
metrics: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
5175
5244
|
label: z$1.ZodString;
|
|
5176
5245
|
tooltip: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5179,8 +5248,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5179
5248
|
string: "string";
|
|
5180
5249
|
number: "number";
|
|
5181
5250
|
boolean: "boolean";
|
|
5182
|
-
json: "json";
|
|
5183
5251
|
duration: "duration";
|
|
5252
|
+
json: "json";
|
|
5184
5253
|
}>>;
|
|
5185
5254
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5186
5255
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5215,7 +5284,7 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5215
5284
|
durationMs: z$1.ZodOptional<z$1.ZodString>;
|
|
5216
5285
|
error: z$1.ZodOptional<z$1.ZodString>;
|
|
5217
5286
|
}, z$1.core.$strip>>;
|
|
5218
|
-
derivedAttributes: z$1.ZodOptional<z$1.
|
|
5287
|
+
derivedAttributes: z$1.ZodOptional<z$1.ZodType<CallDerivedAttributesConfig, unknown, z$1.core.$ZodTypeInternals<CallDerivedAttributesConfig, unknown>>>;
|
|
5219
5288
|
metrics: z$1.ZodOptional<z$1.ZodArray<z$1.ZodObject<{
|
|
5220
5289
|
label: z$1.ZodString;
|
|
5221
5290
|
tooltip: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5224,8 +5293,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5224
5293
|
string: "string";
|
|
5225
5294
|
number: "number";
|
|
5226
5295
|
boolean: "boolean";
|
|
5227
|
-
json: "json";
|
|
5228
5296
|
duration: "duration";
|
|
5297
|
+
json: "json";
|
|
5229
5298
|
}>>;
|
|
5230
5299
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5231
5300
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5504,8 +5573,8 @@ declare const cacheRecordingSchema: z$1.ZodObject<{
|
|
|
5504
5573
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5505
5574
|
error: "error";
|
|
5506
5575
|
running: "running";
|
|
5507
|
-
cancelled: "cancelled";
|
|
5508
5576
|
ok: "ok";
|
|
5577
|
+
cancelled: "cancelled";
|
|
5509
5578
|
}>>;
|
|
5510
5579
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5511
5580
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5577,8 +5646,8 @@ declare const cacheEntrySchema: z$1.ZodObject<{
|
|
|
5577
5646
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5578
5647
|
error: "error";
|
|
5579
5648
|
running: "running";
|
|
5580
|
-
cancelled: "cancelled";
|
|
5581
5649
|
ok: "ok";
|
|
5650
|
+
cancelled: "cancelled";
|
|
5582
5651
|
}>>;
|
|
5583
5652
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5584
5653
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5666,8 +5735,8 @@ declare const cacheEntryWithDebugKeySchema: z$1.ZodObject<{
|
|
|
5666
5735
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5667
5736
|
error: "error";
|
|
5668
5737
|
running: "running";
|
|
5669
|
-
cancelled: "cancelled";
|
|
5670
5738
|
ok: "ok";
|
|
5739
|
+
cancelled: "cancelled";
|
|
5671
5740
|
}>>;
|
|
5672
5741
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5673
5742
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -5755,8 +5824,8 @@ declare const cacheFileSchema: z$1.ZodObject<{
|
|
|
5755
5824
|
finalStatus: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5756
5825
|
error: "error";
|
|
5757
5826
|
running: "running";
|
|
5758
|
-
cancelled: "cancelled";
|
|
5759
5827
|
ok: "ok";
|
|
5828
|
+
cancelled: "cancelled";
|
|
5760
5829
|
}>>;
|
|
5761
5830
|
finalError: z$1.ZodOptional<z$1.ZodObject<{
|
|
5762
5831
|
name: z$1.ZodOptional<z$1.ZodString>;
|
|
@@ -6214,4 +6283,4 @@ type ManualInputDescriptor = z$1.infer<typeof manualInputDescriptorSchema>; //#e
|
|
|
6214
6283
|
*/
|
|
6215
6284
|
declare function runCli(argv: string[]): Promise<void>;
|
|
6216
6285
|
//#endregion
|
|
6217
|
-
export { type AgentEvalsConfig, type ApiCallEntry, type ApiCallMetric, type ApiCallMetricFormat, type ApiCallMetricPlacement, type ApiCallMetricValue, type ApiCallsConfigInput, type AssertionFailure, type CacheActivityEntry, type CacheAdapter, type CacheDebugKeyEntry, type CacheDebugKeyFile, type CacheDebugKeyWrite, type CacheEntry, type CacheEntryWithDebugKey, type CacheFile, type CacheHitEntry, type CacheKeyHashInput, type CacheKeyHashOptions, type CacheListItem, type CacheMode, type CacheOperationType, type CacheRecording, type CacheRecordingFrame, type CacheRecordingOp, type CacheScopeContext, type CacheSerializationOptions, type CacheStatus, type CallDerivedAttribute, type CallDerivedAttributeContext, type CaptureEvalSpanErrorLevel, type CaptureEvalSpanErrorOptions, type CaseDetail, type CaseRow, type CellValue, type ColumnDef, type ColumnFormat, type ColumnKind, type ConfigReloadState, type ConfigReloadStatus, type CreateRunRequest, DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, type DefaultConfigKey, type DerivedStatus, type DiscoveryIssue, EvalAssertionError, type EvalCacheConfig, type EvalCase, type EvalCaseScope, type EvalChartAggregate, type EvalChartAxis, type EvalChartBuiltinMetric, type EvalChartColor, type EvalChartConfig, type EvalChartMetric, type EvalChartTooltipExtra, type EvalChartType, type EvalChartsConfig, type EvalColumnOverride, type EvalColumns, type EvalDefinition, type EvalDeriveConfig, type EvalDeriveContext, type EvalDeriveFn, type EvalDeriveMap, type EvalDeriveValueFn, type EvalDisplayStatus, type EvalExecuteContext, type EvalExpectation, type EvalFreshnessStatus, type EvalManualInputConfig, type EvalManualScoreDef, type EvalOutputs, type EvalOutputsSchema, type EvalRunner, type EvalRuntimeScope, type EvalScoreContext, type EvalScoreDef, type EvalScoreFn, type EvalSetOutput, type EvalStartTime, type EvalStatAggregate, type EvalStatItem, type EvalStatsConfig, type EvalSummary, type EvalTimeUnit, type EvalTraceSpan, type EvalTraceSpanError, type EvalTraceSpanWarning, type EvalTraceTree, type FileRef, type JsonCell, type LlmCallEntry, type LlmCallMetric, type LlmCallMetricFormat, type LlmCallMetricPlacement, type LlmCallMetricValue, type LlmCallPricing, type LlmCallPricingRate, type LlmCallPricingRegistry, type LlmCallsConfigInput, type ManualInputDescriptor, type ManualInputFieldDescriptor, type ManualInputFieldKind, type ManualInputFieldOverride, type ManualInputFieldsConfig, type ManualInputFileValue, type ManualInputSelectOption, type MaterializeManualInputFilesResult, type NumberDisplayOptions, type ReadManualInputFileResult, type RemoveDefaultConfig, type RepoFileRef, type ResolvedApiCallMetric, type ResolvedApiCallsConfig, type ResolvedCallDerivedAttribute, type ResolvedLlmCallMetric, type ResolvedLlmCallPricing, type ResolvedLlmCallsConfig, type RunArtifactRef, type RunInEvalScopeOptions, type RunLogEntry, type RunLogLevel, type RunLogLocation, type RunLogPhase, type RunLogsConfigInput, type RunManifest, type RunSummary, type ScalarCell, type ScopedCaseSummary, type ScoreTrace, type SerializedCacheSpan, type SerializedCacheValue, type SpanCacheOptions, type SseEnvelope, type SseEventType, type TraceActiveSpan, type TraceAttributeDisplay, type TraceAttributeDisplayFormat, type TraceAttributeDisplayInput, type TraceAttributeDisplayPlacement, type TraceAttributeTransform, type TraceAttributeTransformContext, type TraceCacheInfo, type TraceCacheRef, type TraceDisplayConfig, type TraceDisplayInputConfig, type TraceSpanInfo, type TrialSelectionMode, type UpdateManualScoreRequest, advanceEvalTime, agentEvalsConfigSchema, apiCallMetricFormatSchema, apiCallMetricPlacementSchema, apiCallMetricSchema, apiCallsConfigSchema, appendToEvalOutput, applyDerivedCallAttributes, assertionFailureSchema, buildCaseKey, buildEvalKey, buildTraceTree, cacheDebugKeyEntrySchema, cacheDebugKeyFileSchema, cacheEntrySchema, cacheEntryWithDebugKeySchema, cacheFileSchema, cacheListItemSchema, cacheModeSchema, cacheOperationTypeSchema, cacheRecordingOpSchema, cacheRecordingSchema, cacheStatusSchema, captureEvalSpanError, caseDetailSchema, caseRowSchema, cellValueSchema, cleanupStagedManualInputFiles, columnDefSchema, columnFormatSchema, columnKindSchema, configReloadStateSchema, configReloadStatusSchema, createRunRequestSchema, createRunner, defaultConfigKeySchema, defineEval, deriveScopedSummaryFromCases, deriveStatusFromCaseRows, deriveStatusFromChildStatuses, deserializeCacheRecording, deserializeCacheValue, discoveryIssueSchema, evalAssert, evalChartAggregateSchema, evalChartAxisSchema, evalChartBuiltinMetricSchema, evalChartColorSchema, evalChartConfigSchema, evalChartMetricSchema, evalChartTooltipExtraSchema, evalChartTypeSchema, evalChartsConfigSchema, evalColumnOverrideSchema, evalColumnsSchema, evalDeriveConfigSchema, evalExpect, evalFreshnessStatusSchema, evalLog, evalSpan, evalStatAggregateSchema, evalStatItemSchema, evalStatsConfigSchema, evalSummarySchema, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, fileRefSchema, getCaseRowCaseKey, getCaseRowEvalKey, getCurrentScope, getEvalCaseInput, getEvalDisplayStatus, getEvalRegistry, getEvalStartTime, getEvalTitle, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, jsonCellSchema, llmCallMetricFormatSchema, llmCallMetricPlacementSchema, llmCallMetricSchema, llmCallPricingRateSchema, llmCallPricingSchema, llmCallsConfigSchema, manualInputBooleanFieldSchema, manualInputDescriptorSchema, manualInputFieldDescriptorSchema, manualInputFileValueSchema, manualInputJsonFieldSchema, manualInputMultilineFieldSchema, manualInputNumberFieldSchema, manualInputSelectFieldSchema, manualInputSelectOptionSchema, manualInputTextFieldSchema, materializeManualInputFiles, mergeEvalOutput, nextEvalId, numberDisplayOptionsSchema, readManualInputFile, removeDefaultConfigSchema, repoFile, repoFileRefSchema, resolveApiCallsConfig, resolveLlmCallsConfig, runArtifactRefSchema, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, runLogEntrySchema, runLogLevelSchema, runLogLocationSchema, runLogPhaseSchema, runLogsConfigSchema, runManifestSchema, runSummarySchema, scoreTraceSchema, serializeCacheRecording, serializeCacheValue, serializedCacheSpanSchema, setEvalOutput, setScopeCacheContext, spanCacheOptionsSchema, sseEnvelopeSchema, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, traceAttributeDisplayFormatSchema, traceAttributeDisplayInputSchema, traceAttributeDisplayPlacementSchema, traceAttributeDisplaySchema, traceCacheRefSchema, traceDisplayConfigSchema, traceDisplayInputConfigSchema, traceSpanErrorSchema, traceSpanKindSchema, traceSpanSchema, traceSpanWarningSchema, trialSelectionModeSchema, updateManualScoreRequestSchema, z };
|
|
6286
|
+
export { type AgentEvalsConfig, type ApiCallEntry, type ApiCallMetric, type ApiCallMetricFormat, type ApiCallMetricPlacement, type ApiCallMetricValue, type ApiCallsConfigInput, type AssertionFailure, type CacheActivityEntry, type CacheAdapter, type CacheDebugKeyEntry, type CacheDebugKeyFile, type CacheDebugKeyWrite, type CacheEntry, type CacheEntryWithDebugKey, type CacheFile, type CacheHitEntry, type CacheKeyHashInput, type CacheKeyHashOptions, type CacheListItem, type CacheMode, type CacheOperationType, type CacheRecording, type CacheRecordingFrame, type CacheRecordingOp, type CacheScopeContext, type CacheSerializationOptions, type CacheStatus, type CallDerivedAttribute, type CallDerivedAttributeContext, type CallDerivedAttributesConfig, type CallDerivedAttributesFn, type CaptureEvalSpanErrorLevel, type CaptureEvalSpanErrorOptions, type CaseDetail, type CaseRow, type CellValue, type ColumnDef, type ColumnFormat, type ColumnKind, type ConfigReloadState, type ConfigReloadStatus, type CreateRunRequest, DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, type DefaultConfigKey, type DerivedStatus, type DiscoveryIssue, EvalAssertionError, type EvalCacheConfig, type EvalCase, type EvalCaseScope, type EvalChartAggregate, type EvalChartAxis, type EvalChartBuiltinMetric, type EvalChartColor, type EvalChartConfig, type EvalChartMetric, type EvalChartTooltipExtra, type EvalChartType, type EvalChartsConfig, type EvalColumnOverride, type EvalColumns, type EvalDefinition, type EvalDeriveConfig, type EvalDeriveContext, type EvalDeriveFn, type EvalDeriveMap, type EvalDeriveValueFn, type EvalDisplayStatus, type EvalExecuteContext, type EvalExpectation, type EvalFreshnessStatus, type EvalManualInputConfig, type EvalManualScoreDef, type EvalOutputs, type EvalOutputsSchema, type EvalRunner, type EvalRuntimeScope, type EvalScoreContext, type EvalScoreDef, type EvalScoreFn, type EvalSetOutput, type EvalStartTime, type EvalStatAggregate, type EvalStatItem, type EvalStatsConfig, type EvalSummary, type EvalTimeUnit, type EvalTraceSpan, type EvalTraceSpanError, type EvalTraceSpanWarning, type EvalTraceTree, type FileRef, type JsonCell, type LlmCallCostCurrency, type LlmCallEntry, type LlmCallMetric, type LlmCallMetricFormat, type LlmCallMetricPlacement, type LlmCallMetricValue, type LlmCallPricing, type LlmCallPricingRate, type LlmCallPricingRegistry, type LlmCallsConfigInput, type ManualInputDescriptor, type ManualInputFieldDescriptor, type ManualInputFieldKind, type ManualInputFieldOverride, type ManualInputFieldsConfig, type ManualInputFileValue, type ManualInputSelectOption, type MaterializeManualInputFilesResult, type NumberDisplayOptions, type ReadManualInputFileResult, type RemoveDefaultConfig, type RepoFileRef, type ResolvedApiCallMetric, type ResolvedApiCallsConfig, type ResolvedCallDerivedAttribute, type ResolvedLlmCallCostCurrency, type ResolvedLlmCallMetric, type ResolvedLlmCallPricing, type ResolvedLlmCallsConfig, type RunArtifactRef, type RunInEvalScopeOptions, type RunLogEntry, type RunLogLevel, type RunLogLocation, type RunLogPhase, type RunLogsConfigInput, type RunManifest, type RunSummary, type ScalarCell, type ScopedCaseSummary, type ScoreTrace, type SerializedCacheSpan, type SerializedCacheValue, type SpanCacheOptions, type SseEnvelope, type SseEventType, type TraceActiveSpan, type TraceAttributeDisplay, type TraceAttributeDisplayFormat, type TraceAttributeDisplayInput, type TraceAttributeDisplayPlacement, type TraceAttributeTransform, type TraceAttributeTransformContext, type TraceCacheInfo, type TraceCacheRef, type TraceDisplayConfig, type TraceDisplayInputConfig, type TraceSpanInfo, type TrialSelectionMode, type UpdateManualScoreRequest, advanceEvalTime, agentEvalsConfigSchema, apiCallMetricFormatSchema, apiCallMetricPlacementSchema, apiCallMetricSchema, apiCallsConfigSchema, appendToEvalOutput, applyDerivedCallAttributes, assertionFailureSchema, buildCaseKey, buildEvalKey, buildTraceTree, cacheDebugKeyEntrySchema, cacheDebugKeyFileSchema, cacheEntrySchema, cacheEntryWithDebugKeySchema, cacheFileSchema, cacheListItemSchema, cacheModeSchema, cacheOperationTypeSchema, cacheRecordingOpSchema, cacheRecordingSchema, cacheStatusSchema, captureEvalSpanError, caseDetailSchema, caseRowSchema, cellValueSchema, cleanupStagedManualInputFiles, columnDefSchema, columnFormatSchema, columnKindSchema, configReloadStateSchema, configReloadStatusSchema, createRunRequestSchema, createRunner, defaultConfigKeySchema, defineEval, deriveScopedSummaryFromCases, deriveStatusFromCaseRows, deriveStatusFromChildStatuses, deserializeCacheRecording, deserializeCacheValue, discoveryIssueSchema, evalAssert, evalChartAggregateSchema, evalChartAxisSchema, evalChartBuiltinMetricSchema, evalChartColorSchema, evalChartConfigSchema, evalChartMetricSchema, evalChartTooltipExtraSchema, evalChartTypeSchema, evalChartsConfigSchema, evalColumnOverrideSchema, evalColumnsSchema, evalDeriveConfigSchema, evalExpect, evalFreshnessStatusSchema, evalLog, evalSpan, evalStatAggregateSchema, evalStatItemSchema, evalStatsConfigSchema, evalSummarySchema, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, fileRefSchema, getCaseRowCaseKey, getCaseRowEvalKey, getCurrentScope, getEvalCaseInput, getEvalDisplayStatus, getEvalRegistry, getEvalStartTime, getEvalTitle, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, jsonCellSchema, llmCallCostCurrencySchema, llmCallMetricFormatSchema, llmCallMetricPlacementSchema, llmCallMetricSchema, llmCallPricingRateSchema, llmCallPricingSchema, llmCallsConfigSchema, manualInputBooleanFieldSchema, manualInputDescriptorSchema, manualInputFieldDescriptorSchema, manualInputFileValueSchema, manualInputJsonFieldSchema, manualInputMultilineFieldSchema, manualInputNumberFieldSchema, manualInputSelectFieldSchema, manualInputSelectOptionSchema, manualInputTextFieldSchema, materializeManualInputFiles, mergeEvalOutput, nextEvalId, numberDisplayOptionsSchema, readManualInputFile, removeDefaultConfigSchema, repoFile, repoFileRefSchema, resolveApiCallsConfig, resolveLlmCallsConfig, runArtifactRefSchema, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, runLogEntrySchema, runLogLevelSchema, runLogLocationSchema, runLogPhaseSchema, runLogsConfigSchema, runManifestSchema, runSummarySchema, scoreTraceSchema, serializeCacheRecording, serializeCacheValue, serializedCacheSpanSchema, setEvalOutput, setScopeCacheContext, spanCacheOptionsSchema, sseEnvelopeSchema, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, traceAttributeDisplayFormatSchema, traceAttributeDisplayInputSchema, traceAttributeDisplayPlacementSchema, traceAttributeDisplaySchema, traceCacheRefSchema, traceDisplayConfigSchema, traceDisplayInputConfigSchema, traceSpanErrorSchema, traceSpanKindSchema, traceSpanSchema, traceSpanWarningSchema, trialSelectionModeSchema, updateManualScoreRequestSchema, z };
|