@ls-stack/agent-eval 0.36.0 → 0.38.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-BlNzXWDM.mjs → app-DD-8kx5H.mjs} +50 -6
- package/dist/apps/web/dist/assets/index-C6PgBOfP.css +1 -0
- package/dist/apps/web/dist/assets/index-CO86PsY-.js +140 -0
- package/dist/apps/web/dist/index.html +2 -2
- package/dist/bin.mjs +14 -3
- package/dist/{cli-Dg3abrOv.mjs → cli-BUX6tr9J.mjs} +106 -25
- package/dist/index.d.mts +159 -150
- package/dist/index.mjs +3 -3
- package/dist/runChild.mjs +73 -2
- package/dist/{runOrchestration-V1TxX8es.mjs → runOrchestration-BhUFWvq9.mjs} +293 -121
- package/dist/{runner-BCs5rzej.mjs → runner-B1wfPKNH.mjs} +2 -2
- package/dist/{runner-znY6PY1M.mjs → runner-CoRf7Vef.mjs} +1 -1
- package/dist/src-BwJ5tod2.mjs +3 -0
- package/package.json +3 -3
- package/skills/agent-eval/SKILL.md +18 -6
- package/dist/apps/web/dist/assets/index-BYtcGddU.js +0 -140
- package/dist/apps/web/dist/assets/index-D0rC5MSS.css +0 -1
- package/dist/src-DBypR4TV.mjs +0 -3
package/dist/index.d.mts
CHANGED
|
@@ -127,6 +127,7 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
|
|
|
127
127
|
}>>;
|
|
128
128
|
}, z$1.core.$strip>>;
|
|
129
129
|
caseCount: z$1.ZodNullable<z$1.ZodNumber>;
|
|
130
|
+
caseIds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
130
131
|
lastRunStatus: z$1.ZodNullable<z$1.ZodEnum<{
|
|
131
132
|
error: "error";
|
|
132
133
|
pass: "pass";
|
|
@@ -617,6 +618,7 @@ declare const runManifestSchema$1: z$1.ZodObject<{
|
|
|
617
618
|
cancelled: "cancelled";
|
|
618
619
|
error: "error";
|
|
619
620
|
}>;
|
|
621
|
+
temporary: z$1.ZodDefault<z$1.ZodOptional<z$1.ZodBoolean>>;
|
|
620
622
|
startedAt: z$1.ZodString;
|
|
621
623
|
endedAt: z$1.ZodNullable<z$1.ZodString>;
|
|
622
624
|
commitSha: z$1.ZodDefault<z$1.ZodOptional<z$1.ZodNullable<z$1.ZodString>>>;
|
|
@@ -963,6 +965,7 @@ declare const createRunRequestSchema$1: z$1.ZodObject<{
|
|
|
963
965
|
caseIds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
964
966
|
}, z$1.core.$strip>;
|
|
965
967
|
trials: z$1.ZodNumber;
|
|
968
|
+
temporary: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
966
969
|
cache: z$1.ZodOptional<z$1.ZodObject<{
|
|
967
970
|
mode: z$1.ZodDefault<z$1.ZodEnum<{
|
|
968
971
|
use: "use";
|
|
@@ -2349,6 +2352,56 @@ declare function readManualInputFile(value: ManualInputFileValue, options?: {
|
|
|
2349
2352
|
* @returns A repo-backed file reference suitable for file/media columns.
|
|
2350
2353
|
*/
|
|
2351
2354
|
declare function repoFile(path: string, mimeType?: string): RepoFileRef$1; //#endregion
|
|
2355
|
+
//#region src/cacheSerialization.d.ts
|
|
2356
|
+
declare const serializedCacheValueMarker = "__aecs";
|
|
2357
|
+
type JsonSafeCacheValueType = 'ArrayBuffer' | 'BigInt' | 'Blob' | 'Date' | 'Error' | 'ExternalJson' | 'File' | 'Float64Array' | 'Headers' | 'Map' | 'Number' | 'Object' | 'RegExp' | 'Set' | 'URL' | 'URLSearchParams' | 'Undefined';
|
|
2358
|
+
type JsonSafeSerializedCacheValue = {
|
|
2359
|
+
[serializedCacheValueMarker]: `v1:${JsonSafeCacheValueType}`;
|
|
2360
|
+
compressedLength?: number;
|
|
2361
|
+
hash?: string;
|
|
2362
|
+
length?: number;
|
|
2363
|
+
path?: string;
|
|
2364
|
+
value?: unknown;
|
|
2365
|
+
};
|
|
2366
|
+
/** JSON-safe persisted representation for one rich cached value. */
|
|
2367
|
+
type SerializedCacheValue = JsonSafeSerializedCacheValue;
|
|
2368
|
+
/** Metadata for a Brotli-compressed external JSON blob. */
|
|
2369
|
+
type ExternalJsonBlobRef = {
|
|
2370
|
+
/** Original UTF-8 JSON byte length. */length: number; /** Brotli-compressed byte length. */
|
|
2371
|
+
compressedLength: number; /** SHA-256 digest of the original UTF-8 JSON payload. */
|
|
2372
|
+
hash: `sha256:${string}`; /** Store-relative Brotli blob path. */
|
|
2373
|
+
path: string;
|
|
2374
|
+
};
|
|
2375
|
+
/** Store used by cache serialization for large nested JSON values. */
|
|
2376
|
+
type CacheSerializationExternalJsonStore = {
|
|
2377
|
+
/** Persist canonical JSON and return its content-addressed ref. */write(rawJson: string): Promise<ExternalJsonBlobRef>; /** Read a previously persisted canonical JSON payload. */
|
|
2378
|
+
read(ref: ExternalJsonBlobRef): Promise<string>;
|
|
2379
|
+
};
|
|
2380
|
+
/** Options controlling how rich cache values are persisted as JSON-safe data. */
|
|
2381
|
+
type CacheSerializationOptions = {
|
|
2382
|
+
/** Preserve JavaScript `undefined` values with explicit tagged wrappers. */preserveUndefined?: boolean; /** Externalize large nested JSON values through Brotli blob refs. */
|
|
2383
|
+
compress?: boolean; /** Store used for large nested JSON values when `compress` is enabled. */
|
|
2384
|
+
externalJsonStore?: CacheSerializationExternalJsonStore;
|
|
2385
|
+
};
|
|
2386
|
+
/**
|
|
2387
|
+
* Serialize one cached value while keeping plain JSON as plain JSON.
|
|
2388
|
+
*
|
|
2389
|
+
* Rich runtime values use small tagged wrappers. Undefined values are omitted
|
|
2390
|
+
* by default; pass `preserveUndefined: true` to round-trip them explicitly.
|
|
2391
|
+
*/
|
|
2392
|
+
declare function serializeCacheValue(value: unknown, options?: CacheSerializationOptions | undefined): Promise<unknown>;
|
|
2393
|
+
/** Revive one cached value, while preserving legacy JSON-round-tripped data. */
|
|
2394
|
+
declare function deserializeCacheValue(value: unknown): unknown;
|
|
2395
|
+
/** Replace external JSON blob refs with their parsed serialized payloads. */
|
|
2396
|
+
/**
|
|
2397
|
+
* Serialize all rich values captured in a cache recording before persistence.
|
|
2398
|
+
*
|
|
2399
|
+
* Undefined values are omitted by default; pass `preserveUndefined: true` to
|
|
2400
|
+
* retain the legacy explicit undefined wrappers in the recording payload.
|
|
2401
|
+
*/
|
|
2402
|
+
declare function serializeCacheRecording(recording: CacheRecording$1, options?: CacheSerializationOptions | undefined): Promise<CacheRecording$1>;
|
|
2403
|
+
/** Revive all rich values captured in a cache recording after lookup. */
|
|
2404
|
+
declare function deserializeCacheRecording(recording: CacheRecording$1): CacheRecording$1; //#endregion
|
|
2352
2405
|
//#region src/runtime.d.ts
|
|
2353
2406
|
declare global {
|
|
2354
2407
|
var __agentEvalsRealDate: DateConstructor | undefined;
|
|
@@ -2372,7 +2425,8 @@ type CacheDebugKeyWrite = {
|
|
|
2372
2425
|
* starts executing.
|
|
2373
2426
|
*/
|
|
2374
2427
|
type CacheAdapter = {
|
|
2375
|
-
/** Return the stored entry for `keyHash` under `namespace`, or `null`. */lookup(namespace: string, keyHash: string): Promise<CacheEntry$1 | null>;
|
|
2428
|
+
/** Return the stored entry for `keyHash` under `namespace`, or `null`. */lookup(namespace: string, keyHash: string): Promise<CacheEntry$1 | null>; /** Optional store for large nested JSON values persisted outside cache JSON. */
|
|
2429
|
+
externalJsonStore?: CacheSerializationExternalJsonStore;
|
|
2376
2430
|
/**
|
|
2377
2431
|
* Persist a cache entry. Must be safe under concurrent calls.
|
|
2378
2432
|
*
|
|
@@ -2604,54 +2658,6 @@ declare function incrementEvalOutput(key: string, delta: number): void;
|
|
|
2604
2658
|
* call.
|
|
2605
2659
|
*/
|
|
2606
2660
|
declare function evalAssert(condition: unknown, message: string): asserts condition; //#endregion
|
|
2607
|
-
//#region src/cacheSerialization.d.ts
|
|
2608
|
-
declare const serializedCacheValueMarker = "__aecs";
|
|
2609
|
-
declare const jsonSafeCacheValueVersion = "json-safe-v1";
|
|
2610
|
-
type JsonSafeCacheValueType = 'ArrayBuffer' | 'BigInt' | 'Blob' | 'CompressedJson' | 'CompressedString' | 'Date' | 'Error' | 'File' | 'Float64Array' | 'Headers' | 'Map' | 'Number' | 'Object' | 'RegExp' | 'Set' | 'URL' | 'URLSearchParams' | 'Undefined';
|
|
2611
|
-
type JsonSafeSerializedCacheValue = {
|
|
2612
|
-
[serializedCacheValueMarker]: typeof jsonSafeCacheValueVersion;
|
|
2613
|
-
codec?: 'gzip';
|
|
2614
|
-
length?: number;
|
|
2615
|
-
type: JsonSafeCacheValueType;
|
|
2616
|
-
value?: unknown;
|
|
2617
|
-
};
|
|
2618
|
-
/** JSON-safe persisted representation for one rich cached value. */
|
|
2619
|
-
type SerializedCacheValue = JsonSafeSerializedCacheValue;
|
|
2620
|
-
/** Options controlling how rich cache values are persisted as JSON-safe data. */
|
|
2621
|
-
type CacheSerializationOptions = {
|
|
2622
|
-
/**
|
|
2623
|
-
* Preserve JavaScript `undefined` values with explicit tagged wrappers.
|
|
2624
|
-
*
|
|
2625
|
-
* Disabled by default so undefined object fields, array items, map entries,
|
|
2626
|
-
* and set items are omitted instead of being written to cache files.
|
|
2627
|
-
*/
|
|
2628
|
-
preserveUndefined?: boolean;
|
|
2629
|
-
/**
|
|
2630
|
-
* Compress large nested strings/JSON blobs with gzip wrappers.
|
|
2631
|
-
*
|
|
2632
|
-
* Enabled by default for reusable cache files. Disable for output artifacts
|
|
2633
|
-
* that need synchronous browser-side deserialization.
|
|
2634
|
-
*/
|
|
2635
|
-
compress?: boolean;
|
|
2636
|
-
};
|
|
2637
|
-
/**
|
|
2638
|
-
* Serialize one cached value while keeping plain JSON as plain JSON.
|
|
2639
|
-
*
|
|
2640
|
-
* Rich runtime values use small tagged wrappers. Undefined values are omitted
|
|
2641
|
-
* by default; pass `preserveUndefined: true` to round-trip them explicitly.
|
|
2642
|
-
*/
|
|
2643
|
-
declare function serializeCacheValue(value: unknown, options?: CacheSerializationOptions | undefined): Promise<unknown>;
|
|
2644
|
-
/** Revive one cached value, while preserving legacy JSON-round-tripped data. */
|
|
2645
|
-
declare function deserializeCacheValue(value: unknown): unknown;
|
|
2646
|
-
/**
|
|
2647
|
-
* Serialize all rich values captured in a cache recording before persistence.
|
|
2648
|
-
*
|
|
2649
|
-
* Undefined values are omitted by default; pass `preserveUndefined: true` to
|
|
2650
|
-
* retain the legacy explicit undefined wrappers in the recording payload.
|
|
2651
|
-
*/
|
|
2652
|
-
declare function serializeCacheRecording(recording: CacheRecording$1, options?: CacheSerializationOptions | undefined): Promise<CacheRecording$1>;
|
|
2653
|
-
/** Revive all rich values captured in a cache recording after lookup. */
|
|
2654
|
-
declare function deserializeCacheRecording(recording: CacheRecording$1): CacheRecording$1; //#endregion
|
|
2655
2661
|
//#region src/valueCache.d.ts
|
|
2656
2662
|
/** Info accepted by `evalTracer.cache(info, fn)` for spanless value caching. */
|
|
2657
2663
|
type TraceCacheInfo = {
|
|
@@ -2916,12 +2922,12 @@ declare const columnFormatSchema: z$1.ZodEnum<{
|
|
|
2916
2922
|
number: "number";
|
|
2917
2923
|
boolean: "boolean";
|
|
2918
2924
|
file: "file";
|
|
2919
|
-
duration: "duration";
|
|
2920
2925
|
markdown: "markdown";
|
|
2921
2926
|
json: "json";
|
|
2922
2927
|
image: "image";
|
|
2923
2928
|
audio: "audio";
|
|
2924
2929
|
video: "video";
|
|
2930
|
+
duration: "duration";
|
|
2925
2931
|
percent: "percent";
|
|
2926
2932
|
passFail: "passFail";
|
|
2927
2933
|
stars: "stars";
|
|
@@ -2941,12 +2947,12 @@ declare const columnDefSchema: z$1.ZodObject<{
|
|
|
2941
2947
|
number: "number";
|
|
2942
2948
|
boolean: "boolean";
|
|
2943
2949
|
file: "file";
|
|
2944
|
-
duration: "duration";
|
|
2945
2950
|
markdown: "markdown";
|
|
2946
2951
|
json: "json";
|
|
2947
2952
|
image: "image";
|
|
2948
2953
|
audio: "audio";
|
|
2949
2954
|
video: "video";
|
|
2955
|
+
duration: "duration";
|
|
2950
2956
|
percent: "percent";
|
|
2951
2957
|
passFail: "passFail";
|
|
2952
2958
|
stars: "stars";
|
|
@@ -2991,8 +2997,8 @@ declare const traceSpanKindSchema: z$1.ZodString;
|
|
|
2991
2997
|
declare const traceAttributeDisplayFormatSchema: z$1.ZodEnum<{
|
|
2992
2998
|
string: "string";
|
|
2993
2999
|
number: "number";
|
|
2994
|
-
duration: "duration";
|
|
2995
3000
|
json: "json";
|
|
3001
|
+
duration: "duration";
|
|
2996
3002
|
}>;
|
|
2997
3003
|
/**
|
|
2998
3004
|
* Formatting hint for trace attribute values rendered by the UI.
|
|
@@ -3016,8 +3022,8 @@ declare const traceAttributeDisplaySchema: z$1.ZodObject<{
|
|
|
3016
3022
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3017
3023
|
string: "string";
|
|
3018
3024
|
number: "number";
|
|
3019
|
-
duration: "duration";
|
|
3020
3025
|
json: "json";
|
|
3026
|
+
duration: "duration";
|
|
3021
3027
|
}>>;
|
|
3022
3028
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3023
3029
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3030,9 +3036,9 @@ declare const traceAttributeDisplaySchema: z$1.ZodObject<{
|
|
|
3030
3036
|
subtree: "subtree";
|
|
3031
3037
|
}>>;
|
|
3032
3038
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3033
|
-
sum: "sum";
|
|
3034
|
-
last: "last";
|
|
3035
3039
|
all: "all";
|
|
3040
|
+
last: "last";
|
|
3041
|
+
sum: "sum";
|
|
3036
3042
|
}>>;
|
|
3037
3043
|
}, z$1.core.$strip>;
|
|
3038
3044
|
/**
|
|
@@ -3052,8 +3058,8 @@ declare const traceDisplayConfigSchema: z$1.ZodObject<{
|
|
|
3052
3058
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3053
3059
|
string: "string";
|
|
3054
3060
|
number: "number";
|
|
3055
|
-
duration: "duration";
|
|
3056
3061
|
json: "json";
|
|
3062
|
+
duration: "duration";
|
|
3057
3063
|
}>>;
|
|
3058
3064
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3059
3065
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3066,9 +3072,9 @@ declare const traceDisplayConfigSchema: z$1.ZodObject<{
|
|
|
3066
3072
|
subtree: "subtree";
|
|
3067
3073
|
}>>;
|
|
3068
3074
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3069
|
-
sum: "sum";
|
|
3070
|
-
last: "last";
|
|
3071
3075
|
all: "all";
|
|
3076
|
+
last: "last";
|
|
3077
|
+
sum: "sum";
|
|
3072
3078
|
}>>;
|
|
3073
3079
|
}, z$1.core.$strip>>>;
|
|
3074
3080
|
}, z$1.core.$strip>;
|
|
@@ -3092,8 +3098,8 @@ declare const traceAttributeDisplayInputSchema: z$1.ZodObject<{
|
|
|
3092
3098
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3093
3099
|
string: "string";
|
|
3094
3100
|
number: "number";
|
|
3095
|
-
duration: "duration";
|
|
3096
3101
|
json: "json";
|
|
3102
|
+
duration: "duration";
|
|
3097
3103
|
}>>;
|
|
3098
3104
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3099
3105
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3106,9 +3112,9 @@ declare const traceAttributeDisplayInputSchema: z$1.ZodObject<{
|
|
|
3106
3112
|
subtree: "subtree";
|
|
3107
3113
|
}>>;
|
|
3108
3114
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3109
|
-
sum: "sum";
|
|
3110
|
-
last: "last";
|
|
3111
3115
|
all: "all";
|
|
3116
|
+
last: "last";
|
|
3117
|
+
sum: "sum";
|
|
3112
3118
|
}>>;
|
|
3113
3119
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3114
3120
|
}, z$1.core.$strip>;
|
|
@@ -3130,8 +3136,8 @@ declare const traceDisplayInputConfigSchema: z$1.ZodObject<{
|
|
|
3130
3136
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3131
3137
|
string: "string";
|
|
3132
3138
|
number: "number";
|
|
3133
|
-
duration: "duration";
|
|
3134
3139
|
json: "json";
|
|
3140
|
+
duration: "duration";
|
|
3135
3141
|
}>>;
|
|
3136
3142
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3137
3143
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3144,9 +3150,9 @@ declare const traceDisplayInputConfigSchema: z$1.ZodObject<{
|
|
|
3144
3150
|
subtree: "subtree";
|
|
3145
3151
|
}>>;
|
|
3146
3152
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3147
|
-
sum: "sum";
|
|
3148
|
-
last: "last";
|
|
3149
3153
|
all: "all";
|
|
3154
|
+
last: "last";
|
|
3155
|
+
sum: "sum";
|
|
3150
3156
|
}>>;
|
|
3151
3157
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3152
3158
|
}, z$1.core.$strip>>>;
|
|
@@ -3225,11 +3231,11 @@ declare const evalFreshnessStatusSchema: z$1.ZodEnum<{
|
|
|
3225
3231
|
type EvalFreshnessStatus = z$1.infer<typeof evalFreshnessStatusSchema>;
|
|
3226
3232
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3227
3233
|
declare const evalStatAggregateSchema: z$1.ZodEnum<{
|
|
3234
|
+
last: "last";
|
|
3235
|
+
sum: "sum";
|
|
3228
3236
|
avg: "avg";
|
|
3229
3237
|
min: "min";
|
|
3230
3238
|
max: "max";
|
|
3231
|
-
sum: "sum";
|
|
3232
|
-
last: "last";
|
|
3233
3239
|
}>;
|
|
3234
3240
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3235
3241
|
type EvalStatAggregate = z$1.infer<typeof evalStatAggregateSchema>;
|
|
@@ -3253,22 +3259,22 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
3253
3259
|
key: z$1.ZodString;
|
|
3254
3260
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3255
3261
|
aggregate: z$1.ZodEnum<{
|
|
3262
|
+
last: "last";
|
|
3263
|
+
sum: "sum";
|
|
3256
3264
|
avg: "avg";
|
|
3257
3265
|
min: "min";
|
|
3258
3266
|
max: "max";
|
|
3259
|
-
sum: "sum";
|
|
3260
|
-
last: "last";
|
|
3261
3267
|
}>;
|
|
3262
3268
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3263
3269
|
number: "number";
|
|
3264
3270
|
boolean: "boolean";
|
|
3265
3271
|
file: "file";
|
|
3266
|
-
duration: "duration";
|
|
3267
3272
|
markdown: "markdown";
|
|
3268
3273
|
json: "json";
|
|
3269
3274
|
image: "image";
|
|
3270
3275
|
audio: "audio";
|
|
3271
3276
|
video: "video";
|
|
3277
|
+
duration: "duration";
|
|
3272
3278
|
percent: "percent";
|
|
3273
3279
|
passFail: "passFail";
|
|
3274
3280
|
stars: "stars";
|
|
@@ -3295,22 +3301,22 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
|
|
|
3295
3301
|
key: z$1.ZodString;
|
|
3296
3302
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3297
3303
|
aggregate: z$1.ZodEnum<{
|
|
3304
|
+
last: "last";
|
|
3305
|
+
sum: "sum";
|
|
3298
3306
|
avg: "avg";
|
|
3299
3307
|
min: "min";
|
|
3300
3308
|
max: "max";
|
|
3301
|
-
sum: "sum";
|
|
3302
|
-
last: "last";
|
|
3303
3309
|
}>;
|
|
3304
3310
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3305
3311
|
number: "number";
|
|
3306
3312
|
boolean: "boolean";
|
|
3307
3313
|
file: "file";
|
|
3308
|
-
duration: "duration";
|
|
3309
3314
|
markdown: "markdown";
|
|
3310
3315
|
json: "json";
|
|
3311
3316
|
image: "image";
|
|
3312
3317
|
audio: "audio";
|
|
3313
3318
|
video: "video";
|
|
3319
|
+
duration: "duration";
|
|
3314
3320
|
percent: "percent";
|
|
3315
3321
|
passFail: "passFail";
|
|
3316
3322
|
stars: "stars";
|
|
@@ -3348,12 +3354,12 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3348
3354
|
number: "number";
|
|
3349
3355
|
boolean: "boolean";
|
|
3350
3356
|
file: "file";
|
|
3351
|
-
duration: "duration";
|
|
3352
3357
|
markdown: "markdown";
|
|
3353
3358
|
json: "json";
|
|
3354
3359
|
image: "image";
|
|
3355
3360
|
audio: "audio";
|
|
3356
3361
|
video: "video";
|
|
3362
|
+
duration: "duration";
|
|
3357
3363
|
percent: "percent";
|
|
3358
3364
|
passFail: "passFail";
|
|
3359
3365
|
stars: "stars";
|
|
@@ -3372,12 +3378,13 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3372
3378
|
}>>;
|
|
3373
3379
|
}, z$1.core.$strip>>;
|
|
3374
3380
|
caseCount: z$1.ZodNullable<z$1.ZodNumber>;
|
|
3381
|
+
caseIds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
3375
3382
|
lastRunStatus: z$1.ZodNullable<z$1.ZodEnum<{
|
|
3376
3383
|
error: "error";
|
|
3377
|
-
pass: "pass";
|
|
3378
|
-
fail: "fail";
|
|
3379
3384
|
running: "running";
|
|
3380
3385
|
cancelled: "cancelled";
|
|
3386
|
+
pass: "pass";
|
|
3387
|
+
fail: "fail";
|
|
3381
3388
|
unscored: "unscored";
|
|
3382
3389
|
}>>;
|
|
3383
3390
|
stats: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
@@ -3396,22 +3403,22 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3396
3403
|
key: z$1.ZodString;
|
|
3397
3404
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3398
3405
|
aggregate: z$1.ZodEnum<{
|
|
3406
|
+
last: "last";
|
|
3407
|
+
sum: "sum";
|
|
3399
3408
|
avg: "avg";
|
|
3400
3409
|
min: "min";
|
|
3401
3410
|
max: "max";
|
|
3402
|
-
sum: "sum";
|
|
3403
|
-
last: "last";
|
|
3404
3411
|
}>;
|
|
3405
3412
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3406
3413
|
number: "number";
|
|
3407
3414
|
boolean: "boolean";
|
|
3408
3415
|
file: "file";
|
|
3409
|
-
duration: "duration";
|
|
3410
3416
|
markdown: "markdown";
|
|
3411
3417
|
json: "json";
|
|
3412
3418
|
image: "image";
|
|
3413
3419
|
audio: "audio";
|
|
3414
3420
|
video: "video";
|
|
3421
|
+
duration: "duration";
|
|
3415
3422
|
percent: "percent";
|
|
3416
3423
|
passFail: "passFail";
|
|
3417
3424
|
stars: "stars";
|
|
@@ -3437,10 +3444,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3437
3444
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3438
3445
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3439
3446
|
success: "success";
|
|
3440
|
-
accent: "accent";
|
|
3441
3447
|
error: "error";
|
|
3442
|
-
accentDim: "accentDim";
|
|
3443
3448
|
warning: "warning";
|
|
3449
|
+
accent: "accent";
|
|
3450
|
+
accentDim: "accentDim";
|
|
3444
3451
|
textMuted: "textMuted";
|
|
3445
3452
|
}>>;
|
|
3446
3453
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3451,20 +3458,20 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3451
3458
|
source: z$1.ZodLiteral<"column">;
|
|
3452
3459
|
key: z$1.ZodString;
|
|
3453
3460
|
aggregate: z$1.ZodEnum<{
|
|
3461
|
+
sum: "sum";
|
|
3454
3462
|
avg: "avg";
|
|
3455
3463
|
min: "min";
|
|
3456
3464
|
max: "max";
|
|
3457
|
-
sum: "sum";
|
|
3458
3465
|
latest: "latest";
|
|
3459
3466
|
passThresholdRate: "passThresholdRate";
|
|
3460
3467
|
}>;
|
|
3461
3468
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3462
3469
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3463
3470
|
success: "success";
|
|
3464
|
-
accent: "accent";
|
|
3465
3471
|
error: "error";
|
|
3466
|
-
accentDim: "accentDim";
|
|
3467
3472
|
warning: "warning";
|
|
3473
|
+
accent: "accent";
|
|
3474
|
+
accentDim: "accentDim";
|
|
3468
3475
|
textMuted: "textMuted";
|
|
3469
3476
|
}>>;
|
|
3470
3477
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3493,10 +3500,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3493
3500
|
source: z$1.ZodLiteral<"column">;
|
|
3494
3501
|
key: z$1.ZodString;
|
|
3495
3502
|
aggregate: z$1.ZodEnum<{
|
|
3503
|
+
sum: "sum";
|
|
3496
3504
|
avg: "avg";
|
|
3497
3505
|
min: "min";
|
|
3498
3506
|
max: "max";
|
|
3499
|
-
sum: "sum";
|
|
3500
3507
|
latest: "latest";
|
|
3501
3508
|
passThresholdRate: "passThresholdRate";
|
|
3502
3509
|
}>;
|
|
@@ -3592,11 +3599,11 @@ declare const caseRowSchema: z$1.ZodObject<{
|
|
|
3592
3599
|
evalId: z$1.ZodString;
|
|
3593
3600
|
status: z$1.ZodEnum<{
|
|
3594
3601
|
error: "error";
|
|
3595
|
-
|
|
3596
|
-
fail: "fail";
|
|
3602
|
+
pending: "pending";
|
|
3597
3603
|
running: "running";
|
|
3598
3604
|
cancelled: "cancelled";
|
|
3599
|
-
pending: "pending";
|
|
3605
|
+
pass: "pass";
|
|
3606
|
+
fail: "fail";
|
|
3600
3607
|
}>;
|
|
3601
3608
|
durationMs: z$1.ZodNullable<z$1.ZodNumber>;
|
|
3602
3609
|
costUsd: z$1.ZodOptional<z$1.ZodNullable<z$1.ZodNumber>>;
|
|
@@ -3725,8 +3732,8 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3725
3732
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3726
3733
|
string: "string";
|
|
3727
3734
|
number: "number";
|
|
3728
|
-
duration: "duration";
|
|
3729
3735
|
json: "json";
|
|
3736
|
+
duration: "duration";
|
|
3730
3737
|
}>>;
|
|
3731
3738
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3732
3739
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3739,9 +3746,9 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3739
3746
|
subtree: "subtree";
|
|
3740
3747
|
}>>;
|
|
3741
3748
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3742
|
-
sum: "sum";
|
|
3743
|
-
last: "last";
|
|
3744
3749
|
all: "all";
|
|
3750
|
+
last: "last";
|
|
3751
|
+
sum: "sum";
|
|
3745
3752
|
}>>;
|
|
3746
3753
|
}, z$1.core.$strip>>>;
|
|
3747
3754
|
}, z$1.core.$strip>;
|
|
@@ -3756,11 +3763,11 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3756
3763
|
evalId: z$1.ZodString;
|
|
3757
3764
|
status: z$1.ZodEnum<{
|
|
3758
3765
|
error: "error";
|
|
3759
|
-
pass: "pass";
|
|
3760
|
-
fail: "fail";
|
|
3766
|
+
pending: "pending";
|
|
3761
3767
|
running: "running";
|
|
3762
3768
|
cancelled: "cancelled";
|
|
3763
|
-
pending: "pending";
|
|
3769
|
+
pass: "pass";
|
|
3770
|
+
fail: "fail";
|
|
3764
3771
|
}>;
|
|
3765
3772
|
input: z$1.ZodUnknown;
|
|
3766
3773
|
trace: z$1.ZodArray<z$1.ZodObject<{
|
|
@@ -3811,8 +3818,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3811
3818
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3812
3819
|
string: "string";
|
|
3813
3820
|
number: "number";
|
|
3814
|
-
duration: "duration";
|
|
3815
3821
|
json: "json";
|
|
3822
|
+
duration: "duration";
|
|
3816
3823
|
}>>;
|
|
3817
3824
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3818
3825
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3825,9 +3832,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3825
3832
|
subtree: "subtree";
|
|
3826
3833
|
}>>;
|
|
3827
3834
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3828
|
-
sum: "sum";
|
|
3829
|
-
last: "last";
|
|
3830
3835
|
all: "all";
|
|
3836
|
+
last: "last";
|
|
3837
|
+
sum: "sum";
|
|
3831
3838
|
}>>;
|
|
3832
3839
|
}, z$1.core.$strip>>>;
|
|
3833
3840
|
}, z$1.core.$strip>;
|
|
@@ -3880,8 +3887,8 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3880
3887
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3881
3888
|
string: "string";
|
|
3882
3889
|
number: "number";
|
|
3883
|
-
duration: "duration";
|
|
3884
3890
|
json: "json";
|
|
3891
|
+
duration: "duration";
|
|
3885
3892
|
}>>;
|
|
3886
3893
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
3887
3894
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -3894,9 +3901,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3894
3901
|
subtree: "subtree";
|
|
3895
3902
|
}>>;
|
|
3896
3903
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3897
|
-
sum: "sum";
|
|
3898
|
-
last: "last";
|
|
3899
3904
|
all: "all";
|
|
3905
|
+
last: "last";
|
|
3906
|
+
sum: "sum";
|
|
3900
3907
|
}>>;
|
|
3901
3908
|
}, z$1.core.$strip>>>;
|
|
3902
3909
|
}, z$1.core.$strip>;
|
|
@@ -3956,10 +3963,10 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3956
3963
|
namespace: z$1.ZodString;
|
|
3957
3964
|
key: z$1.ZodString;
|
|
3958
3965
|
status: z$1.ZodEnum<{
|
|
3966
|
+
bypass: "bypass";
|
|
3967
|
+
refresh: "refresh";
|
|
3959
3968
|
hit: "hit";
|
|
3960
3969
|
miss: "miss";
|
|
3961
|
-
refresh: "refresh";
|
|
3962
|
-
bypass: "bypass";
|
|
3963
3970
|
}>;
|
|
3964
3971
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
3965
3972
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -4030,10 +4037,10 @@ declare const evalChartBuiltinMetricSchema: z$1.ZodEnum<{
|
|
|
4030
4037
|
type EvalChartBuiltinMetric = z$1.infer<typeof evalChartBuiltinMetricSchema>;
|
|
4031
4038
|
/** Reducer applied to a numeric column across all cases of a single run. */
|
|
4032
4039
|
declare const evalChartAggregateSchema: z$1.ZodEnum<{
|
|
4040
|
+
sum: "sum";
|
|
4033
4041
|
avg: "avg";
|
|
4034
4042
|
min: "min";
|
|
4035
4043
|
max: "max";
|
|
4036
|
-
sum: "sum";
|
|
4037
4044
|
latest: "latest";
|
|
4038
4045
|
passThresholdRate: "passThresholdRate";
|
|
4039
4046
|
}>;
|
|
@@ -4045,10 +4052,10 @@ type EvalChartAggregate = z$1.infer<typeof evalChartAggregateSchema>;
|
|
|
4045
4052
|
*/
|
|
4046
4053
|
declare const evalChartColorSchema: z$1.ZodEnum<{
|
|
4047
4054
|
success: "success";
|
|
4048
|
-
accent: "accent";
|
|
4049
4055
|
error: "error";
|
|
4050
|
-
accentDim: "accentDim";
|
|
4051
4056
|
warning: "warning";
|
|
4057
|
+
accent: "accent";
|
|
4058
|
+
accentDim: "accentDim";
|
|
4052
4059
|
textMuted: "textMuted";
|
|
4053
4060
|
}>;
|
|
4054
4061
|
/** Semantic color token resolved to a theme color by the web UI. */
|
|
@@ -4074,10 +4081,10 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4074
4081
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4075
4082
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4076
4083
|
success: "success";
|
|
4077
|
-
accent: "accent";
|
|
4078
4084
|
error: "error";
|
|
4079
|
-
accentDim: "accentDim";
|
|
4080
4085
|
warning: "warning";
|
|
4086
|
+
accent: "accent";
|
|
4087
|
+
accentDim: "accentDim";
|
|
4081
4088
|
textMuted: "textMuted";
|
|
4082
4089
|
}>>;
|
|
4083
4090
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4088,20 +4095,20 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4088
4095
|
source: z$1.ZodLiteral<"column">;
|
|
4089
4096
|
key: z$1.ZodString;
|
|
4090
4097
|
aggregate: z$1.ZodEnum<{
|
|
4098
|
+
sum: "sum";
|
|
4091
4099
|
avg: "avg";
|
|
4092
4100
|
min: "min";
|
|
4093
4101
|
max: "max";
|
|
4094
|
-
sum: "sum";
|
|
4095
4102
|
latest: "latest";
|
|
4096
4103
|
passThresholdRate: "passThresholdRate";
|
|
4097
4104
|
}>;
|
|
4098
4105
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4099
4106
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4100
4107
|
success: "success";
|
|
4101
|
-
accent: "accent";
|
|
4102
4108
|
error: "error";
|
|
4103
|
-
accentDim: "accentDim";
|
|
4104
4109
|
warning: "warning";
|
|
4110
|
+
accent: "accent";
|
|
4111
|
+
accentDim: "accentDim";
|
|
4105
4112
|
textMuted: "textMuted";
|
|
4106
4113
|
}>>;
|
|
4107
4114
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4123,10 +4130,10 @@ declare const evalChartTooltipExtraSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObj
|
|
|
4123
4130
|
source: z$1.ZodLiteral<"column">;
|
|
4124
4131
|
key: z$1.ZodString;
|
|
4125
4132
|
aggregate: z$1.ZodEnum<{
|
|
4133
|
+
sum: "sum";
|
|
4126
4134
|
avg: "avg";
|
|
4127
4135
|
min: "min";
|
|
4128
4136
|
max: "max";
|
|
4129
|
-
sum: "sum";
|
|
4130
4137
|
latest: "latest";
|
|
4131
4138
|
passThresholdRate: "passThresholdRate";
|
|
4132
4139
|
}>;
|
|
@@ -4157,10 +4164,10 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4157
4164
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4158
4165
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4159
4166
|
success: "success";
|
|
4160
|
-
accent: "accent";
|
|
4161
4167
|
error: "error";
|
|
4162
|
-
accentDim: "accentDim";
|
|
4163
4168
|
warning: "warning";
|
|
4169
|
+
accent: "accent";
|
|
4170
|
+
accentDim: "accentDim";
|
|
4164
4171
|
textMuted: "textMuted";
|
|
4165
4172
|
}>>;
|
|
4166
4173
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4171,20 +4178,20 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4171
4178
|
source: z$1.ZodLiteral<"column">;
|
|
4172
4179
|
key: z$1.ZodString;
|
|
4173
4180
|
aggregate: z$1.ZodEnum<{
|
|
4181
|
+
sum: "sum";
|
|
4174
4182
|
avg: "avg";
|
|
4175
4183
|
min: "min";
|
|
4176
4184
|
max: "max";
|
|
4177
|
-
sum: "sum";
|
|
4178
4185
|
latest: "latest";
|
|
4179
4186
|
passThresholdRate: "passThresholdRate";
|
|
4180
4187
|
}>;
|
|
4181
4188
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4182
4189
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4183
4190
|
success: "success";
|
|
4184
|
-
accent: "accent";
|
|
4185
4191
|
error: "error";
|
|
4186
|
-
accentDim: "accentDim";
|
|
4187
4192
|
warning: "warning";
|
|
4193
|
+
accent: "accent";
|
|
4194
|
+
accentDim: "accentDim";
|
|
4188
4195
|
textMuted: "textMuted";
|
|
4189
4196
|
}>>;
|
|
4190
4197
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4213,10 +4220,10 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4213
4220
|
source: z$1.ZodLiteral<"column">;
|
|
4214
4221
|
key: z$1.ZodString;
|
|
4215
4222
|
aggregate: z$1.ZodEnum<{
|
|
4223
|
+
sum: "sum";
|
|
4216
4224
|
avg: "avg";
|
|
4217
4225
|
min: "min";
|
|
4218
4226
|
max: "max";
|
|
4219
|
-
sum: "sum";
|
|
4220
4227
|
latest: "latest";
|
|
4221
4228
|
passThresholdRate: "passThresholdRate";
|
|
4222
4229
|
}>;
|
|
@@ -4247,10 +4254,10 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4247
4254
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4248
4255
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4249
4256
|
success: "success";
|
|
4250
|
-
accent: "accent";
|
|
4251
4257
|
error: "error";
|
|
4252
|
-
accentDim: "accentDim";
|
|
4253
4258
|
warning: "warning";
|
|
4259
|
+
accent: "accent";
|
|
4260
|
+
accentDim: "accentDim";
|
|
4254
4261
|
textMuted: "textMuted";
|
|
4255
4262
|
}>>;
|
|
4256
4263
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4261,20 +4268,20 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4261
4268
|
source: z$1.ZodLiteral<"column">;
|
|
4262
4269
|
key: z$1.ZodString;
|
|
4263
4270
|
aggregate: z$1.ZodEnum<{
|
|
4271
|
+
sum: "sum";
|
|
4264
4272
|
avg: "avg";
|
|
4265
4273
|
min: "min";
|
|
4266
4274
|
max: "max";
|
|
4267
|
-
sum: "sum";
|
|
4268
4275
|
latest: "latest";
|
|
4269
4276
|
passThresholdRate: "passThresholdRate";
|
|
4270
4277
|
}>;
|
|
4271
4278
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
4272
4279
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4273
4280
|
success: "success";
|
|
4274
|
-
accent: "accent";
|
|
4275
4281
|
error: "error";
|
|
4276
|
-
accentDim: "accentDim";
|
|
4277
4282
|
warning: "warning";
|
|
4283
|
+
accent: "accent";
|
|
4284
|
+
accentDim: "accentDim";
|
|
4278
4285
|
textMuted: "textMuted";
|
|
4279
4286
|
}>>;
|
|
4280
4287
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4303,10 +4310,10 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4303
4310
|
source: z$1.ZodLiteral<"column">;
|
|
4304
4311
|
key: z$1.ZodString;
|
|
4305
4312
|
aggregate: z$1.ZodEnum<{
|
|
4313
|
+
sum: "sum";
|
|
4306
4314
|
avg: "avg";
|
|
4307
4315
|
min: "min";
|
|
4308
4316
|
max: "max";
|
|
4309
|
-
sum: "sum";
|
|
4310
4317
|
latest: "latest";
|
|
4311
4318
|
passThresholdRate: "passThresholdRate";
|
|
4312
4319
|
}>;
|
|
@@ -4322,11 +4329,12 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4322
4329
|
shortId: z$1.ZodString;
|
|
4323
4330
|
status: z$1.ZodEnum<{
|
|
4324
4331
|
error: "error";
|
|
4325
|
-
running: "running";
|
|
4326
|
-
cancelled: "cancelled";
|
|
4327
4332
|
pending: "pending";
|
|
4333
|
+
running: "running";
|
|
4328
4334
|
completed: "completed";
|
|
4335
|
+
cancelled: "cancelled";
|
|
4329
4336
|
}>;
|
|
4337
|
+
temporary: z$1.ZodDefault<z$1.ZodOptional<z$1.ZodBoolean>>;
|
|
4330
4338
|
startedAt: z$1.ZodString;
|
|
4331
4339
|
endedAt: z$1.ZodNullable<z$1.ZodString>;
|
|
4332
4340
|
commitSha: z$1.ZodDefault<z$1.ZodOptional<z$1.ZodNullable<z$1.ZodString>>>;
|
|
@@ -4348,9 +4356,9 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4348
4356
|
median: "median";
|
|
4349
4357
|
}>>>;
|
|
4350
4358
|
cacheMode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4351
|
-
refresh: "refresh";
|
|
4352
|
-
bypass: "bypass";
|
|
4353
4359
|
use: "use";
|
|
4360
|
+
bypass: "bypass";
|
|
4361
|
+
refresh: "refresh";
|
|
4354
4362
|
}>>;
|
|
4355
4363
|
}, z$1.core.$strip>;
|
|
4356
4364
|
/** Persisted lifecycle metadata for a single eval run. */
|
|
@@ -4360,10 +4368,10 @@ declare const runSummarySchema: z$1.ZodObject<{
|
|
|
4360
4368
|
runId: z$1.ZodString;
|
|
4361
4369
|
status: z$1.ZodEnum<{
|
|
4362
4370
|
error: "error";
|
|
4363
|
-
running: "running";
|
|
4364
|
-
cancelled: "cancelled";
|
|
4365
4371
|
pending: "pending";
|
|
4372
|
+
running: "running";
|
|
4366
4373
|
completed: "completed";
|
|
4374
|
+
cancelled: "cancelled";
|
|
4367
4375
|
}>;
|
|
4368
4376
|
totalCases: z$1.ZodNumber;
|
|
4369
4377
|
passedCases: z$1.ZodNumber;
|
|
@@ -4581,8 +4589,8 @@ declare const llmCallMetricFormatSchema: z$1.ZodEnum<{
|
|
|
4581
4589
|
string: "string";
|
|
4582
4590
|
number: "number";
|
|
4583
4591
|
boolean: "boolean";
|
|
4584
|
-
duration: "duration";
|
|
4585
4592
|
json: "json";
|
|
4593
|
+
duration: "duration";
|
|
4586
4594
|
}>;
|
|
4587
4595
|
/** Render format applied to an LLM-call metric value. */
|
|
4588
4596
|
type LlmCallMetricFormat = z$1.infer<typeof llmCallMetricFormatSchema>;
|
|
@@ -4591,8 +4599,8 @@ declare const apiCallMetricFormatSchema: z$1.ZodEnum<{
|
|
|
4591
4599
|
string: "string";
|
|
4592
4600
|
number: "number";
|
|
4593
4601
|
boolean: "boolean";
|
|
4594
|
-
duration: "duration";
|
|
4595
4602
|
json: "json";
|
|
4603
|
+
duration: "duration";
|
|
4596
4604
|
}>;
|
|
4597
4605
|
/** Render format applied to an API-call metric value. */
|
|
4598
4606
|
type ApiCallMetricFormat = z$1.infer<typeof apiCallMetricFormatSchema>;
|
|
@@ -4661,8 +4669,8 @@ declare const llmCallMetricSchema: z$1.ZodObject<{
|
|
|
4661
4669
|
string: "string";
|
|
4662
4670
|
number: "number";
|
|
4663
4671
|
boolean: "boolean";
|
|
4664
|
-
duration: "duration";
|
|
4665
4672
|
json: "json";
|
|
4673
|
+
duration: "duration";
|
|
4666
4674
|
}>>;
|
|
4667
4675
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4668
4676
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4690,8 +4698,8 @@ declare const apiCallMetricSchema: z$1.ZodObject<{
|
|
|
4690
4698
|
string: "string";
|
|
4691
4699
|
number: "number";
|
|
4692
4700
|
boolean: "boolean";
|
|
4693
|
-
duration: "duration";
|
|
4694
4701
|
json: "json";
|
|
4702
|
+
duration: "duration";
|
|
4695
4703
|
}>>;
|
|
4696
4704
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4697
4705
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4804,8 +4812,8 @@ declare const llmCallsConfigSchema: z$1.ZodObject<{
|
|
|
4804
4812
|
string: "string";
|
|
4805
4813
|
number: "number";
|
|
4806
4814
|
boolean: "boolean";
|
|
4807
|
-
duration: "duration";
|
|
4808
4815
|
json: "json";
|
|
4816
|
+
duration: "duration";
|
|
4809
4817
|
}>>;
|
|
4810
4818
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4811
4819
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -4840,8 +4848,8 @@ declare const apiCallsConfigSchema: z$1.ZodObject<{
|
|
|
4840
4848
|
string: "string";
|
|
4841
4849
|
number: "number";
|
|
4842
4850
|
boolean: "boolean";
|
|
4843
|
-
duration: "duration";
|
|
4844
4851
|
json: "json";
|
|
4852
|
+
duration: "duration";
|
|
4845
4853
|
}>>;
|
|
4846
4854
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
4847
4855
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5142,8 +5150,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5142
5150
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5143
5151
|
string: "string";
|
|
5144
5152
|
number: "number";
|
|
5145
|
-
duration: "duration";
|
|
5146
5153
|
json: "json";
|
|
5154
|
+
duration: "duration";
|
|
5147
5155
|
}>>;
|
|
5148
5156
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5149
5157
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5156,9 +5164,9 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5156
5164
|
subtree: "subtree";
|
|
5157
5165
|
}>>;
|
|
5158
5166
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5159
|
-
sum: "sum";
|
|
5160
|
-
last: "last";
|
|
5161
5167
|
all: "all";
|
|
5168
|
+
last: "last";
|
|
5169
|
+
sum: "sum";
|
|
5162
5170
|
}>>;
|
|
5163
5171
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
5164
5172
|
}, z$1.core.$strip>>>;
|
|
@@ -5181,22 +5189,22 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5181
5189
|
key: z$1.ZodString;
|
|
5182
5190
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
5183
5191
|
aggregate: z$1.ZodEnum<{
|
|
5192
|
+
last: "last";
|
|
5193
|
+
sum: "sum";
|
|
5184
5194
|
avg: "avg";
|
|
5185
5195
|
min: "min";
|
|
5186
5196
|
max: "max";
|
|
5187
|
-
sum: "sum";
|
|
5188
|
-
last: "last";
|
|
5189
5197
|
}>;
|
|
5190
5198
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5191
5199
|
number: "number";
|
|
5192
5200
|
boolean: "boolean";
|
|
5193
5201
|
file: "file";
|
|
5194
|
-
duration: "duration";
|
|
5195
5202
|
markdown: "markdown";
|
|
5196
5203
|
json: "json";
|
|
5197
5204
|
image: "image";
|
|
5198
5205
|
audio: "audio";
|
|
5199
5206
|
video: "video";
|
|
5207
|
+
duration: "duration";
|
|
5200
5208
|
percent: "percent";
|
|
5201
5209
|
passFail: "passFail";
|
|
5202
5210
|
stars: "stars";
|
|
@@ -5255,8 +5263,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5255
5263
|
string: "string";
|
|
5256
5264
|
number: "number";
|
|
5257
5265
|
boolean: "boolean";
|
|
5258
|
-
duration: "duration";
|
|
5259
5266
|
json: "json";
|
|
5267
|
+
duration: "duration";
|
|
5260
5268
|
}>>;
|
|
5261
5269
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5262
5270
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5300,8 +5308,8 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5300
5308
|
string: "string";
|
|
5301
5309
|
number: "number";
|
|
5302
5310
|
boolean: "boolean";
|
|
5303
|
-
duration: "duration";
|
|
5304
5311
|
json: "json";
|
|
5312
|
+
duration: "duration";
|
|
5305
5313
|
}>>;
|
|
5306
5314
|
numberFormat: z$1.ZodOptional<z$1.ZodType<NumberDisplayOptions, unknown, z$1.core.$ZodTypeInternals<NumberDisplayOptions, unknown>>>;
|
|
5307
5315
|
placements: z$1.ZodOptional<z$1.ZodArray<z$1.ZodEnum<{
|
|
@@ -5534,9 +5542,9 @@ declare function extractApiCalls(spans: EvalTraceSpan[], config: ResolvedApiCall
|
|
|
5534
5542
|
* - `refresh`: never read, always write (forces re-execution and overwrites).
|
|
5535
5543
|
*/
|
|
5536
5544
|
declare const cacheModeSchema: z$1.ZodEnum<{
|
|
5537
|
-
refresh: "refresh";
|
|
5538
|
-
bypass: "bypass";
|
|
5539
5545
|
use: "use";
|
|
5546
|
+
bypass: "bypass";
|
|
5547
|
+
refresh: "refresh";
|
|
5540
5548
|
}>;
|
|
5541
5549
|
/** Mode controlling how cached spans behave during a run. */
|
|
5542
5550
|
type CacheMode = z$1.infer<typeof cacheModeSchema>;
|
|
@@ -5557,10 +5565,10 @@ declare const cacheOperationTypeSchema: z$1.ZodEnum<{
|
|
|
5557
5565
|
type CacheOperationType = z$1.infer<typeof cacheOperationTypeSchema>;
|
|
5558
5566
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5559
5567
|
declare const cacheStatusSchema: z$1.ZodEnum<{
|
|
5568
|
+
bypass: "bypass";
|
|
5569
|
+
refresh: "refresh";
|
|
5560
5570
|
hit: "hit";
|
|
5561
5571
|
miss: "miss";
|
|
5562
|
-
refresh: "refresh";
|
|
5563
|
-
bypass: "bypass";
|
|
5564
5572
|
}>;
|
|
5565
5573
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5566
5574
|
type CacheStatus = z$1.infer<typeof cacheStatusSchema>;
|
|
@@ -5577,10 +5585,10 @@ declare const traceCacheRefSchema: z$1.ZodObject<{
|
|
|
5577
5585
|
namespace: z$1.ZodString;
|
|
5578
5586
|
key: z$1.ZodString;
|
|
5579
5587
|
status: z$1.ZodEnum<{
|
|
5588
|
+
bypass: "bypass";
|
|
5589
|
+
refresh: "refresh";
|
|
5580
5590
|
hit: "hit";
|
|
5581
5591
|
miss: "miss";
|
|
5582
|
-
refresh: "refresh";
|
|
5583
|
-
bypass: "bypass";
|
|
5584
5592
|
}>;
|
|
5585
5593
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
5586
5594
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -6094,11 +6102,12 @@ declare const createRunRequestSchema: z$1.ZodObject<{
|
|
|
6094
6102
|
caseIds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
6095
6103
|
}, z$1.core.$strip>;
|
|
6096
6104
|
trials: z$1.ZodNumber;
|
|
6105
|
+
temporary: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
6097
6106
|
cache: z$1.ZodOptional<z$1.ZodObject<{
|
|
6098
6107
|
mode: z$1.ZodDefault<z$1.ZodEnum<{
|
|
6099
|
-
refresh: "refresh";
|
|
6100
|
-
bypass: "bypass";
|
|
6101
6108
|
use: "use";
|
|
6109
|
+
bypass: "bypass";
|
|
6110
|
+
refresh: "refresh";
|
|
6102
6111
|
}>>;
|
|
6103
6112
|
}, z$1.core.$strip>>;
|
|
6104
6113
|
manualInputs: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|