@ls-stack/agent-eval 0.37.0 → 0.38.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-C7ON9Wdh.mjs → app-DD-8kx5H.mjs} +15 -6
- package/dist/apps/web/dist/assets/index-C6PgBOfP.css +1 -0
- package/dist/apps/web/dist/assets/{index-BiwYbMem.js → index-CO86PsY-.js} +43 -43
- package/dist/apps/web/dist/index.html +2 -2
- package/dist/bin.mjs +14 -3
- package/dist/{cli-CwGcJYWe.mjs → cli-BUX6tr9J.mjs} +60 -28
- package/dist/index.d.mts +122 -119
- package/dist/index.mjs +3 -3
- package/dist/runChild.mjs +30 -1
- package/dist/{runOrchestration-C4o5TcIu.mjs → runOrchestration-BhUFWvq9.mjs} +251 -114
- package/dist/{runner-BTH8m_Er.mjs → runner-B1wfPKNH.mjs} +2 -2
- package/dist/{runner-LqeHPID6.mjs → runner-CoRf7Vef.mjs} +1 -1
- package/dist/src-BwJ5tod2.mjs +3 -0
- package/package.json +2 -2
- package/skills/agent-eval/SKILL.md +9 -5
- package/dist/apps/web/dist/assets/index-CKdoOah2.css +0 -1
- package/dist/src--13_4uDG.mjs +0 -3
package/dist/index.d.mts
CHANGED
|
@@ -2352,6 +2352,56 @@ declare function readManualInputFile(value: ManualInputFileValue, options?: {
|
|
|
2352
2352
|
* @returns A repo-backed file reference suitable for file/media columns.
|
|
2353
2353
|
*/
|
|
2354
2354
|
declare function repoFile(path: string, mimeType?: string): RepoFileRef$1; //#endregion
|
|
2355
|
+
//#region src/cacheSerialization.d.ts
|
|
2356
|
+
declare const serializedCacheValueMarker = "__aecs";
|
|
2357
|
+
type JsonSafeCacheValueType = 'ArrayBuffer' | 'BigInt' | 'Blob' | 'Date' | 'Error' | 'ExternalJson' | 'File' | 'Float64Array' | 'Headers' | 'Map' | 'Number' | 'Object' | 'RegExp' | 'Set' | 'URL' | 'URLSearchParams' | 'Undefined';
|
|
2358
|
+
type JsonSafeSerializedCacheValue = {
|
|
2359
|
+
[serializedCacheValueMarker]: `v1:${JsonSafeCacheValueType}`;
|
|
2360
|
+
compressedLength?: number;
|
|
2361
|
+
hash?: string;
|
|
2362
|
+
length?: number;
|
|
2363
|
+
path?: string;
|
|
2364
|
+
value?: unknown;
|
|
2365
|
+
};
|
|
2366
|
+
/** JSON-safe persisted representation for one rich cached value. */
|
|
2367
|
+
type SerializedCacheValue = JsonSafeSerializedCacheValue;
|
|
2368
|
+
/** Metadata for a Brotli-compressed external JSON blob. */
|
|
2369
|
+
type ExternalJsonBlobRef = {
|
|
2370
|
+
/** Original UTF-8 JSON byte length. */length: number; /** Brotli-compressed byte length. */
|
|
2371
|
+
compressedLength: number; /** SHA-256 digest of the original UTF-8 JSON payload. */
|
|
2372
|
+
hash: `sha256:${string}`; /** Store-relative Brotli blob path. */
|
|
2373
|
+
path: string;
|
|
2374
|
+
};
|
|
2375
|
+
/** Store used by cache serialization for large nested JSON values. */
|
|
2376
|
+
type CacheSerializationExternalJsonStore = {
|
|
2377
|
+
/** Persist canonical JSON and return its content-addressed ref. */write(rawJson: string): Promise<ExternalJsonBlobRef>; /** Read a previously persisted canonical JSON payload. */
|
|
2378
|
+
read(ref: ExternalJsonBlobRef): Promise<string>;
|
|
2379
|
+
};
|
|
2380
|
+
/** Options controlling how rich cache values are persisted as JSON-safe data. */
|
|
2381
|
+
type CacheSerializationOptions = {
|
|
2382
|
+
/** Preserve JavaScript `undefined` values with explicit tagged wrappers. */preserveUndefined?: boolean; /** Externalize large nested JSON values through Brotli blob refs. */
|
|
2383
|
+
compress?: boolean; /** Store used for large nested JSON values when `compress` is enabled. */
|
|
2384
|
+
externalJsonStore?: CacheSerializationExternalJsonStore;
|
|
2385
|
+
};
|
|
2386
|
+
/**
|
|
2387
|
+
* Serialize one cached value while keeping plain JSON as plain JSON.
|
|
2388
|
+
*
|
|
2389
|
+
* Rich runtime values use small tagged wrappers. Undefined values are omitted
|
|
2390
|
+
* by default; pass `preserveUndefined: true` to round-trip them explicitly.
|
|
2391
|
+
*/
|
|
2392
|
+
declare function serializeCacheValue(value: unknown, options?: CacheSerializationOptions | undefined): Promise<unknown>;
|
|
2393
|
+
/** Revive one cached value, while preserving legacy JSON-round-tripped data. */
|
|
2394
|
+
declare function deserializeCacheValue(value: unknown): unknown;
|
|
2395
|
+
/** Replace external JSON blob refs with their parsed serialized payloads. */
|
|
2396
|
+
/**
|
|
2397
|
+
* Serialize all rich values captured in a cache recording before persistence.
|
|
2398
|
+
*
|
|
2399
|
+
* Undefined values are omitted by default; pass `preserveUndefined: true` to
|
|
2400
|
+
* retain the legacy explicit undefined wrappers in the recording payload.
|
|
2401
|
+
*/
|
|
2402
|
+
declare function serializeCacheRecording(recording: CacheRecording$1, options?: CacheSerializationOptions | undefined): Promise<CacheRecording$1>;
|
|
2403
|
+
/** Revive all rich values captured in a cache recording after lookup. */
|
|
2404
|
+
declare function deserializeCacheRecording(recording: CacheRecording$1): CacheRecording$1; //#endregion
|
|
2355
2405
|
//#region src/runtime.d.ts
|
|
2356
2406
|
declare global {
|
|
2357
2407
|
var __agentEvalsRealDate: DateConstructor | undefined;
|
|
@@ -2375,7 +2425,8 @@ type CacheDebugKeyWrite = {
|
|
|
2375
2425
|
* starts executing.
|
|
2376
2426
|
*/
|
|
2377
2427
|
type CacheAdapter = {
|
|
2378
|
-
/** Return the stored entry for `keyHash` under `namespace`, or `null`. */lookup(namespace: string, keyHash: string): Promise<CacheEntry$1 | null>;
|
|
2428
|
+
/** Return the stored entry for `keyHash` under `namespace`, or `null`. */lookup(namespace: string, keyHash: string): Promise<CacheEntry$1 | null>; /** Optional store for large nested JSON values persisted outside cache JSON. */
|
|
2429
|
+
externalJsonStore?: CacheSerializationExternalJsonStore;
|
|
2379
2430
|
/**
|
|
2380
2431
|
* Persist a cache entry. Must be safe under concurrent calls.
|
|
2381
2432
|
*
|
|
@@ -2607,54 +2658,6 @@ declare function incrementEvalOutput(key: string, delta: number): void;
|
|
|
2607
2658
|
* call.
|
|
2608
2659
|
*/
|
|
2609
2660
|
declare function evalAssert(condition: unknown, message: string): asserts condition; //#endregion
|
|
2610
|
-
//#region src/cacheSerialization.d.ts
|
|
2611
|
-
declare const serializedCacheValueMarker = "__aecs";
|
|
2612
|
-
declare const jsonSafeCacheValueVersion = "json-safe-v1";
|
|
2613
|
-
type JsonSafeCacheValueType = 'ArrayBuffer' | 'BigInt' | 'Blob' | 'CompressedJson' | 'CompressedString' | 'Date' | 'Error' | 'File' | 'Float64Array' | 'Headers' | 'Map' | 'Number' | 'Object' | 'RegExp' | 'Set' | 'URL' | 'URLSearchParams' | 'Undefined';
|
|
2614
|
-
type JsonSafeSerializedCacheValue = {
|
|
2615
|
-
[serializedCacheValueMarker]: typeof jsonSafeCacheValueVersion;
|
|
2616
|
-
codec?: 'gzip';
|
|
2617
|
-
length?: number;
|
|
2618
|
-
type: JsonSafeCacheValueType;
|
|
2619
|
-
value?: unknown;
|
|
2620
|
-
};
|
|
2621
|
-
/** JSON-safe persisted representation for one rich cached value. */
|
|
2622
|
-
type SerializedCacheValue = JsonSafeSerializedCacheValue;
|
|
2623
|
-
/** Options controlling how rich cache values are persisted as JSON-safe data. */
|
|
2624
|
-
type CacheSerializationOptions = {
|
|
2625
|
-
/**
|
|
2626
|
-
* Preserve JavaScript `undefined` values with explicit tagged wrappers.
|
|
2627
|
-
*
|
|
2628
|
-
* Disabled by default so undefined object fields, array items, map entries,
|
|
2629
|
-
* and set items are omitted instead of being written to cache files.
|
|
2630
|
-
*/
|
|
2631
|
-
preserveUndefined?: boolean;
|
|
2632
|
-
/**
|
|
2633
|
-
* Compress large nested strings/JSON blobs with gzip wrappers.
|
|
2634
|
-
*
|
|
2635
|
-
* Enabled by default for reusable cache files. Disable for output artifacts
|
|
2636
|
-
* that need synchronous browser-side deserialization.
|
|
2637
|
-
*/
|
|
2638
|
-
compress?: boolean;
|
|
2639
|
-
};
|
|
2640
|
-
/**
|
|
2641
|
-
* Serialize one cached value while keeping plain JSON as plain JSON.
|
|
2642
|
-
*
|
|
2643
|
-
* Rich runtime values use small tagged wrappers. Undefined values are omitted
|
|
2644
|
-
* by default; pass `preserveUndefined: true` to round-trip them explicitly.
|
|
2645
|
-
*/
|
|
2646
|
-
declare function serializeCacheValue(value: unknown, options?: CacheSerializationOptions | undefined): Promise<unknown>;
|
|
2647
|
-
/** Revive one cached value, while preserving legacy JSON-round-tripped data. */
|
|
2648
|
-
declare function deserializeCacheValue(value: unknown): unknown;
|
|
2649
|
-
/**
|
|
2650
|
-
* Serialize all rich values captured in a cache recording before persistence.
|
|
2651
|
-
*
|
|
2652
|
-
* Undefined values are omitted by default; pass `preserveUndefined: true` to
|
|
2653
|
-
* retain the legacy explicit undefined wrappers in the recording payload.
|
|
2654
|
-
*/
|
|
2655
|
-
declare function serializeCacheRecording(recording: CacheRecording$1, options?: CacheSerializationOptions | undefined): Promise<CacheRecording$1>;
|
|
2656
|
-
/** Revive all rich values captured in a cache recording after lookup. */
|
|
2657
|
-
declare function deserializeCacheRecording(recording: CacheRecording$1): CacheRecording$1; //#endregion
|
|
2658
2661
|
//#region src/valueCache.d.ts
|
|
2659
2662
|
/** Info accepted by `evalTracer.cache(info, fn)` for spanless value caching. */
|
|
2660
2663
|
type TraceCacheInfo = {
|
|
@@ -3033,9 +3036,9 @@ declare const traceAttributeDisplaySchema: z$1.ZodObject<{
|
|
|
3033
3036
|
subtree: "subtree";
|
|
3034
3037
|
}>>;
|
|
3035
3038
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3036
|
-
sum: "sum";
|
|
3037
|
-
last: "last";
|
|
3038
3039
|
all: "all";
|
|
3040
|
+
last: "last";
|
|
3041
|
+
sum: "sum";
|
|
3039
3042
|
}>>;
|
|
3040
3043
|
}, z$1.core.$strip>;
|
|
3041
3044
|
/**
|
|
@@ -3069,9 +3072,9 @@ declare const traceDisplayConfigSchema: z$1.ZodObject<{
|
|
|
3069
3072
|
subtree: "subtree";
|
|
3070
3073
|
}>>;
|
|
3071
3074
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3072
|
-
sum: "sum";
|
|
3073
|
-
last: "last";
|
|
3074
3075
|
all: "all";
|
|
3076
|
+
last: "last";
|
|
3077
|
+
sum: "sum";
|
|
3075
3078
|
}>>;
|
|
3076
3079
|
}, z$1.core.$strip>>>;
|
|
3077
3080
|
}, z$1.core.$strip>;
|
|
@@ -3109,9 +3112,9 @@ declare const traceAttributeDisplayInputSchema: z$1.ZodObject<{
|
|
|
3109
3112
|
subtree: "subtree";
|
|
3110
3113
|
}>>;
|
|
3111
3114
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3112
|
-
sum: "sum";
|
|
3113
|
-
last: "last";
|
|
3114
3115
|
all: "all";
|
|
3116
|
+
last: "last";
|
|
3117
|
+
sum: "sum";
|
|
3115
3118
|
}>>;
|
|
3116
3119
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3117
3120
|
}, z$1.core.$strip>;
|
|
@@ -3147,9 +3150,9 @@ declare const traceDisplayInputConfigSchema: z$1.ZodObject<{
|
|
|
3147
3150
|
subtree: "subtree";
|
|
3148
3151
|
}>>;
|
|
3149
3152
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3150
|
-
sum: "sum";
|
|
3151
|
-
last: "last";
|
|
3152
3153
|
all: "all";
|
|
3154
|
+
last: "last";
|
|
3155
|
+
sum: "sum";
|
|
3153
3156
|
}>>;
|
|
3154
3157
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
3155
3158
|
}, z$1.core.$strip>>>;
|
|
@@ -3228,11 +3231,11 @@ declare const evalFreshnessStatusSchema: z$1.ZodEnum<{
|
|
|
3228
3231
|
type EvalFreshnessStatus = z$1.infer<typeof evalFreshnessStatusSchema>;
|
|
3229
3232
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3230
3233
|
declare const evalStatAggregateSchema: z$1.ZodEnum<{
|
|
3234
|
+
last: "last";
|
|
3235
|
+
sum: "sum";
|
|
3231
3236
|
avg: "avg";
|
|
3232
3237
|
min: "min";
|
|
3233
3238
|
max: "max";
|
|
3234
|
-
sum: "sum";
|
|
3235
|
-
last: "last";
|
|
3236
3239
|
}>;
|
|
3237
3240
|
/** Reducer used to collapse a column's per-case values into a single stat. */
|
|
3238
3241
|
type EvalStatAggregate = z$1.infer<typeof evalStatAggregateSchema>;
|
|
@@ -3256,11 +3259,11 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
3256
3259
|
key: z$1.ZodString;
|
|
3257
3260
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3258
3261
|
aggregate: z$1.ZodEnum<{
|
|
3262
|
+
last: "last";
|
|
3263
|
+
sum: "sum";
|
|
3259
3264
|
avg: "avg";
|
|
3260
3265
|
min: "min";
|
|
3261
3266
|
max: "max";
|
|
3262
|
-
sum: "sum";
|
|
3263
|
-
last: "last";
|
|
3264
3267
|
}>;
|
|
3265
3268
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3266
3269
|
number: "number";
|
|
@@ -3298,11 +3301,11 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
|
|
|
3298
3301
|
key: z$1.ZodString;
|
|
3299
3302
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3300
3303
|
aggregate: z$1.ZodEnum<{
|
|
3304
|
+
last: "last";
|
|
3305
|
+
sum: "sum";
|
|
3301
3306
|
avg: "avg";
|
|
3302
3307
|
min: "min";
|
|
3303
3308
|
max: "max";
|
|
3304
|
-
sum: "sum";
|
|
3305
|
-
last: "last";
|
|
3306
3309
|
}>;
|
|
3307
3310
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3308
3311
|
number: "number";
|
|
@@ -3378,10 +3381,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3378
3381
|
caseIds: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
3379
3382
|
lastRunStatus: z$1.ZodNullable<z$1.ZodEnum<{
|
|
3380
3383
|
error: "error";
|
|
3381
|
-
pass: "pass";
|
|
3382
|
-
fail: "fail";
|
|
3383
3384
|
running: "running";
|
|
3384
3385
|
cancelled: "cancelled";
|
|
3386
|
+
pass: "pass";
|
|
3387
|
+
fail: "fail";
|
|
3385
3388
|
unscored: "unscored";
|
|
3386
3389
|
}>>;
|
|
3387
3390
|
stats: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
@@ -3400,11 +3403,11 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3400
3403
|
key: z$1.ZodString;
|
|
3401
3404
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
3402
3405
|
aggregate: z$1.ZodEnum<{
|
|
3406
|
+
last: "last";
|
|
3407
|
+
sum: "sum";
|
|
3403
3408
|
avg: "avg";
|
|
3404
3409
|
min: "min";
|
|
3405
3410
|
max: "max";
|
|
3406
|
-
sum: "sum";
|
|
3407
|
-
last: "last";
|
|
3408
3411
|
}>;
|
|
3409
3412
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3410
3413
|
number: "number";
|
|
@@ -3442,9 +3445,9 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3442
3445
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3443
3446
|
success: "success";
|
|
3444
3447
|
error: "error";
|
|
3448
|
+
warning: "warning";
|
|
3445
3449
|
accent: "accent";
|
|
3446
3450
|
accentDim: "accentDim";
|
|
3447
|
-
warning: "warning";
|
|
3448
3451
|
textMuted: "textMuted";
|
|
3449
3452
|
}>>;
|
|
3450
3453
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3455,10 +3458,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3455
3458
|
source: z$1.ZodLiteral<"column">;
|
|
3456
3459
|
key: z$1.ZodString;
|
|
3457
3460
|
aggregate: z$1.ZodEnum<{
|
|
3461
|
+
sum: "sum";
|
|
3458
3462
|
avg: "avg";
|
|
3459
3463
|
min: "min";
|
|
3460
3464
|
max: "max";
|
|
3461
|
-
sum: "sum";
|
|
3462
3465
|
latest: "latest";
|
|
3463
3466
|
passThresholdRate: "passThresholdRate";
|
|
3464
3467
|
}>;
|
|
@@ -3466,9 +3469,9 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3466
3469
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3467
3470
|
success: "success";
|
|
3468
3471
|
error: "error";
|
|
3472
|
+
warning: "warning";
|
|
3469
3473
|
accent: "accent";
|
|
3470
3474
|
accentDim: "accentDim";
|
|
3471
|
-
warning: "warning";
|
|
3472
3475
|
textMuted: "textMuted";
|
|
3473
3476
|
}>>;
|
|
3474
3477
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -3497,10 +3500,10 @@ declare const evalSummarySchema: z$1.ZodObject<{
|
|
|
3497
3500
|
source: z$1.ZodLiteral<"column">;
|
|
3498
3501
|
key: z$1.ZodString;
|
|
3499
3502
|
aggregate: z$1.ZodEnum<{
|
|
3503
|
+
sum: "sum";
|
|
3500
3504
|
avg: "avg";
|
|
3501
3505
|
min: "min";
|
|
3502
3506
|
max: "max";
|
|
3503
|
-
sum: "sum";
|
|
3504
3507
|
latest: "latest";
|
|
3505
3508
|
passThresholdRate: "passThresholdRate";
|
|
3506
3509
|
}>;
|
|
@@ -3596,11 +3599,11 @@ declare const caseRowSchema: z$1.ZodObject<{
|
|
|
3596
3599
|
evalId: z$1.ZodString;
|
|
3597
3600
|
status: z$1.ZodEnum<{
|
|
3598
3601
|
error: "error";
|
|
3599
|
-
|
|
3600
|
-
fail: "fail";
|
|
3602
|
+
pending: "pending";
|
|
3601
3603
|
running: "running";
|
|
3602
3604
|
cancelled: "cancelled";
|
|
3603
|
-
|
|
3605
|
+
pass: "pass";
|
|
3606
|
+
fail: "fail";
|
|
3604
3607
|
}>;
|
|
3605
3608
|
durationMs: z$1.ZodNullable<z$1.ZodNumber>;
|
|
3606
3609
|
costUsd: z$1.ZodOptional<z$1.ZodNullable<z$1.ZodNumber>>;
|
|
@@ -3743,9 +3746,9 @@ declare const scoreTraceSchema: z$1.ZodObject<{
|
|
|
3743
3746
|
subtree: "subtree";
|
|
3744
3747
|
}>>;
|
|
3745
3748
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3746
|
-
sum: "sum";
|
|
3747
|
-
last: "last";
|
|
3748
3749
|
all: "all";
|
|
3750
|
+
last: "last";
|
|
3751
|
+
sum: "sum";
|
|
3749
3752
|
}>>;
|
|
3750
3753
|
}, z$1.core.$strip>>>;
|
|
3751
3754
|
}, z$1.core.$strip>;
|
|
@@ -3760,11 +3763,11 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3760
3763
|
evalId: z$1.ZodString;
|
|
3761
3764
|
status: z$1.ZodEnum<{
|
|
3762
3765
|
error: "error";
|
|
3763
|
-
|
|
3764
|
-
fail: "fail";
|
|
3766
|
+
pending: "pending";
|
|
3765
3767
|
running: "running";
|
|
3766
3768
|
cancelled: "cancelled";
|
|
3767
|
-
|
|
3769
|
+
pass: "pass";
|
|
3770
|
+
fail: "fail";
|
|
3768
3771
|
}>;
|
|
3769
3772
|
input: z$1.ZodUnknown;
|
|
3770
3773
|
trace: z$1.ZodArray<z$1.ZodObject<{
|
|
@@ -3829,9 +3832,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3829
3832
|
subtree: "subtree";
|
|
3830
3833
|
}>>;
|
|
3831
3834
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3832
|
-
sum: "sum";
|
|
3833
|
-
last: "last";
|
|
3834
3835
|
all: "all";
|
|
3836
|
+
last: "last";
|
|
3837
|
+
sum: "sum";
|
|
3835
3838
|
}>>;
|
|
3836
3839
|
}, z$1.core.$strip>>>;
|
|
3837
3840
|
}, z$1.core.$strip>;
|
|
@@ -3898,9 +3901,9 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3898
3901
|
subtree: "subtree";
|
|
3899
3902
|
}>>;
|
|
3900
3903
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
3901
|
-
sum: "sum";
|
|
3902
|
-
last: "last";
|
|
3903
3904
|
all: "all";
|
|
3905
|
+
last: "last";
|
|
3906
|
+
sum: "sum";
|
|
3904
3907
|
}>>;
|
|
3905
3908
|
}, z$1.core.$strip>>>;
|
|
3906
3909
|
}, z$1.core.$strip>;
|
|
@@ -3960,10 +3963,10 @@ declare const caseDetailSchema: z$1.ZodObject<{
|
|
|
3960
3963
|
namespace: z$1.ZodString;
|
|
3961
3964
|
key: z$1.ZodString;
|
|
3962
3965
|
status: z$1.ZodEnum<{
|
|
3966
|
+
bypass: "bypass";
|
|
3967
|
+
refresh: "refresh";
|
|
3963
3968
|
hit: "hit";
|
|
3964
3969
|
miss: "miss";
|
|
3965
|
-
refresh: "refresh";
|
|
3966
|
-
bypass: "bypass";
|
|
3967
3970
|
}>;
|
|
3968
3971
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
3969
3972
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -4034,10 +4037,10 @@ declare const evalChartBuiltinMetricSchema: z$1.ZodEnum<{
|
|
|
4034
4037
|
type EvalChartBuiltinMetric = z$1.infer<typeof evalChartBuiltinMetricSchema>;
|
|
4035
4038
|
/** Reducer applied to a numeric column across all cases of a single run. */
|
|
4036
4039
|
declare const evalChartAggregateSchema: z$1.ZodEnum<{
|
|
4040
|
+
sum: "sum";
|
|
4037
4041
|
avg: "avg";
|
|
4038
4042
|
min: "min";
|
|
4039
4043
|
max: "max";
|
|
4040
|
-
sum: "sum";
|
|
4041
4044
|
latest: "latest";
|
|
4042
4045
|
passThresholdRate: "passThresholdRate";
|
|
4043
4046
|
}>;
|
|
@@ -4050,9 +4053,9 @@ type EvalChartAggregate = z$1.infer<typeof evalChartAggregateSchema>;
|
|
|
4050
4053
|
declare const evalChartColorSchema: z$1.ZodEnum<{
|
|
4051
4054
|
success: "success";
|
|
4052
4055
|
error: "error";
|
|
4056
|
+
warning: "warning";
|
|
4053
4057
|
accent: "accent";
|
|
4054
4058
|
accentDim: "accentDim";
|
|
4055
|
-
warning: "warning";
|
|
4056
4059
|
textMuted: "textMuted";
|
|
4057
4060
|
}>;
|
|
4058
4061
|
/** Semantic color token resolved to a theme color by the web UI. */
|
|
@@ -4079,9 +4082,9 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4079
4082
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4080
4083
|
success: "success";
|
|
4081
4084
|
error: "error";
|
|
4085
|
+
warning: "warning";
|
|
4082
4086
|
accent: "accent";
|
|
4083
4087
|
accentDim: "accentDim";
|
|
4084
|
-
warning: "warning";
|
|
4085
4088
|
textMuted: "textMuted";
|
|
4086
4089
|
}>>;
|
|
4087
4090
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4092,10 +4095,10 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4092
4095
|
source: z$1.ZodLiteral<"column">;
|
|
4093
4096
|
key: z$1.ZodString;
|
|
4094
4097
|
aggregate: z$1.ZodEnum<{
|
|
4098
|
+
sum: "sum";
|
|
4095
4099
|
avg: "avg";
|
|
4096
4100
|
min: "min";
|
|
4097
4101
|
max: "max";
|
|
4098
|
-
sum: "sum";
|
|
4099
4102
|
latest: "latest";
|
|
4100
4103
|
passThresholdRate: "passThresholdRate";
|
|
4101
4104
|
}>;
|
|
@@ -4103,9 +4106,9 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
|
|
|
4103
4106
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4104
4107
|
success: "success";
|
|
4105
4108
|
error: "error";
|
|
4109
|
+
warning: "warning";
|
|
4106
4110
|
accent: "accent";
|
|
4107
4111
|
accentDim: "accentDim";
|
|
4108
|
-
warning: "warning";
|
|
4109
4112
|
textMuted: "textMuted";
|
|
4110
4113
|
}>>;
|
|
4111
4114
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4127,10 +4130,10 @@ declare const evalChartTooltipExtraSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObj
|
|
|
4127
4130
|
source: z$1.ZodLiteral<"column">;
|
|
4128
4131
|
key: z$1.ZodString;
|
|
4129
4132
|
aggregate: z$1.ZodEnum<{
|
|
4133
|
+
sum: "sum";
|
|
4130
4134
|
avg: "avg";
|
|
4131
4135
|
min: "min";
|
|
4132
4136
|
max: "max";
|
|
4133
|
-
sum: "sum";
|
|
4134
4137
|
latest: "latest";
|
|
4135
4138
|
passThresholdRate: "passThresholdRate";
|
|
4136
4139
|
}>;
|
|
@@ -4162,9 +4165,9 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4162
4165
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4163
4166
|
success: "success";
|
|
4164
4167
|
error: "error";
|
|
4168
|
+
warning: "warning";
|
|
4165
4169
|
accent: "accent";
|
|
4166
4170
|
accentDim: "accentDim";
|
|
4167
|
-
warning: "warning";
|
|
4168
4171
|
textMuted: "textMuted";
|
|
4169
4172
|
}>>;
|
|
4170
4173
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4175,10 +4178,10 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4175
4178
|
source: z$1.ZodLiteral<"column">;
|
|
4176
4179
|
key: z$1.ZodString;
|
|
4177
4180
|
aggregate: z$1.ZodEnum<{
|
|
4181
|
+
sum: "sum";
|
|
4178
4182
|
avg: "avg";
|
|
4179
4183
|
min: "min";
|
|
4180
4184
|
max: "max";
|
|
4181
|
-
sum: "sum";
|
|
4182
4185
|
latest: "latest";
|
|
4183
4186
|
passThresholdRate: "passThresholdRate";
|
|
4184
4187
|
}>;
|
|
@@ -4186,9 +4189,9 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4186
4189
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4187
4190
|
success: "success";
|
|
4188
4191
|
error: "error";
|
|
4192
|
+
warning: "warning";
|
|
4189
4193
|
accent: "accent";
|
|
4190
4194
|
accentDim: "accentDim";
|
|
4191
|
-
warning: "warning";
|
|
4192
4195
|
textMuted: "textMuted";
|
|
4193
4196
|
}>>;
|
|
4194
4197
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4217,10 +4220,10 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
|
|
|
4217
4220
|
source: z$1.ZodLiteral<"column">;
|
|
4218
4221
|
key: z$1.ZodString;
|
|
4219
4222
|
aggregate: z$1.ZodEnum<{
|
|
4223
|
+
sum: "sum";
|
|
4220
4224
|
avg: "avg";
|
|
4221
4225
|
min: "min";
|
|
4222
4226
|
max: "max";
|
|
4223
|
-
sum: "sum";
|
|
4224
4227
|
latest: "latest";
|
|
4225
4228
|
passThresholdRate: "passThresholdRate";
|
|
4226
4229
|
}>;
|
|
@@ -4252,9 +4255,9 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4252
4255
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4253
4256
|
success: "success";
|
|
4254
4257
|
error: "error";
|
|
4258
|
+
warning: "warning";
|
|
4255
4259
|
accent: "accent";
|
|
4256
4260
|
accentDim: "accentDim";
|
|
4257
|
-
warning: "warning";
|
|
4258
4261
|
textMuted: "textMuted";
|
|
4259
4262
|
}>>;
|
|
4260
4263
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4265,10 +4268,10 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4265
4268
|
source: z$1.ZodLiteral<"column">;
|
|
4266
4269
|
key: z$1.ZodString;
|
|
4267
4270
|
aggregate: z$1.ZodEnum<{
|
|
4271
|
+
sum: "sum";
|
|
4268
4272
|
avg: "avg";
|
|
4269
4273
|
min: "min";
|
|
4270
4274
|
max: "max";
|
|
4271
|
-
sum: "sum";
|
|
4272
4275
|
latest: "latest";
|
|
4273
4276
|
passThresholdRate: "passThresholdRate";
|
|
4274
4277
|
}>;
|
|
@@ -4276,9 +4279,9 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4276
4279
|
color: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4277
4280
|
success: "success";
|
|
4278
4281
|
error: "error";
|
|
4282
|
+
warning: "warning";
|
|
4279
4283
|
accent: "accent";
|
|
4280
4284
|
accentDim: "accentDim";
|
|
4281
|
-
warning: "warning";
|
|
4282
4285
|
textMuted: "textMuted";
|
|
4283
4286
|
}>>;
|
|
4284
4287
|
axis: z$1.ZodOptional<z$1.ZodEnum<{
|
|
@@ -4307,10 +4310,10 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
|
|
|
4307
4310
|
source: z$1.ZodLiteral<"column">;
|
|
4308
4311
|
key: z$1.ZodString;
|
|
4309
4312
|
aggregate: z$1.ZodEnum<{
|
|
4313
|
+
sum: "sum";
|
|
4310
4314
|
avg: "avg";
|
|
4311
4315
|
min: "min";
|
|
4312
4316
|
max: "max";
|
|
4313
|
-
sum: "sum";
|
|
4314
4317
|
latest: "latest";
|
|
4315
4318
|
passThresholdRate: "passThresholdRate";
|
|
4316
4319
|
}>;
|
|
@@ -4326,10 +4329,10 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4326
4329
|
shortId: z$1.ZodString;
|
|
4327
4330
|
status: z$1.ZodEnum<{
|
|
4328
4331
|
error: "error";
|
|
4329
|
-
running: "running";
|
|
4330
|
-
cancelled: "cancelled";
|
|
4331
4332
|
pending: "pending";
|
|
4333
|
+
running: "running";
|
|
4332
4334
|
completed: "completed";
|
|
4335
|
+
cancelled: "cancelled";
|
|
4333
4336
|
}>;
|
|
4334
4337
|
temporary: z$1.ZodDefault<z$1.ZodOptional<z$1.ZodBoolean>>;
|
|
4335
4338
|
startedAt: z$1.ZodString;
|
|
@@ -4338,9 +4341,9 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4338
4341
|
evalSourceFingerprints: z$1.ZodDefault<z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodString>>>;
|
|
4339
4342
|
target: z$1.ZodObject<{
|
|
4340
4343
|
mode: z$1.ZodEnum<{
|
|
4341
|
-
caseIds: "caseIds";
|
|
4342
4344
|
all: "all";
|
|
4343
4345
|
evalIds: "evalIds";
|
|
4346
|
+
caseIds: "caseIds";
|
|
4344
4347
|
}>;
|
|
4345
4348
|
evalKeys: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
4346
4349
|
files: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
@@ -4353,9 +4356,9 @@ declare const runManifestSchema: z$1.ZodObject<{
|
|
|
4353
4356
|
median: "median";
|
|
4354
4357
|
}>>>;
|
|
4355
4358
|
cacheMode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
4356
|
-
refresh: "refresh";
|
|
4357
|
-
bypass: "bypass";
|
|
4358
4359
|
use: "use";
|
|
4360
|
+
bypass: "bypass";
|
|
4361
|
+
refresh: "refresh";
|
|
4359
4362
|
}>>;
|
|
4360
4363
|
}, z$1.core.$strip>;
|
|
4361
4364
|
/** Persisted lifecycle metadata for a single eval run. */
|
|
@@ -4365,10 +4368,10 @@ declare const runSummarySchema: z$1.ZodObject<{
|
|
|
4365
4368
|
runId: z$1.ZodString;
|
|
4366
4369
|
status: z$1.ZodEnum<{
|
|
4367
4370
|
error: "error";
|
|
4368
|
-
running: "running";
|
|
4369
|
-
cancelled: "cancelled";
|
|
4370
4371
|
pending: "pending";
|
|
4372
|
+
running: "running";
|
|
4371
4373
|
completed: "completed";
|
|
4374
|
+
cancelled: "cancelled";
|
|
4372
4375
|
}>;
|
|
4373
4376
|
totalCases: z$1.ZodNumber;
|
|
4374
4377
|
passedCases: z$1.ZodNumber;
|
|
@@ -5161,9 +5164,9 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5161
5164
|
subtree: "subtree";
|
|
5162
5165
|
}>>;
|
|
5163
5166
|
mode: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5164
|
-
sum: "sum";
|
|
5165
|
-
last: "last";
|
|
5166
5167
|
all: "all";
|
|
5168
|
+
last: "last";
|
|
5169
|
+
sum: "sum";
|
|
5167
5170
|
}>>;
|
|
5168
5171
|
transform: z$1.ZodOptional<z$1.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
5169
5172
|
}, z$1.core.$strip>>>;
|
|
@@ -5186,11 +5189,11 @@ declare const agentEvalsConfigSchema: z$1.ZodObject<{
|
|
|
5186
5189
|
key: z$1.ZodString;
|
|
5187
5190
|
label: z$1.ZodOptional<z$1.ZodString>;
|
|
5188
5191
|
aggregate: z$1.ZodEnum<{
|
|
5192
|
+
last: "last";
|
|
5193
|
+
sum: "sum";
|
|
5189
5194
|
avg: "avg";
|
|
5190
5195
|
min: "min";
|
|
5191
5196
|
max: "max";
|
|
5192
|
-
sum: "sum";
|
|
5193
|
-
last: "last";
|
|
5194
5197
|
}>;
|
|
5195
5198
|
format: z$1.ZodOptional<z$1.ZodEnum<{
|
|
5196
5199
|
number: "number";
|
|
@@ -5539,9 +5542,9 @@ declare function extractApiCalls(spans: EvalTraceSpan[], config: ResolvedApiCall
|
|
|
5539
5542
|
* - `refresh`: never read, always write (forces re-execution and overwrites).
|
|
5540
5543
|
*/
|
|
5541
5544
|
declare const cacheModeSchema: z$1.ZodEnum<{
|
|
5542
|
-
refresh: "refresh";
|
|
5543
|
-
bypass: "bypass";
|
|
5544
5545
|
use: "use";
|
|
5546
|
+
bypass: "bypass";
|
|
5547
|
+
refresh: "refresh";
|
|
5545
5548
|
}>;
|
|
5546
5549
|
/** Mode controlling how cached spans behave during a run. */
|
|
5547
5550
|
type CacheMode = z$1.infer<typeof cacheModeSchema>;
|
|
@@ -5562,10 +5565,10 @@ declare const cacheOperationTypeSchema: z$1.ZodEnum<{
|
|
|
5562
5565
|
type CacheOperationType = z$1.infer<typeof cacheOperationTypeSchema>;
|
|
5563
5566
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5564
5567
|
declare const cacheStatusSchema: z$1.ZodEnum<{
|
|
5568
|
+
bypass: "bypass";
|
|
5569
|
+
refresh: "refresh";
|
|
5565
5570
|
hit: "hit";
|
|
5566
5571
|
miss: "miss";
|
|
5567
|
-
refresh: "refresh";
|
|
5568
|
-
bypass: "bypass";
|
|
5569
5572
|
}>;
|
|
5570
5573
|
/** Status of a cache lookup recorded on a span or case scope. */
|
|
5571
5574
|
type CacheStatus = z$1.infer<typeof cacheStatusSchema>;
|
|
@@ -5582,10 +5585,10 @@ declare const traceCacheRefSchema: z$1.ZodObject<{
|
|
|
5582
5585
|
namespace: z$1.ZodString;
|
|
5583
5586
|
key: z$1.ZodString;
|
|
5584
5587
|
status: z$1.ZodEnum<{
|
|
5588
|
+
bypass: "bypass";
|
|
5589
|
+
refresh: "refresh";
|
|
5585
5590
|
hit: "hit";
|
|
5586
5591
|
miss: "miss";
|
|
5587
|
-
refresh: "refresh";
|
|
5588
|
-
bypass: "bypass";
|
|
5589
5592
|
}>;
|
|
5590
5593
|
read: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
5591
5594
|
stored: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
@@ -6089,9 +6092,9 @@ type ConfigReloadState = z$1.infer<typeof configReloadStateSchema>;
|
|
|
6089
6092
|
declare const createRunRequestSchema: z$1.ZodObject<{
|
|
6090
6093
|
target: z$1.ZodObject<{
|
|
6091
6094
|
mode: z$1.ZodEnum<{
|
|
6092
|
-
caseIds: "caseIds";
|
|
6093
6095
|
all: "all";
|
|
6094
6096
|
evalIds: "evalIds";
|
|
6097
|
+
caseIds: "caseIds";
|
|
6095
6098
|
}>;
|
|
6096
6099
|
evalKeys: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
6097
6100
|
files: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
|
|
@@ -6102,9 +6105,9 @@ declare const createRunRequestSchema: z$1.ZodObject<{
|
|
|
6102
6105
|
temporary: z$1.ZodOptional<z$1.ZodBoolean>;
|
|
6103
6106
|
cache: z$1.ZodOptional<z$1.ZodObject<{
|
|
6104
6107
|
mode: z$1.ZodDefault<z$1.ZodEnum<{
|
|
6105
|
-
refresh: "refresh";
|
|
6106
|
-
bypass: "bypass";
|
|
6107
6108
|
use: "use";
|
|
6109
|
+
bypass: "bypass";
|
|
6110
|
+
refresh: "refresh";
|
|
6108
6111
|
}>>;
|
|
6109
6112
|
}, z$1.core.$strip>>;
|
|
6110
6113
|
manualInputs: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;
|
package/dist/index.mjs
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { $ as apiCallMetricFormatSchema, $n as evalAssert, $t as evalChartTypeSchema, A as configReloadStateSchema, An as jsonCellSchema, At as evalStatsConfigSchema, B as simulateTokenAllocation, Bn as hashCacheKeySync, Bt as manualInputJsonFieldSchema, Cn as traceSpanSchema, Ct as assertionFailureSchema, Dn as columnFormatSchema, Dt as evalFreshnessStatusSchema, En as columnDefSchema, Et as discoveryIssueSchema, F as extractCacheEntries, Fn as buildTraceTree, Ft as runLogPhaseSchema, G as deriveScopedSummaryFromCases, Gn as repoFile, Gt as manualInputTextFieldSchema, H as getNestedAttribute, Hn as deserializeCacheValue, Ht as manualInputNumberFieldSchema, I as extractCacheHits, In as captureEvalSpanError, It as scoreTraceSchema, J as runManifestSchema, Jn as evalExpect, Jt as evalChartBuiltinMetricSchema, K as deriveStatusFromCaseRows, Kn as manualInputFileValueSchema, Kt as evalChartAggregateSchema, L as extractApiCalls, Ln as evalSpan, Lt as manualInputBooleanFieldSchema, M as createRunRequestSchema, Mn as repoFileRefSchema, Mt as runLogEntrySchema, N as updateManualScoreRequestSchema, Nn as runArtifactRefSchema, Nt as runLogLevelSchema, On as columnKindSchema, Ot as evalStatAggregateSchema, P as sseEnvelopeSchema, Pn as z, Pt as runLogLocationSchema, Q as agentEvalsConfigSchema, Qt as evalChartTooltipExtraSchema, R as extractLlmCalls, Rn as evalTracer, Rt as manualInputDescriptorSchema, Sn as traceSpanKindSchema, St as getCaseRowEvalKey, Tn as cellValueSchema, Tt as caseRowSchema, U as getEvalTitle, Un as serializeCacheRecording, Ut as manualInputSelectFieldSchema, V as applyDerivedCallAttributes, Vn as deserializeCacheRecording, Vt as manualInputMultilineFieldSchema, W as getEvalDisplayStatus, Wn as serializeCacheValue, Wt as manualInputSelectOptionSchema, X as DEFAULT_API_CALLS_CONFIG, Xn as advanceEvalTime, Xt as evalChartConfigSchema, Y as runSummarySchema, Yn as EvalAssertionError, Yt as evalChartColorSchema, Z as DEFAULT_LLM_CALLS_CONFIG, Zn as appendToEvalOutput, Zt as evalChartMetricSchema, _n as traceAttributeDisplayPlacementSchema, _t as runLogsConfigSchema, an as cacheFileSchema, ar as isInEvalScope, at as evalColumnsSchema, bn as traceDisplayInputConfigSchema, bt as buildEvalKey, cn as cacheOperationTypeSchema, cr as runInEvalRuntimeScope, ct as llmCallMetricFormatSchema, dn as cacheStatusSchema, dr as setEvalOutput, dt as llmCallPricingRateSchema, en as evalChartsConfigSchema, er as evalLog, et as apiCallMetricPlacementSchema, fn as serializedCacheSpanSchema, fr as setScopeCacheContext, ft as llmCallPricingSchema, gn as traceAttributeDisplayInputSchema, gt as resolveLlmCallsConfig, hn as traceAttributeDisplayFormatSchema, hr as getEvalRegistry, ht as resolveApiCallsConfig, in as cacheEntryWithDebugKeySchema, ir as incrementEvalOutput, it as evalColumnOverrideSchema, j as configReloadStatusSchema, jn as numberDisplayOptionsSchema, jt as evalSummarySchema, kn as fileRefSchema, kt as evalStatItemSchema, ln as cacheRecordingOpSchema, lr as runInEvalScope, lt as llmCallMetricPlacementSchema, mn as traceCacheRefSchema, mr as defineEval, mt as removeDefaultConfigSchema, nn as cacheDebugKeyFileSchema, nr as getEvalCaseInput, nt as apiCallsConfigSchema, on as cacheListItemSchema, or as mergeEvalOutput, ot as evalDeriveConfigSchema, pn as spanCacheOptionsSchema, pr as startEvalBackgroundJob, pt as llmCallsConfigSchema, q as deriveStatusFromChildStatuses, qn as readManualInputFile, qt as evalChartAxisSchema, rn as cacheEntrySchema, rr as getEvalStartTime, rt as defaultConfigKeySchema, sn as cacheModeSchema, sr as nextEvalId, st as llmCallCostCurrencySchema, tn as cacheDebugKeyEntrySchema, tr as getCurrentScope, tt as apiCallMetricSchema, un as cacheRecordingSchema, ur as runInExistingEvalScope, ut as llmCallMetricSchema, vn as traceAttributeDisplaySchema, vt as trialSelectionModeSchema, wn as traceSpanWarningSchema, wt as caseDetailSchema, xn as traceSpanErrorSchema, xt as getCaseRowCaseKey, yn as traceDisplayConfigSchema, yt as buildCaseKey, z as simulateLlmCallCost, zn as hashCacheKey, zt as manualInputFieldDescriptorSchema } from "./runOrchestration-
|
|
2
|
-
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-
|
|
3
|
-
import "./src
|
|
1
|
+
import { $ as apiCallMetricFormatSchema, $n as evalAssert, $t as evalChartTypeSchema, A as configReloadStateSchema, An as jsonCellSchema, At as evalStatsConfigSchema, B as simulateTokenAllocation, Bn as hashCacheKeySync, Bt as manualInputJsonFieldSchema, Cn as traceSpanSchema, Ct as assertionFailureSchema, Dn as columnFormatSchema, Dt as evalFreshnessStatusSchema, En as columnDefSchema, Et as discoveryIssueSchema, F as extractCacheEntries, Fn as buildTraceTree, Ft as runLogPhaseSchema, G as deriveScopedSummaryFromCases, Gn as repoFile, Gt as manualInputTextFieldSchema, H as getNestedAttribute, Hn as deserializeCacheValue, Ht as manualInputNumberFieldSchema, I as extractCacheHits, In as captureEvalSpanError, It as scoreTraceSchema, J as runManifestSchema, Jn as evalExpect, Jt as evalChartBuiltinMetricSchema, K as deriveStatusFromCaseRows, Kn as manualInputFileValueSchema, Kt as evalChartAggregateSchema, L as extractApiCalls, Ln as evalSpan, Lt as manualInputBooleanFieldSchema, M as createRunRequestSchema, Mn as repoFileRefSchema, Mt as runLogEntrySchema, N as updateManualScoreRequestSchema, Nn as runArtifactRefSchema, Nt as runLogLevelSchema, On as columnKindSchema, Ot as evalStatAggregateSchema, P as sseEnvelopeSchema, Pn as z, Pt as runLogLocationSchema, Q as agentEvalsConfigSchema, Qt as evalChartTooltipExtraSchema, R as extractLlmCalls, Rn as evalTracer, Rt as manualInputDescriptorSchema, Sn as traceSpanKindSchema, St as getCaseRowEvalKey, Tn as cellValueSchema, Tt as caseRowSchema, U as getEvalTitle, Un as serializeCacheRecording, Ut as manualInputSelectFieldSchema, V as applyDerivedCallAttributes, Vn as deserializeCacheRecording, Vt as manualInputMultilineFieldSchema, W as getEvalDisplayStatus, Wn as serializeCacheValue, Wt as manualInputSelectOptionSchema, X as DEFAULT_API_CALLS_CONFIG, Xn as advanceEvalTime, Xt as evalChartConfigSchema, Y as runSummarySchema, Yn as EvalAssertionError, Yt as evalChartColorSchema, Z as DEFAULT_LLM_CALLS_CONFIG, Zn as appendToEvalOutput, Zt as evalChartMetricSchema, _n as traceAttributeDisplayPlacementSchema, _t as runLogsConfigSchema, an as cacheFileSchema, ar as isInEvalScope, at as evalColumnsSchema, bn as traceDisplayInputConfigSchema, bt as buildEvalKey, cn as cacheOperationTypeSchema, cr as runInEvalRuntimeScope, ct as llmCallMetricFormatSchema, dn as cacheStatusSchema, dr as setEvalOutput, dt as llmCallPricingRateSchema, en as evalChartsConfigSchema, er as evalLog, et as apiCallMetricPlacementSchema, fn as serializedCacheSpanSchema, fr as setScopeCacheContext, ft as llmCallPricingSchema, gn as traceAttributeDisplayInputSchema, gt as resolveLlmCallsConfig, hn as traceAttributeDisplayFormatSchema, hr as getEvalRegistry, ht as resolveApiCallsConfig, in as cacheEntryWithDebugKeySchema, ir as incrementEvalOutput, it as evalColumnOverrideSchema, j as configReloadStatusSchema, jn as numberDisplayOptionsSchema, jt as evalSummarySchema, kn as fileRefSchema, kt as evalStatItemSchema, ln as cacheRecordingOpSchema, lr as runInEvalScope, lt as llmCallMetricPlacementSchema, mn as traceCacheRefSchema, mr as defineEval, mt as removeDefaultConfigSchema, nn as cacheDebugKeyFileSchema, nr as getEvalCaseInput, nt as apiCallsConfigSchema, on as cacheListItemSchema, or as mergeEvalOutput, ot as evalDeriveConfigSchema, pn as spanCacheOptionsSchema, pr as startEvalBackgroundJob, pt as llmCallsConfigSchema, q as deriveStatusFromChildStatuses, qn as readManualInputFile, qt as evalChartAxisSchema, rn as cacheEntrySchema, rr as getEvalStartTime, rt as defaultConfigKeySchema, sn as cacheModeSchema, sr as nextEvalId, st as llmCallCostCurrencySchema, tn as cacheDebugKeyEntrySchema, tr as getCurrentScope, tt as apiCallMetricSchema, un as cacheRecordingSchema, ur as runInExistingEvalScope, ut as llmCallMetricSchema, vn as traceAttributeDisplaySchema, vt as trialSelectionModeSchema, wn as traceSpanWarningSchema, wt as caseDetailSchema, xn as traceSpanErrorSchema, xt as getCaseRowCaseKey, yn as traceDisplayConfigSchema, yt as buildCaseKey, z as simulateLlmCallCost, zn as hashCacheKey, zt as manualInputFieldDescriptorSchema } from "./runOrchestration-BhUFWvq9.mjs";
|
|
2
|
+
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-BUX6tr9J.mjs";
|
|
3
|
+
import "./src-BwJ5tod2.mjs";
|
|
4
4
|
export { DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, EvalAssertionError, advanceEvalTime, agentEvalsConfigSchema, apiCallMetricFormatSchema, apiCallMetricPlacementSchema, apiCallMetricSchema, apiCallsConfigSchema, appendToEvalOutput, applyDerivedCallAttributes, assertionFailureSchema, buildCaseKey, buildEvalKey, buildTraceTree, cacheDebugKeyEntrySchema, cacheDebugKeyFileSchema, cacheEntrySchema, cacheEntryWithDebugKeySchema, cacheFileSchema, cacheListItemSchema, cacheModeSchema, cacheOperationTypeSchema, cacheRecordingOpSchema, cacheRecordingSchema, cacheStatusSchema, captureEvalSpanError, caseDetailSchema, caseRowSchema, cellValueSchema, cleanupStagedManualInputFiles, columnDefSchema, columnFormatSchema, columnKindSchema, configReloadStateSchema, configReloadStatusSchema, createRunRequestSchema, createRunner, defaultConfigKeySchema, defineEval, deriveScopedSummaryFromCases, deriveStatusFromCaseRows, deriveStatusFromChildStatuses, deserializeCacheRecording, deserializeCacheValue, discoveryIssueSchema, evalAssert, evalChartAggregateSchema, evalChartAxisSchema, evalChartBuiltinMetricSchema, evalChartColorSchema, evalChartConfigSchema, evalChartMetricSchema, evalChartTooltipExtraSchema, evalChartTypeSchema, evalChartsConfigSchema, evalColumnOverrideSchema, evalColumnsSchema, evalDeriveConfigSchema, evalExpect, evalFreshnessStatusSchema, evalLog, evalSpan, evalStatAggregateSchema, evalStatItemSchema, evalStatsConfigSchema, evalSummarySchema, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, fileRefSchema, getCaseRowCaseKey, getCaseRowEvalKey, getCurrentScope, getEvalCaseInput, getEvalDisplayStatus, getEvalRegistry, getEvalStartTime, getEvalTitle, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, jsonCellSchema, llmCallCostCurrencySchema, llmCallMetricFormatSchema, llmCallMetricPlacementSchema, llmCallMetricSchema, llmCallPricingRateSchema, llmCallPricingSchema, llmCallsConfigSchema, manualInputBooleanFieldSchema, manualInputDescriptorSchema, manualInputFieldDescriptorSchema, manualInputFileValueSchema, manualInputJsonFieldSchema, manualInputMultilineFieldSchema, manualInputNumberFieldSchema, manualInputSelectFieldSchema, manualInputSelectOptionSchema, manualInputTextFieldSchema, materializeManualInputFiles, mergeEvalOutput, nextEvalId, numberDisplayOptionsSchema, readManualInputFile, removeDefaultConfigSchema, repoFile, repoFileRefSchema, resolveApiCallsConfig, resolveLlmCallsConfig, runArtifactRefSchema, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, runLogEntrySchema, runLogLevelSchema, runLogLocationSchema, runLogPhaseSchema, runLogsConfigSchema, runManifestSchema, runSummarySchema, scoreTraceSchema, serializeCacheRecording, serializeCacheValue, serializedCacheSpanSchema, setEvalOutput, setScopeCacheContext, simulateLlmCallCost, simulateTokenAllocation, spanCacheOptionsSchema, sseEnvelopeSchema, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, traceAttributeDisplayFormatSchema, traceAttributeDisplayInputSchema, traceAttributeDisplayPlacementSchema, traceAttributeDisplaySchema, traceCacheRefSchema, traceDisplayConfigSchema, traceDisplayInputConfigSchema, traceSpanErrorSchema, traceSpanKindSchema, traceSpanSchema, traceSpanWarningSchema, trialSelectionModeSchema, updateManualScoreRequestSchema, z };
|