@ls-stack/agent-eval 0.58.4 → 0.58.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.d.mts CHANGED
@@ -405,10 +405,11 @@ type EvalTraceTree = {
405
405
  findSpan: (name: string) => EvalTraceSpan$2 | undefined; /** Return every span whose name exactly matches `name`. */
406
406
  findSpans: (name: string) => EvalTraceSpan$2[]; /** Return whether any span name exactly matches `name`. */
407
407
  hasSpan: (name: string) => boolean; /** Return every span whose kind exactly matches `kind`. */
408
- findSpansByKind: (kind: string) => EvalTraceSpan$2[]; /** Return every span with `kind: 'tool'`. */
409
- findToolCallSpans: () => EvalTraceSpan$2[]; /** Return the names of every span with `kind: 'tool'`. */
410
- listToolCallSpanNames: () => string[]; /** Return whether a `kind: 'tool'` span has a name exactly matching `name`. */
411
- hasToolCallSpan: (name: string) => boolean; /** Return span names in creation order, optionally filtered by kind. */
408
+ findSpansByKind: (kind: string) => EvalTraceSpan$2[]; /** Return every span with `kind: 'tool'` or `kind: 'tool_call'`. */
409
+ findToolCallSpans: () => EvalTraceSpan$2[]; /** Return the names of every span with `kind: 'tool'` or `kind: 'tool_call'`. */
410
+ listToolCallSpanNames: () => string[]; /** Return whether a tool-call span has a name exactly matching `name`. */
411
+ hasToolCallSpan: (name: string) => boolean; /** Return whether a tool-call span name appears exactly `expectedCalls` times. */
412
+ hasNToolCallSpans: (toolName: string, expectedCalls: number) => boolean; /** Return span names in creation order, optionally filtered by kind. */
412
413
  listSpanNames: (kind?: string) => string[]; /** Return span names in depth-first tree order, optionally filtered by kind. */
413
414
  listSpanNamesDfs: (kind?: string) => string[]; /** Return all spans in depth-first tree order. */
414
415
  flattenDfs: () => EvalTraceSpan$2[];
@@ -2241,10 +2242,10 @@ type EvalFreshnessStatus = z$1.infer<typeof evalFreshnessStatusSchema>;
2241
2242
  * `best` selects the highest finite value and `worst` selects the lowest.
2242
2243
  */
2243
2244
  declare const evalStatAggregateSchema: z$1.ZodEnum<{
2244
- min: "min";
2245
- max: "max";
2246
2245
  sum: "sum";
2247
2246
  avg: "avg";
2247
+ min: "min";
2248
+ max: "max";
2248
2249
  best: "best";
2249
2250
  worst: "worst";
2250
2251
  }>;
@@ -2273,10 +2274,10 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
2273
2274
  hideIfNoValue: z$1.ZodOptional<z$1.ZodBoolean>;
2274
2275
  kind: z$1.ZodLiteral<"duration">;
2275
2276
  aggregate: z$1.ZodOptional<z$1.ZodEnum<{
2276
- min: "min";
2277
- max: "max";
2278
2277
  sum: "sum";
2279
2278
  avg: "avg";
2279
+ min: "min";
2280
+ max: "max";
2280
2281
  best: "best";
2281
2282
  worst: "worst";
2282
2283
  }>>;
@@ -2284,10 +2285,10 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
2284
2285
  hideIfNoValue: z$1.ZodOptional<z$1.ZodBoolean>;
2285
2286
  kind: z$1.ZodLiteral<"cacheHits">;
2286
2287
  aggregate: z$1.ZodOptional<z$1.ZodEnum<{
2287
- min: "min";
2288
- max: "max";
2289
2288
  sum: "sum";
2290
2289
  avg: "avg";
2290
+ min: "min";
2291
+ max: "max";
2291
2292
  best: "best";
2292
2293
  worst: "worst";
2293
2294
  }>>;
@@ -2297,10 +2298,10 @@ declare const evalStatItemSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
2297
2298
  key: z$1.ZodString;
2298
2299
  label: z$1.ZodOptional<z$1.ZodString>;
2299
2300
  aggregate: z$1.ZodEnum<{
2300
- min: "min";
2301
- max: "max";
2302
2301
  sum: "sum";
2303
2302
  avg: "avg";
2303
+ min: "min";
2304
+ max: "max";
2304
2305
  best: "best";
2305
2306
  worst: "worst";
2306
2307
  }>;
@@ -2337,10 +2338,10 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
2337
2338
  hideIfNoValue: z$1.ZodOptional<z$1.ZodBoolean>;
2338
2339
  kind: z$1.ZodLiteral<"duration">;
2339
2340
  aggregate: z$1.ZodOptional<z$1.ZodEnum<{
2340
- min: "min";
2341
- max: "max";
2342
2341
  sum: "sum";
2343
2342
  avg: "avg";
2343
+ min: "min";
2344
+ max: "max";
2344
2345
  best: "best";
2345
2346
  worst: "worst";
2346
2347
  }>>;
@@ -2348,10 +2349,10 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
2348
2349
  hideIfNoValue: z$1.ZodOptional<z$1.ZodBoolean>;
2349
2350
  kind: z$1.ZodLiteral<"cacheHits">;
2350
2351
  aggregate: z$1.ZodOptional<z$1.ZodEnum<{
2351
- min: "min";
2352
- max: "max";
2353
2352
  sum: "sum";
2354
2353
  avg: "avg";
2354
+ min: "min";
2355
+ max: "max";
2355
2356
  best: "best";
2356
2357
  worst: "worst";
2357
2358
  }>>;
@@ -2361,10 +2362,10 @@ declare const evalStatsConfigSchema: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1
2361
2362
  key: z$1.ZodString;
2362
2363
  label: z$1.ZodOptional<z$1.ZodString>;
2363
2364
  aggregate: z$1.ZodEnum<{
2364
- min: "min";
2365
- max: "max";
2366
2365
  sum: "sum";
2367
2366
  avg: "avg";
2367
+ min: "min";
2368
+ max: "max";
2368
2369
  best: "best";
2369
2370
  worst: "worst";
2370
2371
  }>;
@@ -2464,10 +2465,10 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
2464
2465
  hideIfNoValue: z$1.ZodOptional<z$1.ZodBoolean>;
2465
2466
  kind: z$1.ZodLiteral<"duration">;
2466
2467
  aggregate: z$1.ZodOptional<z$1.ZodEnum<{
2467
- min: "min";
2468
- max: "max";
2469
2468
  sum: "sum";
2470
2469
  avg: "avg";
2470
+ min: "min";
2471
+ max: "max";
2471
2472
  best: "best";
2472
2473
  worst: "worst";
2473
2474
  }>>;
@@ -2475,10 +2476,10 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
2475
2476
  hideIfNoValue: z$1.ZodOptional<z$1.ZodBoolean>;
2476
2477
  kind: z$1.ZodLiteral<"cacheHits">;
2477
2478
  aggregate: z$1.ZodOptional<z$1.ZodEnum<{
2478
- min: "min";
2479
- max: "max";
2480
2479
  sum: "sum";
2481
2480
  avg: "avg";
2481
+ min: "min";
2482
+ max: "max";
2482
2483
  best: "best";
2483
2484
  worst: "worst";
2484
2485
  }>>;
@@ -2488,10 +2489,10 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
2488
2489
  key: z$1.ZodString;
2489
2490
  label: z$1.ZodOptional<z$1.ZodString>;
2490
2491
  aggregate: z$1.ZodEnum<{
2491
- min: "min";
2492
- max: "max";
2493
2492
  sum: "sum";
2494
2493
  avg: "avg";
2494
+ min: "min";
2495
+ max: "max";
2495
2496
  best: "best";
2496
2497
  worst: "worst";
2497
2498
  }>;
@@ -2515,10 +2516,10 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
2515
2516
  accent: z$1.ZodOptional<z$1.ZodBoolean>;
2516
2517
  }, z$1.core.$strip>], "kind">>>;
2517
2518
  defaultStatAggregate: z$1.ZodOptional<z$1.ZodEnum<{
2518
- min: "min";
2519
- max: "max";
2520
2519
  sum: "sum";
2521
2520
  avg: "avg";
2521
+ min: "min";
2522
+ max: "max";
2522
2523
  best: "best";
2523
2524
  worst: "worst";
2524
2525
  }>>;
@@ -2534,15 +2535,15 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
2534
2535
  metrics: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
2535
2536
  source: z$1.ZodLiteral<"builtin">;
2536
2537
  metric: z$1.ZodEnum<{
2537
- durationMs: "durationMs";
2538
2538
  passRate: "passRate";
2539
+ durationMs: "durationMs";
2539
2540
  }>;
2540
2541
  label: z$1.ZodOptional<z$1.ZodString>;
2541
2542
  color: z$1.ZodOptional<z$1.ZodEnum<{
2542
- error: "error";
2543
2543
  success: "success";
2544
- accent: "accent";
2544
+ error: "error";
2545
2545
  warning: "warning";
2546
+ accent: "accent";
2546
2547
  accentDim: "accentDim";
2547
2548
  textMuted: "textMuted";
2548
2549
  }>>;
@@ -2554,19 +2555,19 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
2554
2555
  source: z$1.ZodLiteral<"column">;
2555
2556
  key: z$1.ZodString;
2556
2557
  aggregate: z$1.ZodEnum<{
2557
- min: "min";
2558
- max: "max";
2559
2558
  sum: "sum";
2560
2559
  avg: "avg";
2560
+ min: "min";
2561
+ max: "max";
2561
2562
  latest: "latest";
2562
2563
  passThresholdRate: "passThresholdRate";
2563
2564
  }>;
2564
2565
  label: z$1.ZodOptional<z$1.ZodString>;
2565
2566
  color: z$1.ZodOptional<z$1.ZodEnum<{
2566
- error: "error";
2567
2567
  success: "success";
2568
- accent: "accent";
2568
+ error: "error";
2569
2569
  warning: "warning";
2570
+ accent: "accent";
2570
2571
  accentDim: "accentDim";
2571
2572
  textMuted: "textMuted";
2572
2573
  }>>;
@@ -2588,18 +2589,18 @@ declare const evalSummarySchema$1: z$1.ZodObject<{
2588
2589
  tooltipExtras: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
2589
2590
  source: z$1.ZodLiteral<"builtin">;
2590
2591
  metric: z$1.ZodEnum<{
2591
- durationMs: "durationMs";
2592
2592
  passRate: "passRate";
2593
+ durationMs: "durationMs";
2593
2594
  }>;
2594
2595
  label: z$1.ZodOptional<z$1.ZodString>;
2595
2596
  }, z$1.core.$strip>, z$1.ZodObject<{
2596
2597
  source: z$1.ZodLiteral<"column">;
2597
2598
  key: z$1.ZodString;
2598
2599
  aggregate: z$1.ZodEnum<{
2599
- min: "min";
2600
- max: "max";
2601
2600
  sum: "sum";
2602
2601
  avg: "avg";
2602
+ min: "min";
2603
+ max: "max";
2603
2604
  latest: "latest";
2604
2605
  passThresholdRate: "passThresholdRate";
2605
2606
  }>;
@@ -2698,9 +2699,9 @@ declare const caseRowSchema$1: z$1.ZodObject<{
2698
2699
  error: "error";
2699
2700
  running: "running";
2700
2701
  cancelled: "cancelled";
2701
- pending: "pending";
2702
2702
  pass: "pass";
2703
2703
  fail: "fail";
2704
+ pending: "pending";
2704
2705
  }>;
2705
2706
  durationMs: z$1.ZodNullable<z$1.ZodNumber>;
2706
2707
  cacheHits: z$1.ZodOptional<z$1.ZodNumber>;
@@ -2779,9 +2780,9 @@ declare const runLogLevelSchema: z$1.ZodEnum<{
2779
2780
  type RunLogLevel = z$1.infer<typeof runLogLevelSchema>;
2780
2781
  /** Eval runner phase that emitted a captured case log. */
2781
2782
  declare const runLogPhaseSchema: z$1.ZodEnum<{
2782
- tracingAssertions: "tracingAssertions";
2783
2783
  eval: "eval";
2784
2784
  derive: "derive";
2785
+ tracingAssertions: "tracingAssertions";
2785
2786
  outputsSchema: "outputsSchema";
2786
2787
  scorer: "scorer";
2787
2788
  }>;
@@ -2806,9 +2807,9 @@ declare const runLogEntrySchema: z$1.ZodObject<{
2806
2807
  warn: "warn";
2807
2808
  }>;
2808
2809
  phase: z$1.ZodEnum<{
2809
- tracingAssertions: "tracingAssertions";
2810
2810
  eval: "eval";
2811
2811
  derive: "derive";
2812
+ tracingAssertions: "tracingAssertions";
2812
2813
  outputsSchema: "outputsSchema";
2813
2814
  scorer: "scorer";
2814
2815
  }>;
@@ -2901,10 +2902,10 @@ declare const scoreTraceSchema: z$1.ZodObject<{
2901
2902
  namespace: z$1.ZodString;
2902
2903
  key: z$1.ZodString;
2903
2904
  status: z$1.ZodEnum<{
2904
- bypass: "bypass";
2905
- refresh: "refresh";
2906
2905
  hit: "hit";
2907
2906
  miss: "miss";
2907
+ refresh: "refresh";
2908
+ bypass: "bypass";
2908
2909
  }>;
2909
2910
  read: z$1.ZodOptional<z$1.ZodBoolean>;
2910
2911
  stored: z$1.ZodOptional<z$1.ZodBoolean>;
@@ -2925,9 +2926,9 @@ declare const caseDetailSchema$1: z$1.ZodObject<{
2925
2926
  error: "error";
2926
2927
  running: "running";
2927
2928
  cancelled: "cancelled";
2928
- pending: "pending";
2929
2929
  pass: "pass";
2930
2930
  fail: "fail";
2931
+ pending: "pending";
2931
2932
  }>;
2932
2933
  input: z$1.ZodUnknown;
2933
2934
  trace: z$1.ZodArray<z$1.ZodObject<{
@@ -3073,10 +3074,10 @@ declare const caseDetailSchema$1: z$1.ZodObject<{
3073
3074
  namespace: z$1.ZodString;
3074
3075
  key: z$1.ZodString;
3075
3076
  status: z$1.ZodEnum<{
3076
- bypass: "bypass";
3077
- refresh: "refresh";
3078
3077
  hit: "hit";
3079
3078
  miss: "miss";
3079
+ refresh: "refresh";
3080
+ bypass: "bypass";
3080
3081
  }>;
3081
3082
  read: z$1.ZodOptional<z$1.ZodBoolean>;
3082
3083
  stored: z$1.ZodOptional<z$1.ZodBoolean>;
@@ -3165,9 +3166,9 @@ declare const caseDetailSchema$1: z$1.ZodObject<{
3165
3166
  warn: "warn";
3166
3167
  }>;
3167
3168
  phase: z$1.ZodEnum<{
3168
- tracingAssertions: "tracingAssertions";
3169
3169
  eval: "eval";
3170
3170
  derive: "derive";
3171
+ tracingAssertions: "tracingAssertions";
3171
3172
  outputsSchema: "outputsSchema";
3172
3173
  scorer: "scorer";
3173
3174
  }>;
@@ -3194,10 +3195,10 @@ declare const caseDetailSchema$1: z$1.ZodObject<{
3194
3195
  namespace: z$1.ZodString;
3195
3196
  key: z$1.ZodString;
3196
3197
  status: z$1.ZodEnum<{
3197
- bypass: "bypass";
3198
- refresh: "refresh";
3199
3198
  hit: "hit";
3200
3199
  miss: "miss";
3200
+ refresh: "refresh";
3201
+ bypass: "bypass";
3201
3202
  }>;
3202
3203
  read: z$1.ZodOptional<z$1.ZodBoolean>;
3203
3204
  stored: z$1.ZodOptional<z$1.ZodBoolean>;
@@ -3240,8 +3241,8 @@ type EvalChartType = z$1.infer<typeof evalChartTypeSchema>;
3240
3241
  * than from a per-case column.
3241
3242
  */
3242
3243
  declare const evalChartBuiltinMetricSchema: z$1.ZodEnum<{
3243
- durationMs: "durationMs";
3244
3244
  passRate: "passRate";
3245
+ durationMs: "durationMs";
3245
3246
  }>;
3246
3247
  /**
3247
3248
  * Run-level metric sourced from the aggregated `RunSummary` for a run, rather
@@ -3250,10 +3251,10 @@ declare const evalChartBuiltinMetricSchema: z$1.ZodEnum<{
3250
3251
  type EvalChartBuiltinMetric = z$1.infer<typeof evalChartBuiltinMetricSchema>;
3251
3252
  /** Reducer applied to a numeric column across all cases of a single run. */
3252
3253
  declare const evalChartAggregateSchema: z$1.ZodEnum<{
3253
- min: "min";
3254
- max: "max";
3255
3254
  sum: "sum";
3256
3255
  avg: "avg";
3256
+ min: "min";
3257
+ max: "max";
3257
3258
  latest: "latest";
3258
3259
  passThresholdRate: "passThresholdRate";
3259
3260
  }>;
@@ -3264,10 +3265,10 @@ type EvalChartAggregate = z$1.infer<typeof evalChartAggregateSchema>;
3264
3265
  * not emit raw hex so authored evals stay decoupled from the web theme.
3265
3266
  */
3266
3267
  declare const evalChartColorSchema: z$1.ZodEnum<{
3267
- error: "error";
3268
3268
  success: "success";
3269
- accent: "accent";
3269
+ error: "error";
3270
3270
  warning: "warning";
3271
+ accent: "accent";
3271
3272
  accentDim: "accentDim";
3272
3273
  textMuted: "textMuted";
3273
3274
  }>;
@@ -3288,15 +3289,15 @@ type EvalChartAxis = z$1.infer<typeof evalChartAxisSchema>;
3288
3289
  declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
3289
3290
  source: z$1.ZodLiteral<"builtin">;
3290
3291
  metric: z$1.ZodEnum<{
3291
- durationMs: "durationMs";
3292
3292
  passRate: "passRate";
3293
+ durationMs: "durationMs";
3293
3294
  }>;
3294
3295
  label: z$1.ZodOptional<z$1.ZodString>;
3295
3296
  color: z$1.ZodOptional<z$1.ZodEnum<{
3296
- error: "error";
3297
3297
  success: "success";
3298
- accent: "accent";
3298
+ error: "error";
3299
3299
  warning: "warning";
3300
+ accent: "accent";
3300
3301
  accentDim: "accentDim";
3301
3302
  textMuted: "textMuted";
3302
3303
  }>>;
@@ -3308,19 +3309,19 @@ declare const evalChartMetricSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
3308
3309
  source: z$1.ZodLiteral<"column">;
3309
3310
  key: z$1.ZodString;
3310
3311
  aggregate: z$1.ZodEnum<{
3311
- min: "min";
3312
- max: "max";
3313
3312
  sum: "sum";
3314
3313
  avg: "avg";
3314
+ min: "min";
3315
+ max: "max";
3315
3316
  latest: "latest";
3316
3317
  passThresholdRate: "passThresholdRate";
3317
3318
  }>;
3318
3319
  label: z$1.ZodOptional<z$1.ZodString>;
3319
3320
  color: z$1.ZodOptional<z$1.ZodEnum<{
3320
- error: "error";
3321
3321
  success: "success";
3322
- accent: "accent";
3322
+ error: "error";
3323
3323
  warning: "warning";
3324
+ accent: "accent";
3324
3325
  accentDim: "accentDim";
3325
3326
  textMuted: "textMuted";
3326
3327
  }>>;
@@ -3335,18 +3336,18 @@ type EvalChartMetric = z$1.infer<typeof evalChartMetricSchema>;
3335
3336
  declare const evalChartTooltipExtraSchema: z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
3336
3337
  source: z$1.ZodLiteral<"builtin">;
3337
3338
  metric: z$1.ZodEnum<{
3338
- durationMs: "durationMs";
3339
3339
  passRate: "passRate";
3340
+ durationMs: "durationMs";
3340
3341
  }>;
3341
3342
  label: z$1.ZodOptional<z$1.ZodString>;
3342
3343
  }, z$1.core.$strip>, z$1.ZodObject<{
3343
3344
  source: z$1.ZodLiteral<"column">;
3344
3345
  key: z$1.ZodString;
3345
3346
  aggregate: z$1.ZodEnum<{
3346
- min: "min";
3347
- max: "max";
3348
3347
  sum: "sum";
3349
3348
  avg: "avg";
3349
+ min: "min";
3350
+ max: "max";
3350
3351
  latest: "latest";
3351
3352
  passThresholdRate: "passThresholdRate";
3352
3353
  }>;
@@ -3371,15 +3372,15 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
3371
3372
  metrics: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
3372
3373
  source: z$1.ZodLiteral<"builtin">;
3373
3374
  metric: z$1.ZodEnum<{
3374
- durationMs: "durationMs";
3375
3375
  passRate: "passRate";
3376
+ durationMs: "durationMs";
3376
3377
  }>;
3377
3378
  label: z$1.ZodOptional<z$1.ZodString>;
3378
3379
  color: z$1.ZodOptional<z$1.ZodEnum<{
3379
- error: "error";
3380
3380
  success: "success";
3381
- accent: "accent";
3381
+ error: "error";
3382
3382
  warning: "warning";
3383
+ accent: "accent";
3383
3384
  accentDim: "accentDim";
3384
3385
  textMuted: "textMuted";
3385
3386
  }>>;
@@ -3391,19 +3392,19 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
3391
3392
  source: z$1.ZodLiteral<"column">;
3392
3393
  key: z$1.ZodString;
3393
3394
  aggregate: z$1.ZodEnum<{
3394
- min: "min";
3395
- max: "max";
3396
3395
  sum: "sum";
3397
3396
  avg: "avg";
3397
+ min: "min";
3398
+ max: "max";
3398
3399
  latest: "latest";
3399
3400
  passThresholdRate: "passThresholdRate";
3400
3401
  }>;
3401
3402
  label: z$1.ZodOptional<z$1.ZodString>;
3402
3403
  color: z$1.ZodOptional<z$1.ZodEnum<{
3403
- error: "error";
3404
3404
  success: "success";
3405
- accent: "accent";
3405
+ error: "error";
3406
3406
  warning: "warning";
3407
+ accent: "accent";
3407
3408
  accentDim: "accentDim";
3408
3409
  textMuted: "textMuted";
3409
3410
  }>>;
@@ -3425,18 +3426,18 @@ declare const evalChartConfigSchema: z$1.ZodObject<{
3425
3426
  tooltipExtras: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
3426
3427
  source: z$1.ZodLiteral<"builtin">;
3427
3428
  metric: z$1.ZodEnum<{
3428
- durationMs: "durationMs";
3429
3429
  passRate: "passRate";
3430
+ durationMs: "durationMs";
3430
3431
  }>;
3431
3432
  label: z$1.ZodOptional<z$1.ZodString>;
3432
3433
  }, z$1.core.$strip>, z$1.ZodObject<{
3433
3434
  source: z$1.ZodLiteral<"column">;
3434
3435
  key: z$1.ZodString;
3435
3436
  aggregate: z$1.ZodEnum<{
3436
- min: "min";
3437
- max: "max";
3438
3437
  sum: "sum";
3439
3438
  avg: "avg";
3439
+ min: "min";
3440
+ max: "max";
3440
3441
  latest: "latest";
3441
3442
  passThresholdRate: "passThresholdRate";
3442
3443
  }>;
@@ -3461,15 +3462,15 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
3461
3462
  metrics: z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
3462
3463
  source: z$1.ZodLiteral<"builtin">;
3463
3464
  metric: z$1.ZodEnum<{
3464
- durationMs: "durationMs";
3465
3465
  passRate: "passRate";
3466
+ durationMs: "durationMs";
3466
3467
  }>;
3467
3468
  label: z$1.ZodOptional<z$1.ZodString>;
3468
3469
  color: z$1.ZodOptional<z$1.ZodEnum<{
3469
- error: "error";
3470
3470
  success: "success";
3471
- accent: "accent";
3471
+ error: "error";
3472
3472
  warning: "warning";
3473
+ accent: "accent";
3473
3474
  accentDim: "accentDim";
3474
3475
  textMuted: "textMuted";
3475
3476
  }>>;
@@ -3481,19 +3482,19 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
3481
3482
  source: z$1.ZodLiteral<"column">;
3482
3483
  key: z$1.ZodString;
3483
3484
  aggregate: z$1.ZodEnum<{
3484
- min: "min";
3485
- max: "max";
3486
3485
  sum: "sum";
3487
3486
  avg: "avg";
3487
+ min: "min";
3488
+ max: "max";
3488
3489
  latest: "latest";
3489
3490
  passThresholdRate: "passThresholdRate";
3490
3491
  }>;
3491
3492
  label: z$1.ZodOptional<z$1.ZodString>;
3492
3493
  color: z$1.ZodOptional<z$1.ZodEnum<{
3493
- error: "error";
3494
3494
  success: "success";
3495
- accent: "accent";
3495
+ error: "error";
3496
3496
  warning: "warning";
3497
+ accent: "accent";
3497
3498
  accentDim: "accentDim";
3498
3499
  textMuted: "textMuted";
3499
3500
  }>>;
@@ -3515,18 +3516,18 @@ declare const evalChartsConfigSchema: z$1.ZodArray<z$1.ZodObject<{
3515
3516
  tooltipExtras: z$1.ZodOptional<z$1.ZodArray<z$1.ZodDiscriminatedUnion<[z$1.ZodObject<{
3516
3517
  source: z$1.ZodLiteral<"builtin">;
3517
3518
  metric: z$1.ZodEnum<{
3518
- durationMs: "durationMs";
3519
3519
  passRate: "passRate";
3520
+ durationMs: "durationMs";
3520
3521
  }>;
3521
3522
  label: z$1.ZodOptional<z$1.ZodString>;
3522
3523
  }, z$1.core.$strip>, z$1.ZodObject<{
3523
3524
  source: z$1.ZodLiteral<"column">;
3524
3525
  key: z$1.ZodString;
3525
3526
  aggregate: z$1.ZodEnum<{
3526
- min: "min";
3527
- max: "max";
3528
3527
  sum: "sum";
3529
3528
  avg: "avg";
3529
+ min: "min";
3530
+ max: "max";
3530
3531
  latest: "latest";
3531
3532
  passThresholdRate: "passThresholdRate";
3532
3533
  }>;
@@ -3555,8 +3556,8 @@ declare const runManifestSchema$1: z$1.ZodObject<{
3555
3556
  target: z$1.ZodObject<{
3556
3557
  mode: z$1.ZodEnum<{
3557
3558
  all: "all";
3558
- evalIds: "evalIds";
3559
3559
  caseIds: "caseIds";
3560
+ evalIds: "evalIds";
3560
3561
  }>;
3561
3562
  evalKeys: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
3562
3563
  files: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
@@ -3570,9 +3571,9 @@ declare const runManifestSchema$1: z$1.ZodObject<{
3570
3571
  median: "median";
3571
3572
  }>>>;
3572
3573
  cacheMode: z$1.ZodOptional<z$1.ZodEnum<{
3573
- use: "use";
3574
- bypass: "bypass";
3575
3574
  refresh: "refresh";
3575
+ bypass: "bypass";
3576
+ use: "use";
3576
3577
  }>>;
3577
3578
  }, z$1.core.$strip>;
3578
3579
  /** Persisted lifecycle metadata for a single eval run. */
@@ -3668,8 +3669,8 @@ type TrialSelectionMode = z$1.infer<typeof trialSelectionModeSchema>;
3668
3669
  /** Built-in eval-level output/column keys. */
3669
3670
  /** Removal config for built-in eval-level outputs and UI metadata. */
3670
3671
  declare const removeDefaultConfigSchema: z$1.ZodUnion<readonly [z$1.ZodLiteral<true>, z$1.ZodArray<z$1.ZodEnum<{
3671
- apiCalls: "apiCalls";
3672
3672
  costUsd: "costUsd";
3673
+ apiCalls: "apiCalls";
3673
3674
  llmTurns: "llmTurns";
3674
3675
  inputTokens: "inputTokens";
3675
3676
  outputTokens: "outputTokens";
@@ -3694,10 +3695,11 @@ type EvalTraceTree$1 = {
3694
3695
  findSpan: (name: string) => EvalTraceSpan$1 | undefined; /** Return every span whose name exactly matches `name`. */
3695
3696
  findSpans: (name: string) => EvalTraceSpan$1[]; /** Return whether any span name exactly matches `name`. */
3696
3697
  hasSpan: (name: string) => boolean; /** Return every span whose kind exactly matches `kind`. */
3697
- findSpansByKind: (kind: string) => EvalTraceSpan$1[]; /** Return every span with `kind: 'tool'`. */
3698
- findToolCallSpans: () => EvalTraceSpan$1[]; /** Return the names of every span with `kind: 'tool'`. */
3699
- listToolCallSpanNames: () => string[]; /** Return whether a `kind: 'tool'` span has a name exactly matching `name`. */
3700
- hasToolCallSpan: (name: string) => boolean; /** Return span names in creation order, optionally filtered by kind. */
3698
+ findSpansByKind: (kind: string) => EvalTraceSpan$1[]; /** Return every span with `kind: 'tool'` or `kind: 'tool_call'`. */
3699
+ findToolCallSpans: () => EvalTraceSpan$1[]; /** Return the names of every span with `kind: 'tool'` or `kind: 'tool_call'`. */
3700
+ listToolCallSpanNames: () => string[]; /** Return whether a tool-call span has a name exactly matching `name`. */
3701
+ hasToolCallSpan: (name: string) => boolean; /** Return whether a tool-call span name appears exactly `expectedCalls` times. */
3702
+ hasNToolCallSpans: (toolName: string, expectedCalls: number) => boolean; /** Return span names in creation order, optionally filtered by kind. */
3701
3703
  listSpanNames: (kind?: string) => string[]; /** Return span names in depth-first tree order, optionally filtered by kind. */
3702
3704
  listSpanNamesDfs: (kind?: string) => string[]; /** Return all spans in depth-first tree order. */
3703
3705
  flattenDfs: () => EvalTraceSpan$1[];
@@ -4529,9 +4531,9 @@ declare function extractApiCalls(spans: EvalTraceSpan$1[], config: ResolvedApiCa
4529
4531
  * - `refresh`: never read, always write (forces re-execution and overwrites).
4530
4532
  */
4531
4533
  declare const cacheModeSchema: z$1.ZodEnum<{
4532
- use: "use";
4533
- bypass: "bypass";
4534
4534
  refresh: "refresh";
4535
+ bypass: "bypass";
4536
+ use: "use";
4535
4537
  }>;
4536
4538
  /** Mode controlling how cached spans behave during a run. */
4537
4539
  type CacheMode = z$1.infer<typeof cacheModeSchema>;
@@ -4545,17 +4547,17 @@ declare const spanCacheOptionsSchema: z$1.ZodObject<{
4545
4547
  type SpanCacheOptions = z$1.infer<typeof spanCacheOptionsSchema>;
4546
4548
  /** Category of operation stored in the eval cache. */
4547
4549
  declare const cacheOperationTypeSchema: z$1.ZodEnum<{
4548
- span: "span";
4549
4550
  value: "value";
4551
+ span: "span";
4550
4552
  }>;
4551
4553
  /** Category of operation stored in the eval cache. */
4552
4554
  type CacheOperationType = z$1.infer<typeof cacheOperationTypeSchema>;
4553
4555
  /** Status of a cache lookup recorded on a span or case scope. */
4554
4556
  declare const cacheStatusSchema: z$1.ZodEnum<{
4555
- bypass: "bypass";
4556
- refresh: "refresh";
4557
4557
  hit: "hit";
4558
4558
  miss: "miss";
4559
+ refresh: "refresh";
4560
+ bypass: "bypass";
4559
4561
  }>;
4560
4562
  /** Status of a cache lookup recorded on a span or case scope. */
4561
4563
  type CacheStatus = z$1.infer<typeof cacheStatusSchema>;
@@ -4572,10 +4574,10 @@ declare const traceCacheRefSchema: z$1.ZodObject<{
4572
4574
  namespace: z$1.ZodString;
4573
4575
  key: z$1.ZodString;
4574
4576
  status: z$1.ZodEnum<{
4575
- bypass: "bypass";
4576
- refresh: "refresh";
4577
4577
  hit: "hit";
4578
4578
  miss: "miss";
4579
+ refresh: "refresh";
4580
+ bypass: "bypass";
4579
4581
  }>;
4580
4582
  read: z$1.ZodOptional<z$1.ZodBoolean>;
4581
4583
  stored: z$1.ZodOptional<z$1.ZodBoolean>;
@@ -4771,8 +4773,8 @@ declare const cacheEntrySchema: z$1.ZodObject<{
4771
4773
  key: z$1.ZodString;
4772
4774
  namespace: z$1.ZodString;
4773
4775
  operationType: z$1.ZodOptional<z$1.ZodEnum<{
4774
- span: "span";
4775
4776
  value: "value";
4777
+ span: "span";
4776
4778
  }>>;
4777
4779
  operationName: z$1.ZodOptional<z$1.ZodString>;
4778
4780
  spanName: z$1.ZodOptional<z$1.ZodString>;
@@ -4878,8 +4880,8 @@ declare const cacheDebugKeyEntrySchema: z$1.ZodObject<{
4878
4880
  key: z$1.ZodString;
4879
4881
  namespace: z$1.ZodString;
4880
4882
  operationType: z$1.ZodEnum<{
4881
- span: "span";
4882
4883
  value: "value";
4884
+ span: "span";
4883
4885
  }>;
4884
4886
  operationName: z$1.ZodString;
4885
4887
  storedAt: z$1.ZodString;
@@ -4889,8 +4891,8 @@ declare const cacheDebugKeyEntrySchema: z$1.ZodObject<{
4889
4891
  key: z$1.ZodString;
4890
4892
  namespace: z$1.ZodString;
4891
4893
  operationType: z$1.ZodOptional<z$1.ZodEnum<{
4892
- span: "span";
4893
4894
  value: "value";
4895
+ span: "span";
4894
4896
  }>>;
4895
4897
  operationName: z$1.ZodOptional<z$1.ZodString>;
4896
4898
  spanName: z$1.ZodOptional<z$1.ZodString>;
@@ -4996,8 +4998,8 @@ declare const cacheEntryWithDebugKeySchema$1: z$1.ZodObject<{
4996
4998
  key: z$1.ZodString;
4997
4999
  namespace: z$1.ZodString;
4998
5000
  operationType: z$1.ZodOptional<z$1.ZodEnum<{
4999
- span: "span";
5000
5001
  value: "value";
5002
+ span: "span";
5001
5003
  }>>;
5002
5004
  operationName: z$1.ZodOptional<z$1.ZodString>;
5003
5005
  spanName: z$1.ZodOptional<z$1.ZodString>;
@@ -5094,8 +5096,8 @@ declare const cacheEntryWithDebugKeySchema$1: z$1.ZodObject<{
5094
5096
  key: z$1.ZodString;
5095
5097
  namespace: z$1.ZodString;
5096
5098
  operationType: z$1.ZodEnum<{
5097
- span: "span";
5098
5099
  value: "value";
5100
+ span: "span";
5099
5101
  }>;
5100
5102
  operationName: z$1.ZodString;
5101
5103
  storedAt: z$1.ZodString;
@@ -5105,8 +5107,8 @@ declare const cacheEntryWithDebugKeySchema$1: z$1.ZodObject<{
5105
5107
  key: z$1.ZodString;
5106
5108
  namespace: z$1.ZodString;
5107
5109
  operationType: z$1.ZodOptional<z$1.ZodEnum<{
5108
- span: "span";
5109
5110
  value: "value";
5111
+ span: "span";
5110
5112
  }>>;
5111
5113
  operationName: z$1.ZodOptional<z$1.ZodString>;
5112
5114
  spanName: z$1.ZodOptional<z$1.ZodString>;
@@ -5212,8 +5214,8 @@ declare const cacheFileSchema: z$1.ZodObject<{
5212
5214
  key: z$1.ZodString;
5213
5215
  namespace: z$1.ZodString;
5214
5216
  operationType: z$1.ZodOptional<z$1.ZodEnum<{
5215
- span: "span";
5216
5217
  value: "value";
5218
+ span: "span";
5217
5219
  }>>;
5218
5220
  operationName: z$1.ZodOptional<z$1.ZodString>;
5219
5221
  spanName: z$1.ZodOptional<z$1.ZodString>;
@@ -5318,8 +5320,8 @@ declare const cacheDebugKeyFileSchema: z$1.ZodObject<{
5318
5320
  key: z$1.ZodString;
5319
5321
  namespace: z$1.ZodString;
5320
5322
  operationType: z$1.ZodEnum<{
5321
- span: "span";
5322
5323
  value: "value";
5324
+ span: "span";
5323
5325
  }>;
5324
5326
  operationName: z$1.ZodString;
5325
5327
  storedAt: z$1.ZodString;
@@ -5329,8 +5331,8 @@ declare const cacheDebugKeyFileSchema: z$1.ZodObject<{
5329
5331
  key: z$1.ZodString;
5330
5332
  namespace: z$1.ZodString;
5331
5333
  operationType: z$1.ZodOptional<z$1.ZodEnum<{
5332
- span: "span";
5333
5334
  value: "value";
5335
+ span: "span";
5334
5336
  }>>;
5335
5337
  operationName: z$1.ZodOptional<z$1.ZodString>;
5336
5338
  spanName: z$1.ZodOptional<z$1.ZodString>;
@@ -5504,8 +5506,8 @@ type SseEnvelope = z$1.infer<typeof sseEnvelopeSchema$1>; //#endregion
5504
5506
  //#region src/schemas/api.d.ts
5505
5507
  /** Lifecycle state for an app config reload triggered by `agent-evals.config.ts`. */
5506
5508
  declare const configReloadStatusSchema: z$1.ZodEnum<{
5507
- idle: "idle";
5508
5509
  pending: "pending";
5510
+ idle: "idle";
5509
5511
  reloading: "reloading";
5510
5512
  }>;
5511
5513
  /** Status for config reloads in the long-running app server. */
@@ -5513,8 +5515,8 @@ type ConfigReloadStatus = z$1.infer<typeof configReloadStatusSchema>;
5513
5515
  /** UI/API-visible state for config reloads in `agent-evals app`. */
5514
5516
  declare const configReloadStateSchema$1: z$1.ZodObject<{
5515
5517
  status: z$1.ZodEnum<{
5516
- idle: "idle";
5517
5518
  pending: "pending";
5519
+ idle: "idle";
5518
5520
  reloading: "reloading";
5519
5521
  }>;
5520
5522
  activeRunCount: z$1.ZodNumber;
@@ -5528,8 +5530,8 @@ declare const createRunRequestSchema$1: z$1.ZodObject<{
5528
5530
  target: z$1.ZodObject<{
5529
5531
  mode: z$1.ZodEnum<{
5530
5532
  all: "all";
5531
- evalIds: "evalIds";
5532
5533
  caseIds: "caseIds";
5534
+ evalIds: "evalIds";
5533
5535
  }>;
5534
5536
  evalKeys: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
5535
5537
  files: z$1.ZodOptional<z$1.ZodArray<z$1.ZodString>>;
@@ -5541,9 +5543,9 @@ declare const createRunRequestSchema$1: z$1.ZodObject<{
5541
5543
  temporary: z$1.ZodOptional<z$1.ZodBoolean>;
5542
5544
  cache: z$1.ZodOptional<z$1.ZodObject<{
5543
5545
  mode: z$1.ZodDefault<z$1.ZodEnum<{
5544
- use: "use";
5545
- bypass: "bypass";
5546
5546
  refresh: "refresh";
5547
+ bypass: "bypass";
5548
+ use: "use";
5547
5549
  }>>;
5548
5550
  }, z$1.core.$strip>>;
5549
5551
  manualInputs: z$1.ZodOptional<z$1.ZodRecord<z$1.ZodString, z$1.ZodUnknown>>;