@ls-stack/agent-eval 0.60.1 → 0.60.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,7 +1,7 @@
1
- import { Et as getCaseRowCaseKey, Ot as caseRowSchema, dt as getEvalTitle, nt as updateManualScoreRequestSchema, rt as extractCacheEntries, tt as createRunRequestSchema } from "./runExecution-CjWJUUZ5.mjs";
2
- import { o as stageManualInputFile } from "./cli-CVBSlTD8.mjs";
3
- import "./src-DjOTPnDz.mjs";
4
- import { t as getRunnerInstance } from "./runner-DzDRasWV.mjs";
1
+ import { Et as getCaseRowCaseKey, Ot as caseRowSchema, dt as getEvalTitle, nt as updateManualScoreRequestSchema, rt as extractCacheEntries, tt as createRunRequestSchema } from "./runExecution-Bq0Y3y_1.mjs";
2
+ import { o as stageManualInputFile } from "./cli-CbePEEua.mjs";
3
+ import "./src-CVM_FqPx.mjs";
4
+ import { t as getRunnerInstance } from "./runner-Kp0JqxrU.mjs";
5
5
  import { z } from "zod";
6
6
  import { resultify } from "t-result";
7
7
  import { readFile } from "node:fs/promises";
package/dist/bin.mjs CHANGED
@@ -1,5 +1,5 @@
1
1
  #!/usr/bin/env node
2
- import { t as runCli } from "./cli-CVBSlTD8.mjs";
2
+ import { t as runCli } from "./cli-CbePEEua.mjs";
3
3
  import { spawn } from "node:child_process";
4
4
  //#region src/bin.ts
5
5
  const moduleMocksFlag = "--experimental-test-module-mocks";
@@ -1,4 +1,4 @@
1
- import { Ct as resolveLlmCallsConfig, It as runWithEvalRegistry, J as runInEvalRuntimeScope, L as configureEvalRunLogs, St as resolveApiCallsConfig, _ as createBufferedCacheStore, a as isCaseChildParentMessage, d as loadEvalModule, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, r as runCase, v as createFsCacheStore, y as getCacheRetentionOptions } from "./runExecution-CjWJUUZ5.mjs";
1
+ import { Ct as resolveLlmCallsConfig, It as runWithEvalRegistry, J as runInEvalRuntimeScope, L as configureEvalRunLogs, St as resolveApiCallsConfig, _ as createBufferedCacheStore, a as isCaseChildParentMessage, d as loadEvalModule, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, r as runCase, v as createFsCacheStore, y as getCacheRetentionOptions } from "./runExecution-Bq0Y3y_1.mjs";
2
2
  //#region ../runner/src/caseChild.ts
3
3
  let fatalErrorReported = false;
4
4
  let disconnectExpected = false;
@@ -1,5 +1,5 @@
1
- import { Ct as resolveLlmCallsConfig, Et as getCaseRowCaseKey, Ft as getEvalRegistry, Ot as caseRowSchema, St as resolveApiCallsConfig, Tt as buildEvalKey, _t as matchesTagsFilter, c as resolveArtifactPath, dt as getEvalTitle, f as resolveEvalDefaultConfig, ft as getEvalDisplayStatus, h as normalizeScoreDef, lt as applyDerivedCallAttributes, m as buildDeclaredColumnDefs, o as stripTerminalControlCodes, p as loadConfig, pt as deriveScopedSummaryFromCases, s as resolveTracePresentation, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-CjWJUUZ5.mjs";
2
- import { C as validateCharts, S as parseEvalDiscovery, _ as runTouchesEval, a as validateTagsFilters, b as deriveEvalFreshness, c as getLatestRunInfos, d as nextShortIdFromSnapshots, f as persistCaseDetail, g as recomputePersistedCaseStatus, h as recomputeEvalStatusesInRuns, i as resolveEvalTags, l as loadPersistedRunSnapshot, m as persistRunState, n as getTargetEvalKeys, o as generateRunId, p as deleteTemporaryRuns, s as getLastRunStatuses, u as loadPersistedRunSnapshots, v as buildManualInputDescriptor, x as loadIsolatedEvalRegistry, y as parseManualInputValues } from "./runOrchestration-DE2TFAS6.mjs";
1
+ import { Ct as resolveLlmCallsConfig, Et as getCaseRowCaseKey, Ft as getEvalRegistry, Ot as caseRowSchema, St as resolveApiCallsConfig, Tt as buildEvalKey, _t as matchesTagsFilter, c as resolveArtifactPath, dt as getEvalTitle, f as resolveEvalDefaultConfig, ft as getEvalDisplayStatus, h as normalizeScoreDef, lt as applyDerivedCallAttributes, m as buildDeclaredColumnDefs, o as stripTerminalControlCodes, p as loadConfig, pt as deriveScopedSummaryFromCases, s as resolveTracePresentation, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-Bq0Y3y_1.mjs";
2
+ import { C as validateCharts, S as parseEvalDiscovery, _ as runTouchesEval, a as validateTagsFilters, b as deriveEvalFreshness, c as getLatestRunInfos, d as nextShortIdFromSnapshots, f as persistCaseDetail, g as recomputePersistedCaseStatus, h as recomputeEvalStatusesInRuns, i as resolveEvalTags, l as loadPersistedRunSnapshot, m as persistRunState, n as getTargetEvalKeys, o as generateRunId, p as deleteTemporaryRuns, s as getLastRunStatuses, u as loadPersistedRunSnapshots, v as buildManualInputDescriptor, x as loadIsolatedEvalRegistry, y as parseManualInputValues } from "./runOrchestration-BpwW0AmB.mjs";
3
3
  import { parseEnv } from "node:util";
4
4
  import { resultify } from "t-result";
5
5
  import { copyFile, mkdir, readFile, rm, writeFile } from "node:fs/promises";
@@ -2232,8 +2232,8 @@ async function commandApp(args) {
2232
2232
  const { serve } = await import("@hono/node-server");
2233
2233
  const bundledWebDist = resolve(currentDir, "apps/web/dist");
2234
2234
  if (existsSync(bundledWebDist)) process.env.AGENT_EVALS_WEB_DIST = bundledWebDist;
2235
- const appModule = await import("./app-CxKEVlng.mjs");
2236
- const runnerModule = await import("./runner-Cu1CQPTB.mjs");
2235
+ const appModule = await import("./app-DPCFFkyQ.mjs");
2236
+ const runnerModule = await import("./runner-XEP21_u9.mjs");
2237
2237
  if (!isHonoAppModule(appModule)) throw new Error("Server app module is invalid");
2238
2238
  if (!isServerRunnerModule(runnerModule)) throw new Error("Server runner module is invalid");
2239
2239
  await runnerModule.initRunner({ loadEnv: args.loadEnv });
package/dist/index.d.mts CHANGED
@@ -1941,10 +1941,10 @@ type ColumnKind = z.infer<typeof columnKindSchema>;
1941
1941
  declare const columnFormatSchema: z.ZodEnum<{
1942
1942
  number: "number";
1943
1943
  boolean: "boolean";
1944
- duration: "duration";
1945
- json: "json";
1946
1944
  file: "file";
1945
+ duration: "duration";
1947
1946
  markdown: "markdown";
1947
+ json: "json";
1948
1948
  image: "image";
1949
1949
  html: "html";
1950
1950
  pdf: "pdf";
@@ -1968,10 +1968,10 @@ declare const columnDefSchema: z.ZodObject<{
1968
1968
  format: z.ZodOptional<z.ZodEnum<{
1969
1969
  number: "number";
1970
1970
  boolean: "boolean";
1971
- duration: "duration";
1972
- json: "json";
1973
1971
  file: "file";
1972
+ duration: "duration";
1974
1973
  markdown: "markdown";
1974
+ json: "json";
1975
1975
  image: "image";
1976
1976
  html: "html";
1977
1977
  pdf: "pdf";
@@ -2061,9 +2061,9 @@ declare const traceAttributeDisplaySchema: z.ZodObject<{
2061
2061
  subtree: "subtree";
2062
2062
  }>>;
2063
2063
  mode: z.ZodOptional<z.ZodEnum<{
2064
+ sum: "sum";
2064
2065
  all: "all";
2065
2066
  last: "last";
2066
- sum: "sum";
2067
2067
  }>>;
2068
2068
  }, z.core.$strip>;
2069
2069
  /**
@@ -2097,9 +2097,9 @@ declare const traceDisplayConfigSchema: z.ZodObject<{
2097
2097
  subtree: "subtree";
2098
2098
  }>>;
2099
2099
  mode: z.ZodOptional<z.ZodEnum<{
2100
+ sum: "sum";
2100
2101
  all: "all";
2101
2102
  last: "last";
2102
- sum: "sum";
2103
2103
  }>>;
2104
2104
  }, z.core.$strip>>>;
2105
2105
  }, z.core.$strip>;
@@ -2137,9 +2137,9 @@ declare const traceAttributeDisplayInputSchema: z.ZodObject<{
2137
2137
  subtree: "subtree";
2138
2138
  }>>;
2139
2139
  mode: z.ZodOptional<z.ZodEnum<{
2140
+ sum: "sum";
2140
2141
  all: "all";
2141
2142
  last: "last";
2142
- sum: "sum";
2143
2143
  }>>;
2144
2144
  transform: z.ZodOptional<z.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
2145
2145
  }, z.core.$strip>;
@@ -2175,9 +2175,9 @@ declare const traceDisplayInputConfigSchema: z.ZodObject<{
2175
2175
  subtree: "subtree";
2176
2176
  }>>;
2177
2177
  mode: z.ZodOptional<z.ZodEnum<{
2178
+ sum: "sum";
2178
2179
  all: "all";
2179
2180
  last: "last";
2180
- sum: "sum";
2181
2181
  }>>;
2182
2182
  transform: z.ZodOptional<z.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
2183
2183
  }, z.core.$strip>>>;
@@ -2214,8 +2214,8 @@ declare const traceSpanSchema$1: z.ZodObject<{
2214
2214
  status: z.ZodEnum<{
2215
2215
  error: "error";
2216
2216
  running: "running";
2217
- ok: "ok";
2218
2217
  cancelled: "cancelled";
2218
+ ok: "ok";
2219
2219
  }>;
2220
2220
  attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
2221
2221
  error: z.ZodOptional<z.ZodObject<{
@@ -2260,10 +2260,10 @@ type EvalFreshnessStatus = z.infer<typeof evalFreshnessStatusSchema>;
2260
2260
  * `best` selects the highest finite value and `worst` selects the lowest.
2261
2261
  */
2262
2262
  declare const evalStatAggregateSchema: z.ZodEnum<{
2263
- sum: "sum";
2264
2263
  avg: "avg";
2265
2264
  min: "min";
2266
2265
  max: "max";
2266
+ sum: "sum";
2267
2267
  best: "best";
2268
2268
  worst: "worst";
2269
2269
  }>;
@@ -2292,10 +2292,10 @@ declare const evalStatItemSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
2292
2292
  hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
2293
2293
  kind: z.ZodLiteral<"duration">;
2294
2294
  aggregate: z.ZodOptional<z.ZodEnum<{
2295
- sum: "sum";
2296
2295
  avg: "avg";
2297
2296
  min: "min";
2298
2297
  max: "max";
2298
+ sum: "sum";
2299
2299
  best: "best";
2300
2300
  worst: "worst";
2301
2301
  }>>;
@@ -2303,10 +2303,10 @@ declare const evalStatItemSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
2303
2303
  hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
2304
2304
  kind: z.ZodLiteral<"cacheHits">;
2305
2305
  aggregate: z.ZodOptional<z.ZodEnum<{
2306
- sum: "sum";
2307
2306
  avg: "avg";
2308
2307
  min: "min";
2309
2308
  max: "max";
2309
+ sum: "sum";
2310
2310
  best: "best";
2311
2311
  worst: "worst";
2312
2312
  }>>;
@@ -2316,20 +2316,20 @@ declare const evalStatItemSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
2316
2316
  key: z.ZodString;
2317
2317
  label: z.ZodOptional<z.ZodString>;
2318
2318
  aggregate: z.ZodEnum<{
2319
- sum: "sum";
2320
2319
  avg: "avg";
2321
2320
  min: "min";
2322
2321
  max: "max";
2322
+ sum: "sum";
2323
2323
  best: "best";
2324
2324
  worst: "worst";
2325
2325
  }>;
2326
2326
  format: z.ZodOptional<z.ZodEnum<{
2327
2327
  number: "number";
2328
2328
  boolean: "boolean";
2329
- duration: "duration";
2330
- json: "json";
2331
2329
  file: "file";
2330
+ duration: "duration";
2332
2331
  markdown: "markdown";
2332
+ json: "json";
2333
2333
  image: "image";
2334
2334
  html: "html";
2335
2335
  pdf: "pdf";
@@ -2356,10 +2356,10 @@ declare const evalStatsConfigSchema: z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodOb
2356
2356
  hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
2357
2357
  kind: z.ZodLiteral<"duration">;
2358
2358
  aggregate: z.ZodOptional<z.ZodEnum<{
2359
- sum: "sum";
2360
2359
  avg: "avg";
2361
2360
  min: "min";
2362
2361
  max: "max";
2362
+ sum: "sum";
2363
2363
  best: "best";
2364
2364
  worst: "worst";
2365
2365
  }>>;
@@ -2367,10 +2367,10 @@ declare const evalStatsConfigSchema: z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodOb
2367
2367
  hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
2368
2368
  kind: z.ZodLiteral<"cacheHits">;
2369
2369
  aggregate: z.ZodOptional<z.ZodEnum<{
2370
- sum: "sum";
2371
2370
  avg: "avg";
2372
2371
  min: "min";
2373
2372
  max: "max";
2373
+ sum: "sum";
2374
2374
  best: "best";
2375
2375
  worst: "worst";
2376
2376
  }>>;
@@ -2380,20 +2380,20 @@ declare const evalStatsConfigSchema: z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodOb
2380
2380
  key: z.ZodString;
2381
2381
  label: z.ZodOptional<z.ZodString>;
2382
2382
  aggregate: z.ZodEnum<{
2383
- sum: "sum";
2384
2383
  avg: "avg";
2385
2384
  min: "min";
2386
2385
  max: "max";
2386
+ sum: "sum";
2387
2387
  best: "best";
2388
2388
  worst: "worst";
2389
2389
  }>;
2390
2390
  format: z.ZodOptional<z.ZodEnum<{
2391
2391
  number: "number";
2392
2392
  boolean: "boolean";
2393
- duration: "duration";
2394
- json: "json";
2395
2393
  file: "file";
2394
+ duration: "duration";
2396
2395
  markdown: "markdown";
2396
+ json: "json";
2397
2397
  image: "image";
2398
2398
  html: "html";
2399
2399
  pdf: "pdf";
@@ -2436,10 +2436,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
2436
2436
  format: z.ZodOptional<z.ZodEnum<{
2437
2437
  number: "number";
2438
2438
  boolean: "boolean";
2439
- duration: "duration";
2440
- json: "json";
2441
2439
  file: "file";
2440
+ duration: "duration";
2442
2441
  markdown: "markdown";
2442
+ json: "json";
2443
2443
  image: "image";
2444
2444
  html: "html";
2445
2445
  pdf: "pdf";
@@ -2466,10 +2466,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
2466
2466
  caseIds: z.ZodOptional<z.ZodArray<z.ZodString>>;
2467
2467
  lastRunStatus: z.ZodNullable<z.ZodEnum<{
2468
2468
  error: "error";
2469
- running: "running";
2470
- cancelled: "cancelled";
2471
2469
  pass: "pass";
2472
2470
  fail: "fail";
2471
+ running: "running";
2472
+ cancelled: "cancelled";
2473
2473
  unscored: "unscored";
2474
2474
  }>>;
2475
2475
  stats: z.ZodOptional<z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodObject<{
@@ -2483,10 +2483,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
2483
2483
  hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
2484
2484
  kind: z.ZodLiteral<"duration">;
2485
2485
  aggregate: z.ZodOptional<z.ZodEnum<{
2486
- sum: "sum";
2487
2486
  avg: "avg";
2488
2487
  min: "min";
2489
2488
  max: "max";
2489
+ sum: "sum";
2490
2490
  best: "best";
2491
2491
  worst: "worst";
2492
2492
  }>>;
@@ -2494,10 +2494,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
2494
2494
  hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
2495
2495
  kind: z.ZodLiteral<"cacheHits">;
2496
2496
  aggregate: z.ZodOptional<z.ZodEnum<{
2497
- sum: "sum";
2498
2497
  avg: "avg";
2499
2498
  min: "min";
2500
2499
  max: "max";
2500
+ sum: "sum";
2501
2501
  best: "best";
2502
2502
  worst: "worst";
2503
2503
  }>>;
@@ -2507,20 +2507,20 @@ declare const evalSummarySchema$1: z.ZodObject<{
2507
2507
  key: z.ZodString;
2508
2508
  label: z.ZodOptional<z.ZodString>;
2509
2509
  aggregate: z.ZodEnum<{
2510
- sum: "sum";
2511
2510
  avg: "avg";
2512
2511
  min: "min";
2513
2512
  max: "max";
2513
+ sum: "sum";
2514
2514
  best: "best";
2515
2515
  worst: "worst";
2516
2516
  }>;
2517
2517
  format: z.ZodOptional<z.ZodEnum<{
2518
2518
  number: "number";
2519
2519
  boolean: "boolean";
2520
- duration: "duration";
2521
- json: "json";
2522
2520
  file: "file";
2521
+ duration: "duration";
2523
2522
  markdown: "markdown";
2523
+ json: "json";
2524
2524
  image: "image";
2525
2525
  html: "html";
2526
2526
  pdf: "pdf";
@@ -2534,10 +2534,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
2534
2534
  accent: z.ZodOptional<z.ZodBoolean>;
2535
2535
  }, z.core.$strip>], "kind">>>;
2536
2536
  defaultStatAggregate: z.ZodOptional<z.ZodEnum<{
2537
- sum: "sum";
2538
2537
  avg: "avg";
2539
2538
  min: "min";
2540
2539
  max: "max";
2540
+ sum: "sum";
2541
2541
  best: "best";
2542
2542
  worst: "worst";
2543
2543
  }>>;
@@ -2558,11 +2558,11 @@ declare const evalSummarySchema$1: z.ZodObject<{
2558
2558
  }>;
2559
2559
  label: z.ZodOptional<z.ZodString>;
2560
2560
  color: z.ZodOptional<z.ZodEnum<{
2561
- error: "error";
2562
2561
  success: "success";
2563
- warning: "warning";
2564
2562
  accent: "accent";
2563
+ error: "error";
2565
2564
  accentDim: "accentDim";
2565
+ warning: "warning";
2566
2566
  textMuted: "textMuted";
2567
2567
  }>>;
2568
2568
  axis: z.ZodOptional<z.ZodEnum<{
@@ -2573,20 +2573,20 @@ declare const evalSummarySchema$1: z.ZodObject<{
2573
2573
  source: z.ZodLiteral<"column">;
2574
2574
  key: z.ZodString;
2575
2575
  aggregate: z.ZodEnum<{
2576
- sum: "sum";
2577
2576
  avg: "avg";
2578
2577
  min: "min";
2579
2578
  max: "max";
2579
+ sum: "sum";
2580
2580
  latest: "latest";
2581
2581
  passThresholdRate: "passThresholdRate";
2582
2582
  }>;
2583
2583
  label: z.ZodOptional<z.ZodString>;
2584
2584
  color: z.ZodOptional<z.ZodEnum<{
2585
- error: "error";
2586
2585
  success: "success";
2587
- warning: "warning";
2588
2586
  accent: "accent";
2587
+ error: "error";
2589
2588
  accentDim: "accentDim";
2589
+ warning: "warning";
2590
2590
  textMuted: "textMuted";
2591
2591
  }>>;
2592
2592
  axis: z.ZodOptional<z.ZodEnum<{
@@ -2615,10 +2615,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
2615
2615
  source: z.ZodLiteral<"column">;
2616
2616
  key: z.ZodString;
2617
2617
  aggregate: z.ZodEnum<{
2618
- sum: "sum";
2619
2618
  avg: "avg";
2620
2619
  min: "min";
2621
2620
  max: "max";
2621
+ sum: "sum";
2622
2622
  latest: "latest";
2623
2623
  passThresholdRate: "passThresholdRate";
2624
2624
  }>;
@@ -2715,10 +2715,10 @@ declare const caseRowSchema$1: z.ZodObject<{
2715
2715
  tags: z.ZodOptional<z.ZodArray<z.ZodString>>;
2716
2716
  status: z.ZodEnum<{
2717
2717
  error: "error";
2718
- running: "running";
2719
- cancelled: "cancelled";
2720
2718
  pass: "pass";
2721
2719
  fail: "fail";
2720
+ running: "running";
2721
+ cancelled: "cancelled";
2722
2722
  pending: "pending";
2723
2723
  }>;
2724
2724
  durationMs: z.ZodNullable<z.ZodNumber>;
@@ -2748,10 +2748,10 @@ declare const caseRowSchema$1: z.ZodObject<{
2748
2748
  format: z.ZodOptional<z.ZodEnum<{
2749
2749
  number: "number";
2750
2750
  boolean: "boolean";
2751
- duration: "duration";
2752
- json: "json";
2753
2751
  file: "file";
2752
+ duration: "duration";
2754
2753
  markdown: "markdown";
2754
+ json: "json";
2755
2755
  image: "image";
2756
2756
  html: "html";
2757
2757
  pdf: "pdf";
@@ -2857,8 +2857,8 @@ declare const scoreTraceSchema: z.ZodObject<{
2857
2857
  status: z.ZodEnum<{
2858
2858
  error: "error";
2859
2859
  running: "running";
2860
- ok: "ok";
2861
2860
  cancelled: "cancelled";
2861
+ ok: "ok";
2862
2862
  }>;
2863
2863
  attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
2864
2864
  error: z.ZodOptional<z.ZodObject<{
@@ -2908,9 +2908,9 @@ declare const scoreTraceSchema: z.ZodObject<{
2908
2908
  subtree: "subtree";
2909
2909
  }>>;
2910
2910
  mode: z.ZodOptional<z.ZodEnum<{
2911
+ sum: "sum";
2911
2912
  all: "all";
2912
2913
  last: "last";
2913
- sum: "sum";
2914
2914
  }>>;
2915
2915
  }, z.core.$strip>>>;
2916
2916
  }, z.core.$strip>;
@@ -2942,10 +2942,10 @@ declare const caseDetailSchema$1: z.ZodObject<{
2942
2942
  tags: z.ZodOptional<z.ZodArray<z.ZodString>>;
2943
2943
  status: z.ZodEnum<{
2944
2944
  error: "error";
2945
- running: "running";
2946
- cancelled: "cancelled";
2947
2945
  pass: "pass";
2948
2946
  fail: "fail";
2947
+ running: "running";
2948
+ cancelled: "cancelled";
2949
2949
  pending: "pending";
2950
2950
  }>;
2951
2951
  input: z.ZodUnknown;
@@ -2960,8 +2960,8 @@ declare const caseDetailSchema$1: z.ZodObject<{
2960
2960
  status: z.ZodEnum<{
2961
2961
  error: "error";
2962
2962
  running: "running";
2963
- ok: "ok";
2964
2963
  cancelled: "cancelled";
2964
+ ok: "ok";
2965
2965
  }>;
2966
2966
  attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
2967
2967
  error: z.ZodOptional<z.ZodObject<{
@@ -3011,9 +3011,9 @@ declare const caseDetailSchema$1: z.ZodObject<{
3011
3011
  subtree: "subtree";
3012
3012
  }>>;
3013
3013
  mode: z.ZodOptional<z.ZodEnum<{
3014
+ sum: "sum";
3014
3015
  all: "all";
3015
3016
  last: "last";
3016
- sum: "sum";
3017
3017
  }>>;
3018
3018
  }, z.core.$strip>>>;
3019
3019
  }, z.core.$strip>;
@@ -3029,8 +3029,8 @@ declare const caseDetailSchema$1: z.ZodObject<{
3029
3029
  status: z.ZodEnum<{
3030
3030
  error: "error";
3031
3031
  running: "running";
3032
- ok: "ok";
3033
3032
  cancelled: "cancelled";
3033
+ ok: "ok";
3034
3034
  }>;
3035
3035
  attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
3036
3036
  error: z.ZodOptional<z.ZodObject<{
@@ -3080,9 +3080,9 @@ declare const caseDetailSchema$1: z.ZodObject<{
3080
3080
  subtree: "subtree";
3081
3081
  }>>;
3082
3082
  mode: z.ZodOptional<z.ZodEnum<{
3083
+ sum: "sum";
3083
3084
  all: "all";
3084
3085
  last: "last";
3085
- sum: "sum";
3086
3086
  }>>;
3087
3087
  }, z.core.$strip>>>;
3088
3088
  }, z.core.$strip>;
@@ -3126,10 +3126,10 @@ declare const caseDetailSchema$1: z.ZodObject<{
3126
3126
  format: z.ZodOptional<z.ZodEnum<{
3127
3127
  number: "number";
3128
3128
  boolean: "boolean";
3129
- duration: "duration";
3130
- json: "json";
3131
3129
  file: "file";
3130
+ duration: "duration";
3132
3131
  markdown: "markdown";
3132
+ json: "json";
3133
3133
  image: "image";
3134
3134
  html: "html";
3135
3135
  pdf: "pdf";
@@ -3269,10 +3269,10 @@ declare const evalChartBuiltinMetricSchema: z.ZodEnum<{
3269
3269
  type EvalChartBuiltinMetric = z.infer<typeof evalChartBuiltinMetricSchema>;
3270
3270
  /** Reducer applied to a numeric column across all cases of a single run. */
3271
3271
  declare const evalChartAggregateSchema: z.ZodEnum<{
3272
- sum: "sum";
3273
3272
  avg: "avg";
3274
3273
  min: "min";
3275
3274
  max: "max";
3275
+ sum: "sum";
3276
3276
  latest: "latest";
3277
3277
  passThresholdRate: "passThresholdRate";
3278
3278
  }>;
@@ -3283,11 +3283,11 @@ type EvalChartAggregate = z.infer<typeof evalChartAggregateSchema>;
3283
3283
  * not emit raw hex so authored evals stay decoupled from the web theme.
3284
3284
  */
3285
3285
  declare const evalChartColorSchema: z.ZodEnum<{
3286
- error: "error";
3287
3286
  success: "success";
3288
- warning: "warning";
3289
3287
  accent: "accent";
3288
+ error: "error";
3290
3289
  accentDim: "accentDim";
3290
+ warning: "warning";
3291
3291
  textMuted: "textMuted";
3292
3292
  }>;
3293
3293
  /** Semantic color token resolved to a theme color by the web UI. */
@@ -3312,11 +3312,11 @@ declare const evalChartMetricSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
3312
3312
  }>;
3313
3313
  label: z.ZodOptional<z.ZodString>;
3314
3314
  color: z.ZodOptional<z.ZodEnum<{
3315
- error: "error";
3316
3315
  success: "success";
3317
- warning: "warning";
3318
3316
  accent: "accent";
3317
+ error: "error";
3319
3318
  accentDim: "accentDim";
3319
+ warning: "warning";
3320
3320
  textMuted: "textMuted";
3321
3321
  }>>;
3322
3322
  axis: z.ZodOptional<z.ZodEnum<{
@@ -3327,20 +3327,20 @@ declare const evalChartMetricSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
3327
3327
  source: z.ZodLiteral<"column">;
3328
3328
  key: z.ZodString;
3329
3329
  aggregate: z.ZodEnum<{
3330
- sum: "sum";
3331
3330
  avg: "avg";
3332
3331
  min: "min";
3333
3332
  max: "max";
3333
+ sum: "sum";
3334
3334
  latest: "latest";
3335
3335
  passThresholdRate: "passThresholdRate";
3336
3336
  }>;
3337
3337
  label: z.ZodOptional<z.ZodString>;
3338
3338
  color: z.ZodOptional<z.ZodEnum<{
3339
- error: "error";
3340
3339
  success: "success";
3341
- warning: "warning";
3342
3340
  accent: "accent";
3341
+ error: "error";
3343
3342
  accentDim: "accentDim";
3343
+ warning: "warning";
3344
3344
  textMuted: "textMuted";
3345
3345
  }>>;
3346
3346
  axis: z.ZodOptional<z.ZodEnum<{
@@ -3362,10 +3362,10 @@ declare const evalChartTooltipExtraSchema: z.ZodDiscriminatedUnion<[z.ZodObject<
3362
3362
  source: z.ZodLiteral<"column">;
3363
3363
  key: z.ZodString;
3364
3364
  aggregate: z.ZodEnum<{
3365
- sum: "sum";
3366
3365
  avg: "avg";
3367
3366
  min: "min";
3368
3367
  max: "max";
3368
+ sum: "sum";
3369
3369
  latest: "latest";
3370
3370
  passThresholdRate: "passThresholdRate";
3371
3371
  }>;
@@ -3395,11 +3395,11 @@ declare const evalChartConfigSchema: z.ZodObject<{
3395
3395
  }>;
3396
3396
  label: z.ZodOptional<z.ZodString>;
3397
3397
  color: z.ZodOptional<z.ZodEnum<{
3398
- error: "error";
3399
3398
  success: "success";
3400
- warning: "warning";
3401
3399
  accent: "accent";
3400
+ error: "error";
3402
3401
  accentDim: "accentDim";
3402
+ warning: "warning";
3403
3403
  textMuted: "textMuted";
3404
3404
  }>>;
3405
3405
  axis: z.ZodOptional<z.ZodEnum<{
@@ -3410,20 +3410,20 @@ declare const evalChartConfigSchema: z.ZodObject<{
3410
3410
  source: z.ZodLiteral<"column">;
3411
3411
  key: z.ZodString;
3412
3412
  aggregate: z.ZodEnum<{
3413
- sum: "sum";
3414
3413
  avg: "avg";
3415
3414
  min: "min";
3416
3415
  max: "max";
3416
+ sum: "sum";
3417
3417
  latest: "latest";
3418
3418
  passThresholdRate: "passThresholdRate";
3419
3419
  }>;
3420
3420
  label: z.ZodOptional<z.ZodString>;
3421
3421
  color: z.ZodOptional<z.ZodEnum<{
3422
- error: "error";
3423
3422
  success: "success";
3424
- warning: "warning";
3425
3423
  accent: "accent";
3424
+ error: "error";
3426
3425
  accentDim: "accentDim";
3426
+ warning: "warning";
3427
3427
  textMuted: "textMuted";
3428
3428
  }>>;
3429
3429
  axis: z.ZodOptional<z.ZodEnum<{
@@ -3452,10 +3452,10 @@ declare const evalChartConfigSchema: z.ZodObject<{
3452
3452
  source: z.ZodLiteral<"column">;
3453
3453
  key: z.ZodString;
3454
3454
  aggregate: z.ZodEnum<{
3455
- sum: "sum";
3456
3455
  avg: "avg";
3457
3456
  min: "min";
3458
3457
  max: "max";
3458
+ sum: "sum";
3459
3459
  latest: "latest";
3460
3460
  passThresholdRate: "passThresholdRate";
3461
3461
  }>;
@@ -3485,11 +3485,11 @@ declare const evalChartsConfigSchema: z.ZodArray<z.ZodObject<{
3485
3485
  }>;
3486
3486
  label: z.ZodOptional<z.ZodString>;
3487
3487
  color: z.ZodOptional<z.ZodEnum<{
3488
- error: "error";
3489
3488
  success: "success";
3490
- warning: "warning";
3491
3489
  accent: "accent";
3490
+ error: "error";
3492
3491
  accentDim: "accentDim";
3492
+ warning: "warning";
3493
3493
  textMuted: "textMuted";
3494
3494
  }>>;
3495
3495
  axis: z.ZodOptional<z.ZodEnum<{
@@ -3500,20 +3500,20 @@ declare const evalChartsConfigSchema: z.ZodArray<z.ZodObject<{
3500
3500
  source: z.ZodLiteral<"column">;
3501
3501
  key: z.ZodString;
3502
3502
  aggregate: z.ZodEnum<{
3503
- sum: "sum";
3504
3503
  avg: "avg";
3505
3504
  min: "min";
3506
3505
  max: "max";
3506
+ sum: "sum";
3507
3507
  latest: "latest";
3508
3508
  passThresholdRate: "passThresholdRate";
3509
3509
  }>;
3510
3510
  label: z.ZodOptional<z.ZodString>;
3511
3511
  color: z.ZodOptional<z.ZodEnum<{
3512
- error: "error";
3513
3512
  success: "success";
3514
- warning: "warning";
3515
3513
  accent: "accent";
3514
+ error: "error";
3516
3515
  accentDim: "accentDim";
3516
+ warning: "warning";
3517
3517
  textMuted: "textMuted";
3518
3518
  }>>;
3519
3519
  axis: z.ZodOptional<z.ZodEnum<{
@@ -3542,10 +3542,10 @@ declare const evalChartsConfigSchema: z.ZodArray<z.ZodObject<{
3542
3542
  source: z.ZodLiteral<"column">;
3543
3543
  key: z.ZodString;
3544
3544
  aggregate: z.ZodEnum<{
3545
- sum: "sum";
3546
3545
  avg: "avg";
3547
3546
  min: "min";
3548
3547
  max: "max";
3548
+ sum: "sum";
3549
3549
  latest: "latest";
3550
3550
  passThresholdRate: "passThresholdRate";
3551
3551
  }>;
@@ -3573,8 +3573,8 @@ declare const runManifestSchema$1: z.ZodObject<{
3573
3573
  evalSourceFingerprints: z.ZodDefault<z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodString>>>;
3574
3574
  target: z.ZodObject<{
3575
3575
  mode: z.ZodEnum<{
3576
- all: "all";
3577
3576
  caseIds: "caseIds";
3577
+ all: "all";
3578
3578
  evalIds: "evalIds";
3579
3579
  }>;
3580
3580
  evalKeys: z.ZodOptional<z.ZodArray<z.ZodString>>;
@@ -4669,10 +4669,10 @@ declare const cacheRecordingOpSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
4669
4669
  format: z.ZodOptional<z.ZodEnum<{
4670
4670
  number: "number";
4671
4671
  boolean: "boolean";
4672
- duration: "duration";
4673
- json: "json";
4674
4672
  file: "file";
4673
+ duration: "duration";
4675
4674
  markdown: "markdown";
4675
+ json: "json";
4676
4676
  image: "image";
4677
4677
  html: "html";
4678
4678
  pdf: "pdf";
@@ -4721,8 +4721,8 @@ declare const cacheRecordingSchema: z.ZodObject<{
4721
4721
  finalStatus: z.ZodOptional<z.ZodEnum<{
4722
4722
  error: "error";
4723
4723
  running: "running";
4724
- ok: "ok";
4725
4724
  cancelled: "cancelled";
4725
+ ok: "ok";
4726
4726
  }>>;
4727
4727
  finalError: z.ZodOptional<z.ZodObject<{
4728
4728
  name: z.ZodOptional<z.ZodString>;
@@ -4757,10 +4757,10 @@ declare const cacheRecordingSchema: z.ZodObject<{
4757
4757
  format: z.ZodOptional<z.ZodEnum<{
4758
4758
  number: "number";
4759
4759
  boolean: "boolean";
4760
- duration: "duration";
4761
- json: "json";
4762
4760
  file: "file";
4761
+ duration: "duration";
4763
4762
  markdown: "markdown";
4763
+ json: "json";
4764
4764
  image: "image";
4765
4765
  html: "html";
4766
4766
  pdf: "pdf";
@@ -4822,8 +4822,8 @@ declare const cacheEntrySchema: z.ZodObject<{
4822
4822
  finalStatus: z.ZodOptional<z.ZodEnum<{
4823
4823
  error: "error";
4824
4824
  running: "running";
4825
- ok: "ok";
4826
4825
  cancelled: "cancelled";
4826
+ ok: "ok";
4827
4827
  }>>;
4828
4828
  finalError: z.ZodOptional<z.ZodObject<{
4829
4829
  name: z.ZodOptional<z.ZodString>;
@@ -4858,10 +4858,10 @@ declare const cacheEntrySchema: z.ZodObject<{
4858
4858
  format: z.ZodOptional<z.ZodEnum<{
4859
4859
  number: "number";
4860
4860
  boolean: "boolean";
4861
- duration: "duration";
4862
- json: "json";
4863
4861
  file: "file";
4862
+ duration: "duration";
4864
4863
  markdown: "markdown";
4864
+ json: "json";
4865
4865
  image: "image";
4866
4866
  html: "html";
4867
4867
  pdf: "pdf";
@@ -4940,8 +4940,8 @@ declare const cacheDebugKeyEntrySchema: z.ZodObject<{
4940
4940
  finalStatus: z.ZodOptional<z.ZodEnum<{
4941
4941
  error: "error";
4942
4942
  running: "running";
4943
- ok: "ok";
4944
4943
  cancelled: "cancelled";
4944
+ ok: "ok";
4945
4945
  }>>;
4946
4946
  finalError: z.ZodOptional<z.ZodObject<{
4947
4947
  name: z.ZodOptional<z.ZodString>;
@@ -4976,10 +4976,10 @@ declare const cacheDebugKeyEntrySchema: z.ZodObject<{
4976
4976
  format: z.ZodOptional<z.ZodEnum<{
4977
4977
  number: "number";
4978
4978
  boolean: "boolean";
4979
- duration: "duration";
4980
- json: "json";
4981
4979
  file: "file";
4980
+ duration: "duration";
4982
4981
  markdown: "markdown";
4982
+ json: "json";
4983
4983
  image: "image";
4984
4984
  html: "html";
4985
4985
  pdf: "pdf";
@@ -5047,8 +5047,8 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
5047
5047
  finalStatus: z.ZodOptional<z.ZodEnum<{
5048
5048
  error: "error";
5049
5049
  running: "running";
5050
- ok: "ok";
5051
5050
  cancelled: "cancelled";
5051
+ ok: "ok";
5052
5052
  }>>;
5053
5053
  finalError: z.ZodOptional<z.ZodObject<{
5054
5054
  name: z.ZodOptional<z.ZodString>;
@@ -5083,10 +5083,10 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
5083
5083
  format: z.ZodOptional<z.ZodEnum<{
5084
5084
  number: "number";
5085
5085
  boolean: "boolean";
5086
- duration: "duration";
5087
- json: "json";
5088
5086
  file: "file";
5087
+ duration: "duration";
5089
5088
  markdown: "markdown";
5089
+ json: "json";
5090
5090
  image: "image";
5091
5091
  html: "html";
5092
5092
  pdf: "pdf";
@@ -5156,8 +5156,8 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
5156
5156
  finalStatus: z.ZodOptional<z.ZodEnum<{
5157
5157
  error: "error";
5158
5158
  running: "running";
5159
- ok: "ok";
5160
5159
  cancelled: "cancelled";
5160
+ ok: "ok";
5161
5161
  }>>;
5162
5162
  finalError: z.ZodOptional<z.ZodObject<{
5163
5163
  name: z.ZodOptional<z.ZodString>;
@@ -5192,10 +5192,10 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
5192
5192
  format: z.ZodOptional<z.ZodEnum<{
5193
5193
  number: "number";
5194
5194
  boolean: "boolean";
5195
- duration: "duration";
5196
- json: "json";
5197
5195
  file: "file";
5196
+ duration: "duration";
5198
5197
  markdown: "markdown";
5198
+ json: "json";
5199
5199
  image: "image";
5200
5200
  html: "html";
5201
5201
  pdf: "pdf";
@@ -5263,8 +5263,8 @@ declare const cacheFileSchema: z.ZodObject<{
5263
5263
  finalStatus: z.ZodOptional<z.ZodEnum<{
5264
5264
  error: "error";
5265
5265
  running: "running";
5266
- ok: "ok";
5267
5266
  cancelled: "cancelled";
5267
+ ok: "ok";
5268
5268
  }>>;
5269
5269
  finalError: z.ZodOptional<z.ZodObject<{
5270
5270
  name: z.ZodOptional<z.ZodString>;
@@ -5299,10 +5299,10 @@ declare const cacheFileSchema: z.ZodObject<{
5299
5299
  format: z.ZodOptional<z.ZodEnum<{
5300
5300
  number: "number";
5301
5301
  boolean: "boolean";
5302
- duration: "duration";
5303
- json: "json";
5304
5302
  file: "file";
5303
+ duration: "duration";
5305
5304
  markdown: "markdown";
5305
+ json: "json";
5306
5306
  image: "image";
5307
5307
  html: "html";
5308
5308
  pdf: "pdf";
@@ -5380,8 +5380,8 @@ declare const cacheDebugKeyFileSchema: z.ZodObject<{
5380
5380
  finalStatus: z.ZodOptional<z.ZodEnum<{
5381
5381
  error: "error";
5382
5382
  running: "running";
5383
- ok: "ok";
5384
5383
  cancelled: "cancelled";
5384
+ ok: "ok";
5385
5385
  }>>;
5386
5386
  finalError: z.ZodOptional<z.ZodObject<{
5387
5387
  name: z.ZodOptional<z.ZodString>;
@@ -5416,10 +5416,10 @@ declare const cacheDebugKeyFileSchema: z.ZodObject<{
5416
5416
  format: z.ZodOptional<z.ZodEnum<{
5417
5417
  number: "number";
5418
5418
  boolean: "boolean";
5419
- duration: "duration";
5420
- json: "json";
5421
5419
  file: "file";
5420
+ duration: "duration";
5422
5421
  markdown: "markdown";
5422
+ json: "json";
5423
5423
  image: "image";
5424
5424
  html: "html";
5425
5425
  pdf: "pdf";
@@ -5565,8 +5565,8 @@ type ConfigReloadState = z.infer<typeof configReloadStateSchema$1>;
5565
5565
  declare const createRunRequestSchema$1: z.ZodObject<{
5566
5566
  target: z.ZodObject<{
5567
5567
  mode: z.ZodEnum<{
5568
- all: "all";
5569
5568
  caseIds: "caseIds";
5569
+ all: "all";
5570
5570
  evalIds: "evalIds";
5571
5571
  }>;
5572
5572
  evalKeys: z.ZodOptional<z.ZodArray<z.ZodString>>;
package/dist/index.mjs CHANGED
@@ -1,4 +1,4 @@
1
- import { $ as setScopeCacheContext, A as repoFile, B as evalTime, C as evalTracer, D as deserializeCacheValue, E as deserializeCacheRecording, F as EvalRuntimeUsageError, Ft as getEvalRegistry, H as getEvalCaseInput, I as appendToEvalOutput, J as runInEvalRuntimeScope, K as mergeEvalOutput, M as readManualInputFile, N as evalExpect, O as serializeCacheRecording, P as EvalAssertionError, Q as setEvalOutput, R as evalAssert, S as evalSpan, T as hashCacheKeySync, U as incrementEvalOutput, V as getCurrentScope, W as isInEvalScope, X as runInExistingEvalScope, Y as runInEvalScope, at as extractApiCalls, b as buildTraceTree, ct as simulateTokenAllocation, et as startEvalBackgroundJob, it as extractCacheHits, j as manualInputFileValueSchema, k as serializeCacheValue, ot as extractLlmCalls, q as nextEvalId, rt as extractCacheEntries, st as simulateLlmCallCost, ut as getNestedAttribute, w as hashCacheKey, x as captureEvalSpanError, z as evalLog } from "./runExecution-CjWJUUZ5.mjs";
2
- import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-CVBSlTD8.mjs";
3
- import { n as matchesEvalTags, t as defineEval } from "./src-DjOTPnDz.mjs";
1
+ import { $ as setScopeCacheContext, A as repoFile, B as evalTime, C as evalTracer, D as deserializeCacheValue, E as deserializeCacheRecording, F as EvalRuntimeUsageError, Ft as getEvalRegistry, H as getEvalCaseInput, I as appendToEvalOutput, J as runInEvalRuntimeScope, K as mergeEvalOutput, M as readManualInputFile, N as evalExpect, O as serializeCacheRecording, P as EvalAssertionError, Q as setEvalOutput, R as evalAssert, S as evalSpan, T as hashCacheKeySync, U as incrementEvalOutput, V as getCurrentScope, W as isInEvalScope, X as runInExistingEvalScope, Y as runInEvalScope, at as extractApiCalls, b as buildTraceTree, ct as simulateTokenAllocation, et as startEvalBackgroundJob, it as extractCacheHits, j as manualInputFileValueSchema, k as serializeCacheValue, ot as extractLlmCalls, q as nextEvalId, rt as extractCacheEntries, st as simulateLlmCallCost, ut as getNestedAttribute, w as hashCacheKey, x as captureEvalSpanError, z as evalLog } from "./runExecution-Bq0Y3y_1.mjs";
2
+ import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-CbePEEua.mjs";
3
+ import { n as matchesEvalTags, t as defineEval } from "./src-CVM_FqPx.mjs";
4
4
  export { EvalAssertionError, EvalRuntimeUsageError, appendToEvalOutput, buildTraceTree, captureEvalSpanError, cleanupStagedManualInputFiles, createRunner, defineEval, deserializeCacheRecording, deserializeCacheValue, evalAssert, evalExpect, evalLog, evalSpan, evalTime, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, getCurrentScope, getEvalCaseInput, getEvalRegistry, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, manualInputFileValueSchema, matchesEvalTags, materializeManualInputFiles, mergeEvalOutput, nextEvalId, readManualInputFile, repoFile, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, serializeCacheRecording, serializeCacheValue, setEvalOutput, setScopeCacheContext, simulateLlmCallCost, simulateTokenAllocation, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob };
package/dist/runChild.mjs CHANGED
@@ -1,5 +1,5 @@
1
- import { At as evalStatsConfigSchema, L as configureEvalRunLogs, Mt as evalChartsConfigSchema, Nt as columnDefSchema, Tt as buildEvalKey, bt as runManifestSchema, jt as manualInputDescriptorSchema, kt as evalStatAggregateSchema, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, tt as createRunRequestSchema, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-CjWJUUZ5.mjs";
2
- import { S as parseEvalDiscovery, m as persistRunState, r as getTargetEvals$1, t as executeRun } from "./runOrchestration-DE2TFAS6.mjs";
1
+ import { At as evalStatsConfigSchema, L as configureEvalRunLogs, Mt as evalChartsConfigSchema, Nt as columnDefSchema, Tt as buildEvalKey, bt as runManifestSchema, jt as manualInputDescriptorSchema, kt as evalStatAggregateSchema, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, tt as createRunRequestSchema, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-Bq0Y3y_1.mjs";
2
+ import { S as parseEvalDiscovery, m as persistRunState, r as getTargetEvals$1, t as executeRun } from "./runOrchestration-BpwW0AmB.mjs";
3
3
  import { z } from "zod";
4
4
  import { readFile } from "node:fs/promises";
5
5
  import { relative } from "node:path";
@@ -289,7 +289,7 @@ z.object({
289
289
  key: z.string(),
290
290
  namespace: z.string(),
291
291
  storedAt: z.string(),
292
- /** Last successful cache hit time. `null` means the entry has not been hit yet. */
292
+ /** Last successful cache read or write time. Legacy entries may be `null`. */
293
293
  lastAccessedAt: z.string().nullable()
294
294
  });
295
295
  z.object({
@@ -5395,7 +5395,7 @@ function createFsCacheStore(options) {
5395
5395
  const index = await readNamespaceIndex(cacheDir, entry.namespace);
5396
5396
  index.entries[entry.key] = {
5397
5397
  storedAt: entry.storedAt,
5398
- lastAccessedAt: null,
5398
+ lastAccessedAt: entry.storedAt,
5399
5399
  blobRefs: await collectExternalJsonBlobRefs(entry, blobDirs)
5400
5400
  };
5401
5401
  await writeNamespaceIndex(cacheDir, index);
@@ -1,4 +1,4 @@
1
- import { Dt as caseDetailSchema, Et as getCaseRowCaseKey, It as runWithEvalRegistry, J as runInEvalRuntimeScope, Ot as caseRowSchema, Z as runWithEvalClock, _t as matchesTagsFilter, bt as runManifestSchema, d as loadEvalModule, f as resolveEvalDefaultConfig, g as commitPendingCacheWrites, gt as dedupeEvalTags, ht as deriveStatusFromChildStatuses, i as isCaseChildMessage, m as buildDeclaredColumnDefs, mt as deriveStatusFromCaseRows, n as resolveRunnableEvalCases, o as stripTerminalControlCodes, pt as deriveScopedSummaryFromCases, t as filterEvalCases, u as runWithModuleIsolation, vt as validateEvalTagName, wt as buildCaseKey, xt as runSummarySchema, yt as validateTagsFilterExpression } from "./runExecution-CjWJUUZ5.mjs";
1
+ import { Dt as caseDetailSchema, Et as getCaseRowCaseKey, It as runWithEvalRegistry, J as runInEvalRuntimeScope, Ot as caseRowSchema, Z as runWithEvalClock, _t as matchesTagsFilter, bt as runManifestSchema, d as loadEvalModule, f as resolveEvalDefaultConfig, g as commitPendingCacheWrites, gt as dedupeEvalTags, ht as deriveStatusFromChildStatuses, i as isCaseChildMessage, m as buildDeclaredColumnDefs, mt as deriveStatusFromCaseRows, n as resolveRunnableEvalCases, o as stripTerminalControlCodes, pt as deriveScopedSummaryFromCases, t as filterEvalCases, u as runWithModuleIsolation, vt as validateEvalTagName, wt as buildCaseKey, xt as runSummarySchema, yt as validateTagsFilterExpression } from "./runExecution-Bq0Y3y_1.mjs";
2
2
  import { Result, resultify } from "t-result";
3
3
  import { readFile, readdir, rm, writeFile } from "node:fs/promises";
4
4
  import { dirname, join } from "node:path";
@@ -1,5 +1,5 @@
1
- import { n as createRunner } from "./cli-CVBSlTD8.mjs";
2
- import "./src-DjOTPnDz.mjs";
1
+ import { n as createRunner } from "./cli-CbePEEua.mjs";
2
+ import "./src-CVM_FqPx.mjs";
3
3
  //#region ../../apps/server/src/runner.ts
4
4
  let runnerInstance = null;
5
5
  function getRunnerInstance({ loadEnv = true } = {}) {
@@ -1,2 +1,2 @@
1
- import { n as initRunner, t as getRunnerInstance } from "./runner-DzDRasWV.mjs";
1
+ import { n as initRunner, t as getRunnerInstance } from "./runner-Kp0JqxrU.mjs";
2
2
  export { getRunnerInstance, initRunner };
@@ -1,5 +1,5 @@
1
- import { G as matchesEvalTags$1, Pt as defineEval$1 } from "./runExecution-CjWJUUZ5.mjs";
2
- import "./cli-CVBSlTD8.mjs";
1
+ import { G as matchesEvalTags$1, Pt as defineEval$1 } from "./runExecution-Bq0Y3y_1.mjs";
2
+ import "./cli-CbePEEua.mjs";
3
3
  //#region src/index.ts
4
4
  /** Register an eval definition with typed tag support. */
5
5
  function defineEval(definition) {
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@ls-stack/agent-eval",
3
- "version": "0.60.1",
3
+ "version": "0.60.2",
4
4
  "type": "module",
5
5
  "bin": {
6
6
  "agent-evals": "./dist/bin.mjs"
@@ -32,9 +32,9 @@
32
32
  "devDependencies": {
33
33
  "@types/node": "^24.7.2",
34
34
  "typescript": "^5.9.2",
35
- "@agent-evals/sdk": "0.0.1",
35
+ "@agent-evals/runner": "0.0.1",
36
36
  "@agent-evals/shared": "0.0.1",
37
- "@agent-evals/runner": "0.0.1"
37
+ "@agent-evals/sdk": "0.0.1"
38
38
  },
39
39
  "scripts": {
40
40
  "build": "pnpm --filter @agent-evals/web build && pnpm --filter @agent-evals/shared build && pnpm --filter @agent-evals/sdk build && pnpm --filter @agent-evals/runner build && tsdown --filter cli-js && tsdown --filter cli-types",
@@ -568,6 +568,8 @@ Mental model:
568
568
  runner stays idle for `cache.pruneIdleDelayMs ?? 5000` milliseconds. Configure
569
569
  `cache.maxEntries` as a number for the default cap, or as
570
570
  `{ default, namespaces }` for exact namespace-specific caps.
571
+ Writes initialize the row's last access time to the stored time; later cache
572
+ hits refresh that timestamp at the configured access-time update interval.
571
573
  - Unindexed legacy cache files are ignored by normal lookup/listing. Use
572
574
  `agent-evals cache repair` to remove unindexed cache files, stale index rows,
573
575
  debug sidecars, and unreferenced blob files.