@ls-stack/agent-eval 0.60.1 → 0.60.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-CxKEVlng.mjs → app-DPCFFkyQ.mjs} +4 -4
- package/dist/bin.mjs +1 -1
- package/dist/caseChild.mjs +1 -1
- package/dist/{cli-CVBSlTD8.mjs → cli-CbePEEua.mjs} +4 -4
- package/dist/index.d.mts +96 -96
- package/dist/index.mjs +3 -3
- package/dist/runChild.mjs +2 -2
- package/dist/{runExecution-CjWJUUZ5.mjs → runExecution-Bq0Y3y_1.mjs} +2 -2
- package/dist/{runOrchestration-DE2TFAS6.mjs → runOrchestration-BpwW0AmB.mjs} +1 -1
- package/dist/{runner-DzDRasWV.mjs → runner-Kp0JqxrU.mjs} +2 -2
- package/dist/{runner-Cu1CQPTB.mjs → runner-XEP21_u9.mjs} +1 -1
- package/dist/{src-DjOTPnDz.mjs → src-CVM_FqPx.mjs} +2 -2
- package/package.json +3 -3
- package/skills/agent-eval/SKILL.md +2 -0
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
import { Et as getCaseRowCaseKey, Ot as caseRowSchema, dt as getEvalTitle, nt as updateManualScoreRequestSchema, rt as extractCacheEntries, tt as createRunRequestSchema } from "./runExecution-CjWJUUZ5.mjs";
|
|
2
|
-
import { o as stageManualInputFile } from "./cli-CVBSlTD8.mjs";
|
|
3
|
-
import "./src-DjOTPnDz.mjs";
|
|
4
|
-
import { t as getRunnerInstance } from "./runner-DzDRasWV.mjs";
|
|
1
|
+
import { Et as getCaseRowCaseKey, Ot as caseRowSchema, dt as getEvalTitle, nt as updateManualScoreRequestSchema, rt as extractCacheEntries, tt as createRunRequestSchema } from "./runExecution-Bq0Y3y_1.mjs";
|
|
2
|
+
import { o as stageManualInputFile } from "./cli-CbePEEua.mjs";
|
|
3
|
+
import "./src-CVM_FqPx.mjs";
|
|
4
|
+
import { t as getRunnerInstance } from "./runner-Kp0JqxrU.mjs";
|
|
5
5
|
import { z } from "zod";
|
|
6
6
|
import { resultify } from "t-result";
|
|
7
7
|
import { readFile } from "node:fs/promises";
|
package/dist/bin.mjs
CHANGED
package/dist/caseChild.mjs
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { Ct as resolveLlmCallsConfig, It as runWithEvalRegistry, J as runInEvalRuntimeScope, L as configureEvalRunLogs, St as resolveApiCallsConfig, _ as createBufferedCacheStore, a as isCaseChildParentMessage, d as loadEvalModule, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, r as runCase, v as createFsCacheStore, y as getCacheRetentionOptions } from "./runExecution-CjWJUUZ5.mjs";
|
|
1
|
+
import { Ct as resolveLlmCallsConfig, It as runWithEvalRegistry, J as runInEvalRuntimeScope, L as configureEvalRunLogs, St as resolveApiCallsConfig, _ as createBufferedCacheStore, a as isCaseChildParentMessage, d as loadEvalModule, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, r as runCase, v as createFsCacheStore, y as getCacheRetentionOptions } from "./runExecution-Bq0Y3y_1.mjs";
|
|
2
2
|
//#region ../runner/src/caseChild.ts
|
|
3
3
|
let fatalErrorReported = false;
|
|
4
4
|
let disconnectExpected = false;
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { Ct as resolveLlmCallsConfig, Et as getCaseRowCaseKey, Ft as getEvalRegistry, Ot as caseRowSchema, St as resolveApiCallsConfig, Tt as buildEvalKey, _t as matchesTagsFilter, c as resolveArtifactPath, dt as getEvalTitle, f as resolveEvalDefaultConfig, ft as getEvalDisplayStatus, h as normalizeScoreDef, lt as applyDerivedCallAttributes, m as buildDeclaredColumnDefs, o as stripTerminalControlCodes, p as loadConfig, pt as deriveScopedSummaryFromCases, s as resolveTracePresentation, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-CjWJUUZ5.mjs";
|
|
2
|
-
import { C as validateCharts, S as parseEvalDiscovery, _ as runTouchesEval, a as validateTagsFilters, b as deriveEvalFreshness, c as getLatestRunInfos, d as nextShortIdFromSnapshots, f as persistCaseDetail, g as recomputePersistedCaseStatus, h as recomputeEvalStatusesInRuns, i as resolveEvalTags, l as loadPersistedRunSnapshot, m as persistRunState, n as getTargetEvalKeys, o as generateRunId, p as deleteTemporaryRuns, s as getLastRunStatuses, u as loadPersistedRunSnapshots, v as buildManualInputDescriptor, x as loadIsolatedEvalRegistry, y as parseManualInputValues } from "./runOrchestration-DE2TFAS6.mjs";
|
|
1
|
+
import { Ct as resolveLlmCallsConfig, Et as getCaseRowCaseKey, Ft as getEvalRegistry, Ot as caseRowSchema, St as resolveApiCallsConfig, Tt as buildEvalKey, _t as matchesTagsFilter, c as resolveArtifactPath, dt as getEvalTitle, f as resolveEvalDefaultConfig, ft as getEvalDisplayStatus, h as normalizeScoreDef, lt as applyDerivedCallAttributes, m as buildDeclaredColumnDefs, o as stripTerminalControlCodes, p as loadConfig, pt as deriveScopedSummaryFromCases, s as resolveTracePresentation, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-Bq0Y3y_1.mjs";
|
|
2
|
+
import { C as validateCharts, S as parseEvalDiscovery, _ as runTouchesEval, a as validateTagsFilters, b as deriveEvalFreshness, c as getLatestRunInfos, d as nextShortIdFromSnapshots, f as persistCaseDetail, g as recomputePersistedCaseStatus, h as recomputeEvalStatusesInRuns, i as resolveEvalTags, l as loadPersistedRunSnapshot, m as persistRunState, n as getTargetEvalKeys, o as generateRunId, p as deleteTemporaryRuns, s as getLastRunStatuses, u as loadPersistedRunSnapshots, v as buildManualInputDescriptor, x as loadIsolatedEvalRegistry, y as parseManualInputValues } from "./runOrchestration-BpwW0AmB.mjs";
|
|
3
3
|
import { parseEnv } from "node:util";
|
|
4
4
|
import { resultify } from "t-result";
|
|
5
5
|
import { copyFile, mkdir, readFile, rm, writeFile } from "node:fs/promises";
|
|
@@ -2232,8 +2232,8 @@ async function commandApp(args) {
|
|
|
2232
2232
|
const { serve } = await import("@hono/node-server");
|
|
2233
2233
|
const bundledWebDist = resolve(currentDir, "apps/web/dist");
|
|
2234
2234
|
if (existsSync(bundledWebDist)) process.env.AGENT_EVALS_WEB_DIST = bundledWebDist;
|
|
2235
|
-
const appModule = await import("./app-CxKEVlng.mjs");
|
|
2236
|
-
const runnerModule = await import("./runner-Cu1CQPTB.mjs");
|
|
2235
|
+
const appModule = await import("./app-DPCFFkyQ.mjs");
|
|
2236
|
+
const runnerModule = await import("./runner-XEP21_u9.mjs");
|
|
2237
2237
|
if (!isHonoAppModule(appModule)) throw new Error("Server app module is invalid");
|
|
2238
2238
|
if (!isServerRunnerModule(runnerModule)) throw new Error("Server runner module is invalid");
|
|
2239
2239
|
await runnerModule.initRunner({ loadEnv: args.loadEnv });
|
package/dist/index.d.mts
CHANGED
|
@@ -1941,10 +1941,10 @@ type ColumnKind = z.infer<typeof columnKindSchema>;
|
|
|
1941
1941
|
declare const columnFormatSchema: z.ZodEnum<{
|
|
1942
1942
|
number: "number";
|
|
1943
1943
|
boolean: "boolean";
|
|
1944
|
-
duration: "duration";
|
|
1945
|
-
json: "json";
|
|
1946
1944
|
file: "file";
|
|
1945
|
+
duration: "duration";
|
|
1947
1946
|
markdown: "markdown";
|
|
1947
|
+
json: "json";
|
|
1948
1948
|
image: "image";
|
|
1949
1949
|
html: "html";
|
|
1950
1950
|
pdf: "pdf";
|
|
@@ -1968,10 +1968,10 @@ declare const columnDefSchema: z.ZodObject<{
|
|
|
1968
1968
|
format: z.ZodOptional<z.ZodEnum<{
|
|
1969
1969
|
number: "number";
|
|
1970
1970
|
boolean: "boolean";
|
|
1971
|
-
duration: "duration";
|
|
1972
|
-
json: "json";
|
|
1973
1971
|
file: "file";
|
|
1972
|
+
duration: "duration";
|
|
1974
1973
|
markdown: "markdown";
|
|
1974
|
+
json: "json";
|
|
1975
1975
|
image: "image";
|
|
1976
1976
|
html: "html";
|
|
1977
1977
|
pdf: "pdf";
|
|
@@ -2061,9 +2061,9 @@ declare const traceAttributeDisplaySchema: z.ZodObject<{
|
|
|
2061
2061
|
subtree: "subtree";
|
|
2062
2062
|
}>>;
|
|
2063
2063
|
mode: z.ZodOptional<z.ZodEnum<{
|
|
2064
|
+
sum: "sum";
|
|
2064
2065
|
all: "all";
|
|
2065
2066
|
last: "last";
|
|
2066
|
-
sum: "sum";
|
|
2067
2067
|
}>>;
|
|
2068
2068
|
}, z.core.$strip>;
|
|
2069
2069
|
/**
|
|
@@ -2097,9 +2097,9 @@ declare const traceDisplayConfigSchema: z.ZodObject<{
|
|
|
2097
2097
|
subtree: "subtree";
|
|
2098
2098
|
}>>;
|
|
2099
2099
|
mode: z.ZodOptional<z.ZodEnum<{
|
|
2100
|
+
sum: "sum";
|
|
2100
2101
|
all: "all";
|
|
2101
2102
|
last: "last";
|
|
2102
|
-
sum: "sum";
|
|
2103
2103
|
}>>;
|
|
2104
2104
|
}, z.core.$strip>>>;
|
|
2105
2105
|
}, z.core.$strip>;
|
|
@@ -2137,9 +2137,9 @@ declare const traceAttributeDisplayInputSchema: z.ZodObject<{
|
|
|
2137
2137
|
subtree: "subtree";
|
|
2138
2138
|
}>>;
|
|
2139
2139
|
mode: z.ZodOptional<z.ZodEnum<{
|
|
2140
|
+
sum: "sum";
|
|
2140
2141
|
all: "all";
|
|
2141
2142
|
last: "last";
|
|
2142
|
-
sum: "sum";
|
|
2143
2143
|
}>>;
|
|
2144
2144
|
transform: z.ZodOptional<z.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
2145
2145
|
}, z.core.$strip>;
|
|
@@ -2175,9 +2175,9 @@ declare const traceDisplayInputConfigSchema: z.ZodObject<{
|
|
|
2175
2175
|
subtree: "subtree";
|
|
2176
2176
|
}>>;
|
|
2177
2177
|
mode: z.ZodOptional<z.ZodEnum<{
|
|
2178
|
+
sum: "sum";
|
|
2178
2179
|
all: "all";
|
|
2179
2180
|
last: "last";
|
|
2180
|
-
sum: "sum";
|
|
2181
2181
|
}>>;
|
|
2182
2182
|
transform: z.ZodOptional<z.ZodCustom<TraceAttributeTransform, TraceAttributeTransform>>;
|
|
2183
2183
|
}, z.core.$strip>>>;
|
|
@@ -2214,8 +2214,8 @@ declare const traceSpanSchema$1: z.ZodObject<{
|
|
|
2214
2214
|
status: z.ZodEnum<{
|
|
2215
2215
|
error: "error";
|
|
2216
2216
|
running: "running";
|
|
2217
|
-
ok: "ok";
|
|
2218
2217
|
cancelled: "cancelled";
|
|
2218
|
+
ok: "ok";
|
|
2219
2219
|
}>;
|
|
2220
2220
|
attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
2221
2221
|
error: z.ZodOptional<z.ZodObject<{
|
|
@@ -2260,10 +2260,10 @@ type EvalFreshnessStatus = z.infer<typeof evalFreshnessStatusSchema>;
|
|
|
2260
2260
|
* `best` selects the highest finite value and `worst` selects the lowest.
|
|
2261
2261
|
*/
|
|
2262
2262
|
declare const evalStatAggregateSchema: z.ZodEnum<{
|
|
2263
|
-
sum: "sum";
|
|
2264
2263
|
avg: "avg";
|
|
2265
2264
|
min: "min";
|
|
2266
2265
|
max: "max";
|
|
2266
|
+
sum: "sum";
|
|
2267
2267
|
best: "best";
|
|
2268
2268
|
worst: "worst";
|
|
2269
2269
|
}>;
|
|
@@ -2292,10 +2292,10 @@ declare const evalStatItemSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
|
|
|
2292
2292
|
hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
|
|
2293
2293
|
kind: z.ZodLiteral<"duration">;
|
|
2294
2294
|
aggregate: z.ZodOptional<z.ZodEnum<{
|
|
2295
|
-
sum: "sum";
|
|
2296
2295
|
avg: "avg";
|
|
2297
2296
|
min: "min";
|
|
2298
2297
|
max: "max";
|
|
2298
|
+
sum: "sum";
|
|
2299
2299
|
best: "best";
|
|
2300
2300
|
worst: "worst";
|
|
2301
2301
|
}>>;
|
|
@@ -2303,10 +2303,10 @@ declare const evalStatItemSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
|
|
|
2303
2303
|
hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
|
|
2304
2304
|
kind: z.ZodLiteral<"cacheHits">;
|
|
2305
2305
|
aggregate: z.ZodOptional<z.ZodEnum<{
|
|
2306
|
-
sum: "sum";
|
|
2307
2306
|
avg: "avg";
|
|
2308
2307
|
min: "min";
|
|
2309
2308
|
max: "max";
|
|
2309
|
+
sum: "sum";
|
|
2310
2310
|
best: "best";
|
|
2311
2311
|
worst: "worst";
|
|
2312
2312
|
}>>;
|
|
@@ -2316,20 +2316,20 @@ declare const evalStatItemSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
|
|
|
2316
2316
|
key: z.ZodString;
|
|
2317
2317
|
label: z.ZodOptional<z.ZodString>;
|
|
2318
2318
|
aggregate: z.ZodEnum<{
|
|
2319
|
-
sum: "sum";
|
|
2320
2319
|
avg: "avg";
|
|
2321
2320
|
min: "min";
|
|
2322
2321
|
max: "max";
|
|
2322
|
+
sum: "sum";
|
|
2323
2323
|
best: "best";
|
|
2324
2324
|
worst: "worst";
|
|
2325
2325
|
}>;
|
|
2326
2326
|
format: z.ZodOptional<z.ZodEnum<{
|
|
2327
2327
|
number: "number";
|
|
2328
2328
|
boolean: "boolean";
|
|
2329
|
-
duration: "duration";
|
|
2330
|
-
json: "json";
|
|
2331
2329
|
file: "file";
|
|
2330
|
+
duration: "duration";
|
|
2332
2331
|
markdown: "markdown";
|
|
2332
|
+
json: "json";
|
|
2333
2333
|
image: "image";
|
|
2334
2334
|
html: "html";
|
|
2335
2335
|
pdf: "pdf";
|
|
@@ -2356,10 +2356,10 @@ declare const evalStatsConfigSchema: z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodOb
|
|
|
2356
2356
|
hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
|
|
2357
2357
|
kind: z.ZodLiteral<"duration">;
|
|
2358
2358
|
aggregate: z.ZodOptional<z.ZodEnum<{
|
|
2359
|
-
sum: "sum";
|
|
2360
2359
|
avg: "avg";
|
|
2361
2360
|
min: "min";
|
|
2362
2361
|
max: "max";
|
|
2362
|
+
sum: "sum";
|
|
2363
2363
|
best: "best";
|
|
2364
2364
|
worst: "worst";
|
|
2365
2365
|
}>>;
|
|
@@ -2367,10 +2367,10 @@ declare const evalStatsConfigSchema: z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodOb
|
|
|
2367
2367
|
hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
|
|
2368
2368
|
kind: z.ZodLiteral<"cacheHits">;
|
|
2369
2369
|
aggregate: z.ZodOptional<z.ZodEnum<{
|
|
2370
|
-
sum: "sum";
|
|
2371
2370
|
avg: "avg";
|
|
2372
2371
|
min: "min";
|
|
2373
2372
|
max: "max";
|
|
2373
|
+
sum: "sum";
|
|
2374
2374
|
best: "best";
|
|
2375
2375
|
worst: "worst";
|
|
2376
2376
|
}>>;
|
|
@@ -2380,20 +2380,20 @@ declare const evalStatsConfigSchema: z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodOb
|
|
|
2380
2380
|
key: z.ZodString;
|
|
2381
2381
|
label: z.ZodOptional<z.ZodString>;
|
|
2382
2382
|
aggregate: z.ZodEnum<{
|
|
2383
|
-
sum: "sum";
|
|
2384
2383
|
avg: "avg";
|
|
2385
2384
|
min: "min";
|
|
2386
2385
|
max: "max";
|
|
2386
|
+
sum: "sum";
|
|
2387
2387
|
best: "best";
|
|
2388
2388
|
worst: "worst";
|
|
2389
2389
|
}>;
|
|
2390
2390
|
format: z.ZodOptional<z.ZodEnum<{
|
|
2391
2391
|
number: "number";
|
|
2392
2392
|
boolean: "boolean";
|
|
2393
|
-
duration: "duration";
|
|
2394
|
-
json: "json";
|
|
2395
2393
|
file: "file";
|
|
2394
|
+
duration: "duration";
|
|
2396
2395
|
markdown: "markdown";
|
|
2396
|
+
json: "json";
|
|
2397
2397
|
image: "image";
|
|
2398
2398
|
html: "html";
|
|
2399
2399
|
pdf: "pdf";
|
|
@@ -2436,10 +2436,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2436
2436
|
format: z.ZodOptional<z.ZodEnum<{
|
|
2437
2437
|
number: "number";
|
|
2438
2438
|
boolean: "boolean";
|
|
2439
|
-
duration: "duration";
|
|
2440
|
-
json: "json";
|
|
2441
2439
|
file: "file";
|
|
2440
|
+
duration: "duration";
|
|
2442
2441
|
markdown: "markdown";
|
|
2442
|
+
json: "json";
|
|
2443
2443
|
image: "image";
|
|
2444
2444
|
html: "html";
|
|
2445
2445
|
pdf: "pdf";
|
|
@@ -2466,10 +2466,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2466
2466
|
caseIds: z.ZodOptional<z.ZodArray<z.ZodString>>;
|
|
2467
2467
|
lastRunStatus: z.ZodNullable<z.ZodEnum<{
|
|
2468
2468
|
error: "error";
|
|
2469
|
-
running: "running";
|
|
2470
|
-
cancelled: "cancelled";
|
|
2471
2469
|
pass: "pass";
|
|
2472
2470
|
fail: "fail";
|
|
2471
|
+
running: "running";
|
|
2472
|
+
cancelled: "cancelled";
|
|
2473
2473
|
unscored: "unscored";
|
|
2474
2474
|
}>>;
|
|
2475
2475
|
stats: z.ZodOptional<z.ZodArray<z.ZodDiscriminatedUnion<[z.ZodObject<{
|
|
@@ -2483,10 +2483,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2483
2483
|
hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
|
|
2484
2484
|
kind: z.ZodLiteral<"duration">;
|
|
2485
2485
|
aggregate: z.ZodOptional<z.ZodEnum<{
|
|
2486
|
-
sum: "sum";
|
|
2487
2486
|
avg: "avg";
|
|
2488
2487
|
min: "min";
|
|
2489
2488
|
max: "max";
|
|
2489
|
+
sum: "sum";
|
|
2490
2490
|
best: "best";
|
|
2491
2491
|
worst: "worst";
|
|
2492
2492
|
}>>;
|
|
@@ -2494,10 +2494,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2494
2494
|
hideIfNoValue: z.ZodOptional<z.ZodBoolean>;
|
|
2495
2495
|
kind: z.ZodLiteral<"cacheHits">;
|
|
2496
2496
|
aggregate: z.ZodOptional<z.ZodEnum<{
|
|
2497
|
-
sum: "sum";
|
|
2498
2497
|
avg: "avg";
|
|
2499
2498
|
min: "min";
|
|
2500
2499
|
max: "max";
|
|
2500
|
+
sum: "sum";
|
|
2501
2501
|
best: "best";
|
|
2502
2502
|
worst: "worst";
|
|
2503
2503
|
}>>;
|
|
@@ -2507,20 +2507,20 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2507
2507
|
key: z.ZodString;
|
|
2508
2508
|
label: z.ZodOptional<z.ZodString>;
|
|
2509
2509
|
aggregate: z.ZodEnum<{
|
|
2510
|
-
sum: "sum";
|
|
2511
2510
|
avg: "avg";
|
|
2512
2511
|
min: "min";
|
|
2513
2512
|
max: "max";
|
|
2513
|
+
sum: "sum";
|
|
2514
2514
|
best: "best";
|
|
2515
2515
|
worst: "worst";
|
|
2516
2516
|
}>;
|
|
2517
2517
|
format: z.ZodOptional<z.ZodEnum<{
|
|
2518
2518
|
number: "number";
|
|
2519
2519
|
boolean: "boolean";
|
|
2520
|
-
duration: "duration";
|
|
2521
|
-
json: "json";
|
|
2522
2520
|
file: "file";
|
|
2521
|
+
duration: "duration";
|
|
2523
2522
|
markdown: "markdown";
|
|
2523
|
+
json: "json";
|
|
2524
2524
|
image: "image";
|
|
2525
2525
|
html: "html";
|
|
2526
2526
|
pdf: "pdf";
|
|
@@ -2534,10 +2534,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2534
2534
|
accent: z.ZodOptional<z.ZodBoolean>;
|
|
2535
2535
|
}, z.core.$strip>], "kind">>>;
|
|
2536
2536
|
defaultStatAggregate: z.ZodOptional<z.ZodEnum<{
|
|
2537
|
-
sum: "sum";
|
|
2538
2537
|
avg: "avg";
|
|
2539
2538
|
min: "min";
|
|
2540
2539
|
max: "max";
|
|
2540
|
+
sum: "sum";
|
|
2541
2541
|
best: "best";
|
|
2542
2542
|
worst: "worst";
|
|
2543
2543
|
}>>;
|
|
@@ -2558,11 +2558,11 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2558
2558
|
}>;
|
|
2559
2559
|
label: z.ZodOptional<z.ZodString>;
|
|
2560
2560
|
color: z.ZodOptional<z.ZodEnum<{
|
|
2561
|
-
error: "error";
|
|
2562
2561
|
success: "success";
|
|
2563
|
-
warning: "warning";
|
|
2564
2562
|
accent: "accent";
|
|
2563
|
+
error: "error";
|
|
2565
2564
|
accentDim: "accentDim";
|
|
2565
|
+
warning: "warning";
|
|
2566
2566
|
textMuted: "textMuted";
|
|
2567
2567
|
}>>;
|
|
2568
2568
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -2573,20 +2573,20 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2573
2573
|
source: z.ZodLiteral<"column">;
|
|
2574
2574
|
key: z.ZodString;
|
|
2575
2575
|
aggregate: z.ZodEnum<{
|
|
2576
|
-
sum: "sum";
|
|
2577
2576
|
avg: "avg";
|
|
2578
2577
|
min: "min";
|
|
2579
2578
|
max: "max";
|
|
2579
|
+
sum: "sum";
|
|
2580
2580
|
latest: "latest";
|
|
2581
2581
|
passThresholdRate: "passThresholdRate";
|
|
2582
2582
|
}>;
|
|
2583
2583
|
label: z.ZodOptional<z.ZodString>;
|
|
2584
2584
|
color: z.ZodOptional<z.ZodEnum<{
|
|
2585
|
-
error: "error";
|
|
2586
2585
|
success: "success";
|
|
2587
|
-
warning: "warning";
|
|
2588
2586
|
accent: "accent";
|
|
2587
|
+
error: "error";
|
|
2589
2588
|
accentDim: "accentDim";
|
|
2589
|
+
warning: "warning";
|
|
2590
2590
|
textMuted: "textMuted";
|
|
2591
2591
|
}>>;
|
|
2592
2592
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -2615,10 +2615,10 @@ declare const evalSummarySchema$1: z.ZodObject<{
|
|
|
2615
2615
|
source: z.ZodLiteral<"column">;
|
|
2616
2616
|
key: z.ZodString;
|
|
2617
2617
|
aggregate: z.ZodEnum<{
|
|
2618
|
-
sum: "sum";
|
|
2619
2618
|
avg: "avg";
|
|
2620
2619
|
min: "min";
|
|
2621
2620
|
max: "max";
|
|
2621
|
+
sum: "sum";
|
|
2622
2622
|
latest: "latest";
|
|
2623
2623
|
passThresholdRate: "passThresholdRate";
|
|
2624
2624
|
}>;
|
|
@@ -2715,10 +2715,10 @@ declare const caseRowSchema$1: z.ZodObject<{
|
|
|
2715
2715
|
tags: z.ZodOptional<z.ZodArray<z.ZodString>>;
|
|
2716
2716
|
status: z.ZodEnum<{
|
|
2717
2717
|
error: "error";
|
|
2718
|
-
running: "running";
|
|
2719
|
-
cancelled: "cancelled";
|
|
2720
2718
|
pass: "pass";
|
|
2721
2719
|
fail: "fail";
|
|
2720
|
+
running: "running";
|
|
2721
|
+
cancelled: "cancelled";
|
|
2722
2722
|
pending: "pending";
|
|
2723
2723
|
}>;
|
|
2724
2724
|
durationMs: z.ZodNullable<z.ZodNumber>;
|
|
@@ -2748,10 +2748,10 @@ declare const caseRowSchema$1: z.ZodObject<{
|
|
|
2748
2748
|
format: z.ZodOptional<z.ZodEnum<{
|
|
2749
2749
|
number: "number";
|
|
2750
2750
|
boolean: "boolean";
|
|
2751
|
-
duration: "duration";
|
|
2752
|
-
json: "json";
|
|
2753
2751
|
file: "file";
|
|
2752
|
+
duration: "duration";
|
|
2754
2753
|
markdown: "markdown";
|
|
2754
|
+
json: "json";
|
|
2755
2755
|
image: "image";
|
|
2756
2756
|
html: "html";
|
|
2757
2757
|
pdf: "pdf";
|
|
@@ -2857,8 +2857,8 @@ declare const scoreTraceSchema: z.ZodObject<{
|
|
|
2857
2857
|
status: z.ZodEnum<{
|
|
2858
2858
|
error: "error";
|
|
2859
2859
|
running: "running";
|
|
2860
|
-
ok: "ok";
|
|
2861
2860
|
cancelled: "cancelled";
|
|
2861
|
+
ok: "ok";
|
|
2862
2862
|
}>;
|
|
2863
2863
|
attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
2864
2864
|
error: z.ZodOptional<z.ZodObject<{
|
|
@@ -2908,9 +2908,9 @@ declare const scoreTraceSchema: z.ZodObject<{
|
|
|
2908
2908
|
subtree: "subtree";
|
|
2909
2909
|
}>>;
|
|
2910
2910
|
mode: z.ZodOptional<z.ZodEnum<{
|
|
2911
|
+
sum: "sum";
|
|
2911
2912
|
all: "all";
|
|
2912
2913
|
last: "last";
|
|
2913
|
-
sum: "sum";
|
|
2914
2914
|
}>>;
|
|
2915
2915
|
}, z.core.$strip>>>;
|
|
2916
2916
|
}, z.core.$strip>;
|
|
@@ -2942,10 +2942,10 @@ declare const caseDetailSchema$1: z.ZodObject<{
|
|
|
2942
2942
|
tags: z.ZodOptional<z.ZodArray<z.ZodString>>;
|
|
2943
2943
|
status: z.ZodEnum<{
|
|
2944
2944
|
error: "error";
|
|
2945
|
-
running: "running";
|
|
2946
|
-
cancelled: "cancelled";
|
|
2947
2945
|
pass: "pass";
|
|
2948
2946
|
fail: "fail";
|
|
2947
|
+
running: "running";
|
|
2948
|
+
cancelled: "cancelled";
|
|
2949
2949
|
pending: "pending";
|
|
2950
2950
|
}>;
|
|
2951
2951
|
input: z.ZodUnknown;
|
|
@@ -2960,8 +2960,8 @@ declare const caseDetailSchema$1: z.ZodObject<{
|
|
|
2960
2960
|
status: z.ZodEnum<{
|
|
2961
2961
|
error: "error";
|
|
2962
2962
|
running: "running";
|
|
2963
|
-
ok: "ok";
|
|
2964
2963
|
cancelled: "cancelled";
|
|
2964
|
+
ok: "ok";
|
|
2965
2965
|
}>;
|
|
2966
2966
|
attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
2967
2967
|
error: z.ZodOptional<z.ZodObject<{
|
|
@@ -3011,9 +3011,9 @@ declare const caseDetailSchema$1: z.ZodObject<{
|
|
|
3011
3011
|
subtree: "subtree";
|
|
3012
3012
|
}>>;
|
|
3013
3013
|
mode: z.ZodOptional<z.ZodEnum<{
|
|
3014
|
+
sum: "sum";
|
|
3014
3015
|
all: "all";
|
|
3015
3016
|
last: "last";
|
|
3016
|
-
sum: "sum";
|
|
3017
3017
|
}>>;
|
|
3018
3018
|
}, z.core.$strip>>>;
|
|
3019
3019
|
}, z.core.$strip>;
|
|
@@ -3029,8 +3029,8 @@ declare const caseDetailSchema$1: z.ZodObject<{
|
|
|
3029
3029
|
status: z.ZodEnum<{
|
|
3030
3030
|
error: "error";
|
|
3031
3031
|
running: "running";
|
|
3032
|
-
ok: "ok";
|
|
3033
3032
|
cancelled: "cancelled";
|
|
3033
|
+
ok: "ok";
|
|
3034
3034
|
}>;
|
|
3035
3035
|
attributes: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
3036
3036
|
error: z.ZodOptional<z.ZodObject<{
|
|
@@ -3080,9 +3080,9 @@ declare const caseDetailSchema$1: z.ZodObject<{
|
|
|
3080
3080
|
subtree: "subtree";
|
|
3081
3081
|
}>>;
|
|
3082
3082
|
mode: z.ZodOptional<z.ZodEnum<{
|
|
3083
|
+
sum: "sum";
|
|
3083
3084
|
all: "all";
|
|
3084
3085
|
last: "last";
|
|
3085
|
-
sum: "sum";
|
|
3086
3086
|
}>>;
|
|
3087
3087
|
}, z.core.$strip>>>;
|
|
3088
3088
|
}, z.core.$strip>;
|
|
@@ -3126,10 +3126,10 @@ declare const caseDetailSchema$1: z.ZodObject<{
|
|
|
3126
3126
|
format: z.ZodOptional<z.ZodEnum<{
|
|
3127
3127
|
number: "number";
|
|
3128
3128
|
boolean: "boolean";
|
|
3129
|
-
duration: "duration";
|
|
3130
|
-
json: "json";
|
|
3131
3129
|
file: "file";
|
|
3130
|
+
duration: "duration";
|
|
3132
3131
|
markdown: "markdown";
|
|
3132
|
+
json: "json";
|
|
3133
3133
|
image: "image";
|
|
3134
3134
|
html: "html";
|
|
3135
3135
|
pdf: "pdf";
|
|
@@ -3269,10 +3269,10 @@ declare const evalChartBuiltinMetricSchema: z.ZodEnum<{
|
|
|
3269
3269
|
type EvalChartBuiltinMetric = z.infer<typeof evalChartBuiltinMetricSchema>;
|
|
3270
3270
|
/** Reducer applied to a numeric column across all cases of a single run. */
|
|
3271
3271
|
declare const evalChartAggregateSchema: z.ZodEnum<{
|
|
3272
|
-
sum: "sum";
|
|
3273
3272
|
avg: "avg";
|
|
3274
3273
|
min: "min";
|
|
3275
3274
|
max: "max";
|
|
3275
|
+
sum: "sum";
|
|
3276
3276
|
latest: "latest";
|
|
3277
3277
|
passThresholdRate: "passThresholdRate";
|
|
3278
3278
|
}>;
|
|
@@ -3283,11 +3283,11 @@ type EvalChartAggregate = z.infer<typeof evalChartAggregateSchema>;
|
|
|
3283
3283
|
* not emit raw hex so authored evals stay decoupled from the web theme.
|
|
3284
3284
|
*/
|
|
3285
3285
|
declare const evalChartColorSchema: z.ZodEnum<{
|
|
3286
|
-
error: "error";
|
|
3287
3286
|
success: "success";
|
|
3288
|
-
warning: "warning";
|
|
3289
3287
|
accent: "accent";
|
|
3288
|
+
error: "error";
|
|
3290
3289
|
accentDim: "accentDim";
|
|
3290
|
+
warning: "warning";
|
|
3291
3291
|
textMuted: "textMuted";
|
|
3292
3292
|
}>;
|
|
3293
3293
|
/** Semantic color token resolved to a theme color by the web UI. */
|
|
@@ -3312,11 +3312,11 @@ declare const evalChartMetricSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
|
|
|
3312
3312
|
}>;
|
|
3313
3313
|
label: z.ZodOptional<z.ZodString>;
|
|
3314
3314
|
color: z.ZodOptional<z.ZodEnum<{
|
|
3315
|
-
error: "error";
|
|
3316
3315
|
success: "success";
|
|
3317
|
-
warning: "warning";
|
|
3318
3316
|
accent: "accent";
|
|
3317
|
+
error: "error";
|
|
3319
3318
|
accentDim: "accentDim";
|
|
3319
|
+
warning: "warning";
|
|
3320
3320
|
textMuted: "textMuted";
|
|
3321
3321
|
}>>;
|
|
3322
3322
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -3327,20 +3327,20 @@ declare const evalChartMetricSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
|
|
|
3327
3327
|
source: z.ZodLiteral<"column">;
|
|
3328
3328
|
key: z.ZodString;
|
|
3329
3329
|
aggregate: z.ZodEnum<{
|
|
3330
|
-
sum: "sum";
|
|
3331
3330
|
avg: "avg";
|
|
3332
3331
|
min: "min";
|
|
3333
3332
|
max: "max";
|
|
3333
|
+
sum: "sum";
|
|
3334
3334
|
latest: "latest";
|
|
3335
3335
|
passThresholdRate: "passThresholdRate";
|
|
3336
3336
|
}>;
|
|
3337
3337
|
label: z.ZodOptional<z.ZodString>;
|
|
3338
3338
|
color: z.ZodOptional<z.ZodEnum<{
|
|
3339
|
-
error: "error";
|
|
3340
3339
|
success: "success";
|
|
3341
|
-
warning: "warning";
|
|
3342
3340
|
accent: "accent";
|
|
3341
|
+
error: "error";
|
|
3343
3342
|
accentDim: "accentDim";
|
|
3343
|
+
warning: "warning";
|
|
3344
3344
|
textMuted: "textMuted";
|
|
3345
3345
|
}>>;
|
|
3346
3346
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -3362,10 +3362,10 @@ declare const evalChartTooltipExtraSchema: z.ZodDiscriminatedUnion<[z.ZodObject<
|
|
|
3362
3362
|
source: z.ZodLiteral<"column">;
|
|
3363
3363
|
key: z.ZodString;
|
|
3364
3364
|
aggregate: z.ZodEnum<{
|
|
3365
|
-
sum: "sum";
|
|
3366
3365
|
avg: "avg";
|
|
3367
3366
|
min: "min";
|
|
3368
3367
|
max: "max";
|
|
3368
|
+
sum: "sum";
|
|
3369
3369
|
latest: "latest";
|
|
3370
3370
|
passThresholdRate: "passThresholdRate";
|
|
3371
3371
|
}>;
|
|
@@ -3395,11 +3395,11 @@ declare const evalChartConfigSchema: z.ZodObject<{
|
|
|
3395
3395
|
}>;
|
|
3396
3396
|
label: z.ZodOptional<z.ZodString>;
|
|
3397
3397
|
color: z.ZodOptional<z.ZodEnum<{
|
|
3398
|
-
error: "error";
|
|
3399
3398
|
success: "success";
|
|
3400
|
-
warning: "warning";
|
|
3401
3399
|
accent: "accent";
|
|
3400
|
+
error: "error";
|
|
3402
3401
|
accentDim: "accentDim";
|
|
3402
|
+
warning: "warning";
|
|
3403
3403
|
textMuted: "textMuted";
|
|
3404
3404
|
}>>;
|
|
3405
3405
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -3410,20 +3410,20 @@ declare const evalChartConfigSchema: z.ZodObject<{
|
|
|
3410
3410
|
source: z.ZodLiteral<"column">;
|
|
3411
3411
|
key: z.ZodString;
|
|
3412
3412
|
aggregate: z.ZodEnum<{
|
|
3413
|
-
sum: "sum";
|
|
3414
3413
|
avg: "avg";
|
|
3415
3414
|
min: "min";
|
|
3416
3415
|
max: "max";
|
|
3416
|
+
sum: "sum";
|
|
3417
3417
|
latest: "latest";
|
|
3418
3418
|
passThresholdRate: "passThresholdRate";
|
|
3419
3419
|
}>;
|
|
3420
3420
|
label: z.ZodOptional<z.ZodString>;
|
|
3421
3421
|
color: z.ZodOptional<z.ZodEnum<{
|
|
3422
|
-
error: "error";
|
|
3423
3422
|
success: "success";
|
|
3424
|
-
warning: "warning";
|
|
3425
3423
|
accent: "accent";
|
|
3424
|
+
error: "error";
|
|
3426
3425
|
accentDim: "accentDim";
|
|
3426
|
+
warning: "warning";
|
|
3427
3427
|
textMuted: "textMuted";
|
|
3428
3428
|
}>>;
|
|
3429
3429
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -3452,10 +3452,10 @@ declare const evalChartConfigSchema: z.ZodObject<{
|
|
|
3452
3452
|
source: z.ZodLiteral<"column">;
|
|
3453
3453
|
key: z.ZodString;
|
|
3454
3454
|
aggregate: z.ZodEnum<{
|
|
3455
|
-
sum: "sum";
|
|
3456
3455
|
avg: "avg";
|
|
3457
3456
|
min: "min";
|
|
3458
3457
|
max: "max";
|
|
3458
|
+
sum: "sum";
|
|
3459
3459
|
latest: "latest";
|
|
3460
3460
|
passThresholdRate: "passThresholdRate";
|
|
3461
3461
|
}>;
|
|
@@ -3485,11 +3485,11 @@ declare const evalChartsConfigSchema: z.ZodArray<z.ZodObject<{
|
|
|
3485
3485
|
}>;
|
|
3486
3486
|
label: z.ZodOptional<z.ZodString>;
|
|
3487
3487
|
color: z.ZodOptional<z.ZodEnum<{
|
|
3488
|
-
error: "error";
|
|
3489
3488
|
success: "success";
|
|
3490
|
-
warning: "warning";
|
|
3491
3489
|
accent: "accent";
|
|
3490
|
+
error: "error";
|
|
3492
3491
|
accentDim: "accentDim";
|
|
3492
|
+
warning: "warning";
|
|
3493
3493
|
textMuted: "textMuted";
|
|
3494
3494
|
}>>;
|
|
3495
3495
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -3500,20 +3500,20 @@ declare const evalChartsConfigSchema: z.ZodArray<z.ZodObject<{
|
|
|
3500
3500
|
source: z.ZodLiteral<"column">;
|
|
3501
3501
|
key: z.ZodString;
|
|
3502
3502
|
aggregate: z.ZodEnum<{
|
|
3503
|
-
sum: "sum";
|
|
3504
3503
|
avg: "avg";
|
|
3505
3504
|
min: "min";
|
|
3506
3505
|
max: "max";
|
|
3506
|
+
sum: "sum";
|
|
3507
3507
|
latest: "latest";
|
|
3508
3508
|
passThresholdRate: "passThresholdRate";
|
|
3509
3509
|
}>;
|
|
3510
3510
|
label: z.ZodOptional<z.ZodString>;
|
|
3511
3511
|
color: z.ZodOptional<z.ZodEnum<{
|
|
3512
|
-
error: "error";
|
|
3513
3512
|
success: "success";
|
|
3514
|
-
warning: "warning";
|
|
3515
3513
|
accent: "accent";
|
|
3514
|
+
error: "error";
|
|
3516
3515
|
accentDim: "accentDim";
|
|
3516
|
+
warning: "warning";
|
|
3517
3517
|
textMuted: "textMuted";
|
|
3518
3518
|
}>>;
|
|
3519
3519
|
axis: z.ZodOptional<z.ZodEnum<{
|
|
@@ -3542,10 +3542,10 @@ declare const evalChartsConfigSchema: z.ZodArray<z.ZodObject<{
|
|
|
3542
3542
|
source: z.ZodLiteral<"column">;
|
|
3543
3543
|
key: z.ZodString;
|
|
3544
3544
|
aggregate: z.ZodEnum<{
|
|
3545
|
-
sum: "sum";
|
|
3546
3545
|
avg: "avg";
|
|
3547
3546
|
min: "min";
|
|
3548
3547
|
max: "max";
|
|
3548
|
+
sum: "sum";
|
|
3549
3549
|
latest: "latest";
|
|
3550
3550
|
passThresholdRate: "passThresholdRate";
|
|
3551
3551
|
}>;
|
|
@@ -3573,8 +3573,8 @@ declare const runManifestSchema$1: z.ZodObject<{
|
|
|
3573
3573
|
evalSourceFingerprints: z.ZodDefault<z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodString>>>;
|
|
3574
3574
|
target: z.ZodObject<{
|
|
3575
3575
|
mode: z.ZodEnum<{
|
|
3576
|
-
all: "all";
|
|
3577
3576
|
caseIds: "caseIds";
|
|
3577
|
+
all: "all";
|
|
3578
3578
|
evalIds: "evalIds";
|
|
3579
3579
|
}>;
|
|
3580
3580
|
evalKeys: z.ZodOptional<z.ZodArray<z.ZodString>>;
|
|
@@ -4669,10 +4669,10 @@ declare const cacheRecordingOpSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
|
|
|
4669
4669
|
format: z.ZodOptional<z.ZodEnum<{
|
|
4670
4670
|
number: "number";
|
|
4671
4671
|
boolean: "boolean";
|
|
4672
|
-
duration: "duration";
|
|
4673
|
-
json: "json";
|
|
4674
4672
|
file: "file";
|
|
4673
|
+
duration: "duration";
|
|
4675
4674
|
markdown: "markdown";
|
|
4675
|
+
json: "json";
|
|
4676
4676
|
image: "image";
|
|
4677
4677
|
html: "html";
|
|
4678
4678
|
pdf: "pdf";
|
|
@@ -4721,8 +4721,8 @@ declare const cacheRecordingSchema: z.ZodObject<{
|
|
|
4721
4721
|
finalStatus: z.ZodOptional<z.ZodEnum<{
|
|
4722
4722
|
error: "error";
|
|
4723
4723
|
running: "running";
|
|
4724
|
-
ok: "ok";
|
|
4725
4724
|
cancelled: "cancelled";
|
|
4725
|
+
ok: "ok";
|
|
4726
4726
|
}>>;
|
|
4727
4727
|
finalError: z.ZodOptional<z.ZodObject<{
|
|
4728
4728
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -4757,10 +4757,10 @@ declare const cacheRecordingSchema: z.ZodObject<{
|
|
|
4757
4757
|
format: z.ZodOptional<z.ZodEnum<{
|
|
4758
4758
|
number: "number";
|
|
4759
4759
|
boolean: "boolean";
|
|
4760
|
-
duration: "duration";
|
|
4761
|
-
json: "json";
|
|
4762
4760
|
file: "file";
|
|
4761
|
+
duration: "duration";
|
|
4763
4762
|
markdown: "markdown";
|
|
4763
|
+
json: "json";
|
|
4764
4764
|
image: "image";
|
|
4765
4765
|
html: "html";
|
|
4766
4766
|
pdf: "pdf";
|
|
@@ -4822,8 +4822,8 @@ declare const cacheEntrySchema: z.ZodObject<{
|
|
|
4822
4822
|
finalStatus: z.ZodOptional<z.ZodEnum<{
|
|
4823
4823
|
error: "error";
|
|
4824
4824
|
running: "running";
|
|
4825
|
-
ok: "ok";
|
|
4826
4825
|
cancelled: "cancelled";
|
|
4826
|
+
ok: "ok";
|
|
4827
4827
|
}>>;
|
|
4828
4828
|
finalError: z.ZodOptional<z.ZodObject<{
|
|
4829
4829
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -4858,10 +4858,10 @@ declare const cacheEntrySchema: z.ZodObject<{
|
|
|
4858
4858
|
format: z.ZodOptional<z.ZodEnum<{
|
|
4859
4859
|
number: "number";
|
|
4860
4860
|
boolean: "boolean";
|
|
4861
|
-
duration: "duration";
|
|
4862
|
-
json: "json";
|
|
4863
4861
|
file: "file";
|
|
4862
|
+
duration: "duration";
|
|
4864
4863
|
markdown: "markdown";
|
|
4864
|
+
json: "json";
|
|
4865
4865
|
image: "image";
|
|
4866
4866
|
html: "html";
|
|
4867
4867
|
pdf: "pdf";
|
|
@@ -4940,8 +4940,8 @@ declare const cacheDebugKeyEntrySchema: z.ZodObject<{
|
|
|
4940
4940
|
finalStatus: z.ZodOptional<z.ZodEnum<{
|
|
4941
4941
|
error: "error";
|
|
4942
4942
|
running: "running";
|
|
4943
|
-
ok: "ok";
|
|
4944
4943
|
cancelled: "cancelled";
|
|
4944
|
+
ok: "ok";
|
|
4945
4945
|
}>>;
|
|
4946
4946
|
finalError: z.ZodOptional<z.ZodObject<{
|
|
4947
4947
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -4976,10 +4976,10 @@ declare const cacheDebugKeyEntrySchema: z.ZodObject<{
|
|
|
4976
4976
|
format: z.ZodOptional<z.ZodEnum<{
|
|
4977
4977
|
number: "number";
|
|
4978
4978
|
boolean: "boolean";
|
|
4979
|
-
duration: "duration";
|
|
4980
|
-
json: "json";
|
|
4981
4979
|
file: "file";
|
|
4980
|
+
duration: "duration";
|
|
4982
4981
|
markdown: "markdown";
|
|
4982
|
+
json: "json";
|
|
4983
4983
|
image: "image";
|
|
4984
4984
|
html: "html";
|
|
4985
4985
|
pdf: "pdf";
|
|
@@ -5047,8 +5047,8 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
|
|
|
5047
5047
|
finalStatus: z.ZodOptional<z.ZodEnum<{
|
|
5048
5048
|
error: "error";
|
|
5049
5049
|
running: "running";
|
|
5050
|
-
ok: "ok";
|
|
5051
5050
|
cancelled: "cancelled";
|
|
5051
|
+
ok: "ok";
|
|
5052
5052
|
}>>;
|
|
5053
5053
|
finalError: z.ZodOptional<z.ZodObject<{
|
|
5054
5054
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -5083,10 +5083,10 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
|
|
|
5083
5083
|
format: z.ZodOptional<z.ZodEnum<{
|
|
5084
5084
|
number: "number";
|
|
5085
5085
|
boolean: "boolean";
|
|
5086
|
-
duration: "duration";
|
|
5087
|
-
json: "json";
|
|
5088
5086
|
file: "file";
|
|
5087
|
+
duration: "duration";
|
|
5089
5088
|
markdown: "markdown";
|
|
5089
|
+
json: "json";
|
|
5090
5090
|
image: "image";
|
|
5091
5091
|
html: "html";
|
|
5092
5092
|
pdf: "pdf";
|
|
@@ -5156,8 +5156,8 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
|
|
|
5156
5156
|
finalStatus: z.ZodOptional<z.ZodEnum<{
|
|
5157
5157
|
error: "error";
|
|
5158
5158
|
running: "running";
|
|
5159
|
-
ok: "ok";
|
|
5160
5159
|
cancelled: "cancelled";
|
|
5160
|
+
ok: "ok";
|
|
5161
5161
|
}>>;
|
|
5162
5162
|
finalError: z.ZodOptional<z.ZodObject<{
|
|
5163
5163
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -5192,10 +5192,10 @@ declare const cacheEntryWithDebugKeySchema$1: z.ZodObject<{
|
|
|
5192
5192
|
format: z.ZodOptional<z.ZodEnum<{
|
|
5193
5193
|
number: "number";
|
|
5194
5194
|
boolean: "boolean";
|
|
5195
|
-
duration: "duration";
|
|
5196
|
-
json: "json";
|
|
5197
5195
|
file: "file";
|
|
5196
|
+
duration: "duration";
|
|
5198
5197
|
markdown: "markdown";
|
|
5198
|
+
json: "json";
|
|
5199
5199
|
image: "image";
|
|
5200
5200
|
html: "html";
|
|
5201
5201
|
pdf: "pdf";
|
|
@@ -5263,8 +5263,8 @@ declare const cacheFileSchema: z.ZodObject<{
|
|
|
5263
5263
|
finalStatus: z.ZodOptional<z.ZodEnum<{
|
|
5264
5264
|
error: "error";
|
|
5265
5265
|
running: "running";
|
|
5266
|
-
ok: "ok";
|
|
5267
5266
|
cancelled: "cancelled";
|
|
5267
|
+
ok: "ok";
|
|
5268
5268
|
}>>;
|
|
5269
5269
|
finalError: z.ZodOptional<z.ZodObject<{
|
|
5270
5270
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -5299,10 +5299,10 @@ declare const cacheFileSchema: z.ZodObject<{
|
|
|
5299
5299
|
format: z.ZodOptional<z.ZodEnum<{
|
|
5300
5300
|
number: "number";
|
|
5301
5301
|
boolean: "boolean";
|
|
5302
|
-
duration: "duration";
|
|
5303
|
-
json: "json";
|
|
5304
5302
|
file: "file";
|
|
5303
|
+
duration: "duration";
|
|
5305
5304
|
markdown: "markdown";
|
|
5305
|
+
json: "json";
|
|
5306
5306
|
image: "image";
|
|
5307
5307
|
html: "html";
|
|
5308
5308
|
pdf: "pdf";
|
|
@@ -5380,8 +5380,8 @@ declare const cacheDebugKeyFileSchema: z.ZodObject<{
|
|
|
5380
5380
|
finalStatus: z.ZodOptional<z.ZodEnum<{
|
|
5381
5381
|
error: "error";
|
|
5382
5382
|
running: "running";
|
|
5383
|
-
ok: "ok";
|
|
5384
5383
|
cancelled: "cancelled";
|
|
5384
|
+
ok: "ok";
|
|
5385
5385
|
}>>;
|
|
5386
5386
|
finalError: z.ZodOptional<z.ZodObject<{
|
|
5387
5387
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -5416,10 +5416,10 @@ declare const cacheDebugKeyFileSchema: z.ZodObject<{
|
|
|
5416
5416
|
format: z.ZodOptional<z.ZodEnum<{
|
|
5417
5417
|
number: "number";
|
|
5418
5418
|
boolean: "boolean";
|
|
5419
|
-
duration: "duration";
|
|
5420
|
-
json: "json";
|
|
5421
5419
|
file: "file";
|
|
5420
|
+
duration: "duration";
|
|
5422
5421
|
markdown: "markdown";
|
|
5422
|
+
json: "json";
|
|
5423
5423
|
image: "image";
|
|
5424
5424
|
html: "html";
|
|
5425
5425
|
pdf: "pdf";
|
|
@@ -5565,8 +5565,8 @@ type ConfigReloadState = z.infer<typeof configReloadStateSchema$1>;
|
|
|
5565
5565
|
declare const createRunRequestSchema$1: z.ZodObject<{
|
|
5566
5566
|
target: z.ZodObject<{
|
|
5567
5567
|
mode: z.ZodEnum<{
|
|
5568
|
-
all: "all";
|
|
5569
5568
|
caseIds: "caseIds";
|
|
5569
|
+
all: "all";
|
|
5570
5570
|
evalIds: "evalIds";
|
|
5571
5571
|
}>;
|
|
5572
5572
|
evalKeys: z.ZodOptional<z.ZodArray<z.ZodString>>;
|
package/dist/index.mjs
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { $ as setScopeCacheContext, A as repoFile, B as evalTime, C as evalTracer, D as deserializeCacheValue, E as deserializeCacheRecording, F as EvalRuntimeUsageError, Ft as getEvalRegistry, H as getEvalCaseInput, I as appendToEvalOutput, J as runInEvalRuntimeScope, K as mergeEvalOutput, M as readManualInputFile, N as evalExpect, O as serializeCacheRecording, P as EvalAssertionError, Q as setEvalOutput, R as evalAssert, S as evalSpan, T as hashCacheKeySync, U as incrementEvalOutput, V as getCurrentScope, W as isInEvalScope, X as runInExistingEvalScope, Y as runInEvalScope, at as extractApiCalls, b as buildTraceTree, ct as simulateTokenAllocation, et as startEvalBackgroundJob, it as extractCacheHits, j as manualInputFileValueSchema, k as serializeCacheValue, ot as extractLlmCalls, q as nextEvalId, rt as extractCacheEntries, st as simulateLlmCallCost, ut as getNestedAttribute, w as hashCacheKey, x as captureEvalSpanError, z as evalLog } from "./runExecution-
|
|
2
|
-
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-
|
|
3
|
-
import { n as matchesEvalTags, t as defineEval } from "./src-
|
|
1
|
+
import { $ as setScopeCacheContext, A as repoFile, B as evalTime, C as evalTracer, D as deserializeCacheValue, E as deserializeCacheRecording, F as EvalRuntimeUsageError, Ft as getEvalRegistry, H as getEvalCaseInput, I as appendToEvalOutput, J as runInEvalRuntimeScope, K as mergeEvalOutput, M as readManualInputFile, N as evalExpect, O as serializeCacheRecording, P as EvalAssertionError, Q as setEvalOutput, R as evalAssert, S as evalSpan, T as hashCacheKeySync, U as incrementEvalOutput, V as getCurrentScope, W as isInEvalScope, X as runInExistingEvalScope, Y as runInEvalScope, at as extractApiCalls, b as buildTraceTree, ct as simulateTokenAllocation, et as startEvalBackgroundJob, it as extractCacheHits, j as manualInputFileValueSchema, k as serializeCacheValue, ot as extractLlmCalls, q as nextEvalId, rt as extractCacheEntries, st as simulateLlmCallCost, ut as getNestedAttribute, w as hashCacheKey, x as captureEvalSpanError, z as evalLog } from "./runExecution-Bq0Y3y_1.mjs";
|
|
2
|
+
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-CbePEEua.mjs";
|
|
3
|
+
import { n as matchesEvalTags, t as defineEval } from "./src-CVM_FqPx.mjs";
|
|
4
4
|
export { EvalAssertionError, EvalRuntimeUsageError, appendToEvalOutput, buildTraceTree, captureEvalSpanError, cleanupStagedManualInputFiles, createRunner, defineEval, deserializeCacheRecording, deserializeCacheValue, evalAssert, evalExpect, evalLog, evalSpan, evalTime, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, getCurrentScope, getEvalCaseInput, getEvalRegistry, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, manualInputFileValueSchema, matchesEvalTags, materializeManualInputFiles, mergeEvalOutput, nextEvalId, readManualInputFile, repoFile, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, serializeCacheRecording, serializeCacheValue, setEvalOutput, setScopeCacheContext, simulateLlmCallCost, simulateTokenAllocation, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob };
|
package/dist/runChild.mjs
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { At as evalStatsConfigSchema, L as configureEvalRunLogs, Mt as evalChartsConfigSchema, Nt as columnDefSchema, Tt as buildEvalKey, bt as runManifestSchema, jt as manualInputDescriptorSchema, kt as evalStatAggregateSchema, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, tt as createRunRequestSchema, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-
|
|
2
|
-
import { S as parseEvalDiscovery, m as persistRunState, r as getTargetEvals$1, t as executeRun } from "./runOrchestration-
|
|
1
|
+
import { At as evalStatsConfigSchema, L as configureEvalRunLogs, Mt as evalChartsConfigSchema, Nt as columnDefSchema, Tt as buildEvalKey, bt as runManifestSchema, jt as manualInputDescriptorSchema, kt as evalStatAggregateSchema, l as registerAgentEvalsPackageResolutionHooks, p as loadConfig, tt as createRunRequestSchema, v as createFsCacheStore, xt as runSummarySchema, y as getCacheRetentionOptions } from "./runExecution-Bq0Y3y_1.mjs";
|
|
2
|
+
import { S as parseEvalDiscovery, m as persistRunState, r as getTargetEvals$1, t as executeRun } from "./runOrchestration-BpwW0AmB.mjs";
|
|
3
3
|
import { z } from "zod";
|
|
4
4
|
import { readFile } from "node:fs/promises";
|
|
5
5
|
import { relative } from "node:path";
|
|
@@ -289,7 +289,7 @@ z.object({
|
|
|
289
289
|
key: z.string(),
|
|
290
290
|
namespace: z.string(),
|
|
291
291
|
storedAt: z.string(),
|
|
292
|
-
/** Last successful cache
|
|
292
|
+
/** Last successful cache read or write time. Legacy entries may be `null`. */
|
|
293
293
|
lastAccessedAt: z.string().nullable()
|
|
294
294
|
});
|
|
295
295
|
z.object({
|
|
@@ -5395,7 +5395,7 @@ function createFsCacheStore(options) {
|
|
|
5395
5395
|
const index = await readNamespaceIndex(cacheDir, entry.namespace);
|
|
5396
5396
|
index.entries[entry.key] = {
|
|
5397
5397
|
storedAt: entry.storedAt,
|
|
5398
|
-
lastAccessedAt:
|
|
5398
|
+
lastAccessedAt: entry.storedAt,
|
|
5399
5399
|
blobRefs: await collectExternalJsonBlobRefs(entry, blobDirs)
|
|
5400
5400
|
};
|
|
5401
5401
|
await writeNamespaceIndex(cacheDir, index);
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { Dt as caseDetailSchema, Et as getCaseRowCaseKey, It as runWithEvalRegistry, J as runInEvalRuntimeScope, Ot as caseRowSchema, Z as runWithEvalClock, _t as matchesTagsFilter, bt as runManifestSchema, d as loadEvalModule, f as resolveEvalDefaultConfig, g as commitPendingCacheWrites, gt as dedupeEvalTags, ht as deriveStatusFromChildStatuses, i as isCaseChildMessage, m as buildDeclaredColumnDefs, mt as deriveStatusFromCaseRows, n as resolveRunnableEvalCases, o as stripTerminalControlCodes, pt as deriveScopedSummaryFromCases, t as filterEvalCases, u as runWithModuleIsolation, vt as validateEvalTagName, wt as buildCaseKey, xt as runSummarySchema, yt as validateTagsFilterExpression } from "./runExecution-
|
|
1
|
+
import { Dt as caseDetailSchema, Et as getCaseRowCaseKey, It as runWithEvalRegistry, J as runInEvalRuntimeScope, Ot as caseRowSchema, Z as runWithEvalClock, _t as matchesTagsFilter, bt as runManifestSchema, d as loadEvalModule, f as resolveEvalDefaultConfig, g as commitPendingCacheWrites, gt as dedupeEvalTags, ht as deriveStatusFromChildStatuses, i as isCaseChildMessage, m as buildDeclaredColumnDefs, mt as deriveStatusFromCaseRows, n as resolveRunnableEvalCases, o as stripTerminalControlCodes, pt as deriveScopedSummaryFromCases, t as filterEvalCases, u as runWithModuleIsolation, vt as validateEvalTagName, wt as buildCaseKey, xt as runSummarySchema, yt as validateTagsFilterExpression } from "./runExecution-Bq0Y3y_1.mjs";
|
|
2
2
|
import { Result, resultify } from "t-result";
|
|
3
3
|
import { readFile, readdir, rm, writeFile } from "node:fs/promises";
|
|
4
4
|
import { dirname, join } from "node:path";
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { n as createRunner } from "./cli-
|
|
2
|
-
import "./src-
|
|
1
|
+
import { n as createRunner } from "./cli-CbePEEua.mjs";
|
|
2
|
+
import "./src-CVM_FqPx.mjs";
|
|
3
3
|
//#region ../../apps/server/src/runner.ts
|
|
4
4
|
let runnerInstance = null;
|
|
5
5
|
function getRunnerInstance({ loadEnv = true } = {}) {
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
import { n as initRunner, t as getRunnerInstance } from "./runner-
|
|
1
|
+
import { n as initRunner, t as getRunnerInstance } from "./runner-Kp0JqxrU.mjs";
|
|
2
2
|
export { getRunnerInstance, initRunner };
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { G as matchesEvalTags$1, Pt as defineEval$1 } from "./runExecution-
|
|
2
|
-
import "./cli-
|
|
1
|
+
import { G as matchesEvalTags$1, Pt as defineEval$1 } from "./runExecution-Bq0Y3y_1.mjs";
|
|
2
|
+
import "./cli-CbePEEua.mjs";
|
|
3
3
|
//#region src/index.ts
|
|
4
4
|
/** Register an eval definition with typed tag support. */
|
|
5
5
|
function defineEval(definition) {
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@ls-stack/agent-eval",
|
|
3
|
-
"version": "0.60.
|
|
3
|
+
"version": "0.60.2",
|
|
4
4
|
"type": "module",
|
|
5
5
|
"bin": {
|
|
6
6
|
"agent-evals": "./dist/bin.mjs"
|
|
@@ -32,9 +32,9 @@
|
|
|
32
32
|
"devDependencies": {
|
|
33
33
|
"@types/node": "^24.7.2",
|
|
34
34
|
"typescript": "^5.9.2",
|
|
35
|
-
"@agent-evals/
|
|
35
|
+
"@agent-evals/runner": "0.0.1",
|
|
36
36
|
"@agent-evals/shared": "0.0.1",
|
|
37
|
-
"@agent-evals/
|
|
37
|
+
"@agent-evals/sdk": "0.0.1"
|
|
38
38
|
},
|
|
39
39
|
"scripts": {
|
|
40
40
|
"build": "pnpm --filter @agent-evals/web build && pnpm --filter @agent-evals/shared build && pnpm --filter @agent-evals/sdk build && pnpm --filter @agent-evals/runner build && tsdown --filter cli-js && tsdown --filter cli-types",
|
|
@@ -568,6 +568,8 @@ Mental model:
|
|
|
568
568
|
runner stays idle for `cache.pruneIdleDelayMs ?? 5000` milliseconds. Configure
|
|
569
569
|
`cache.maxEntries` as a number for the default cap, or as
|
|
570
570
|
`{ default, namespaces }` for exact namespace-specific caps.
|
|
571
|
+
Writes initialize the row's last access time to the stored time; later cache
|
|
572
|
+
hits refresh that timestamp at the configured access-time update interval.
|
|
571
573
|
- Unindexed legacy cache files are ignored by normal lookup/listing. Use
|
|
572
574
|
`agent-evals cache repair` to remove unindexed cache files, stale index rows,
|
|
573
575
|
debug sidecars, and unreferenced blob files.
|