@ls-stack/agent-eval 0.40.0 → 0.41.0
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- package/dist/{app-0k8Y1OBk.mjs → app-1vE5Ryry.mjs} +5 -5
- package/dist/apps/web/dist/assets/index-DKfAipoE.js +140 -0
- package/dist/apps/web/dist/assets/{index-C58_zLA9.css → index-pKAZgRwO.css} +1 -1
- package/dist/apps/web/dist/index.html +2 -2
- package/dist/bin.mjs +1 -1
- package/dist/{cli-Sg8UdOnm.mjs → cli-Bk5g-bat.mjs} +43 -11
- package/dist/index.d.mts +3118 -3452
- package/dist/index.mjs +4 -4
- package/dist/runChild.mjs +5 -3
- package/dist/{runOrchestration-CTzVNrDP.mjs → runOrchestration-DhTiT4V0.mjs} +4635 -4262
- package/dist/{runner-njK_CtXC.mjs → runner-B1Cyevvr.mjs} +1 -1
- package/dist/{runner-Bb9JdFkg.mjs → runner-BG0L4yId.mjs} +2 -2
- package/dist/src-t6OVp1li.mjs +13 -0
- package/package.json +1 -1
- package/skills/agent-eval/SKILL.md +21 -1
- package/dist/apps/web/dist/assets/index-C4v6dWcv.js +0 -140
- package/dist/src-BZzPFS8r.mjs +0 -3
package/dist/index.mjs
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { $ as
|
|
2
|
-
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-
|
|
3
|
-
import "./src-
|
|
4
|
-
export {
|
|
1
|
+
import { $ as getCurrentScope, B as deserializeCacheValue, F as evalSpan, G as readManualInputFile, H as serializeCacheValue, I as evalTracer, J as appendToEvalOutput, K as evalExpect, L as hashCacheKey, M as z, N as buildTraceTree, P as captureEvalSpanError, Q as evalTime, R as hashCacheKeySync, Rt as getEvalRegistry, U as repoFile, V as serializeCacheRecording, W as manualInputFileValueSchema, X as evalAssert, Z as evalLog, _t as extractLlmCalls, at as nextEvalId, ct as runInExistingEvalScope, dt as startEvalBackgroundJob, et as getEvalCaseInput, gt as extractApiCalls, ht as extractCacheHits, it as mergeEvalOutput, lt as setEvalOutput, mt as extractCacheEntries, nt as isInEvalScope, ot as runInEvalRuntimeScope, q as EvalAssertionError, st as runInEvalScope, tt as incrementEvalOutput, ut as setScopeCacheContext, vt as simulateLlmCallCost, xt as getNestedAttribute, yt as simulateTokenAllocation, z as deserializeCacheRecording } from "./runOrchestration-DhTiT4V0.mjs";
|
|
2
|
+
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-Bk5g-bat.mjs";
|
|
3
|
+
import { n as matchesEvalTags, t as defineEval } from "./src-t6OVp1li.mjs";
|
|
4
|
+
export { EvalAssertionError, appendToEvalOutput, buildTraceTree, captureEvalSpanError, cleanupStagedManualInputFiles, createRunner, defineEval, deserializeCacheRecording, deserializeCacheValue, evalAssert, evalExpect, evalLog, evalSpan, evalTime, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, getCurrentScope, getEvalCaseInput, getEvalRegistry, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, manualInputFileValueSchema, matchesEvalTags, materializeManualInputFiles, mergeEvalOutput, nextEvalId, readManualInputFile, repoFile, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, serializeCacheRecording, serializeCacheValue, setEvalOutput, setScopeCacheContext, simulateLlmCallCost, simulateTokenAllocation, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, z };
|
package/dist/runChild.mjs
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
|
-
import { At as
|
|
2
|
-
import {
|
|
1
|
+
import { At as buildEvalKey, D as loadConfig, Dt as runSummarySchema, Et as runManifestSchema, Ft as evalChartsConfigSchema, It as columnDefSchema, Nt as evalStatsConfigSchema, Pt as manualInputDescriptorSchema, T as parseEvalDiscovery, Y as configureEvalRunLogs, ft as createRunRequestSchema, h as persistRunState, j as createFsCacheStore, r as getTargetEvals$1, t as executeRun } from "./runOrchestration-DhTiT4V0.mjs";
|
|
2
|
+
import { z } from "zod/v4";
|
|
3
3
|
import { readFile } from "node:fs/promises";
|
|
4
4
|
import { relative } from "node:path";
|
|
5
|
-
import {
|
|
5
|
+
import { createHash } from "node:crypto";
|
|
6
6
|
import { glob } from "glob";
|
|
7
7
|
//#region ../runner/src/runChild.ts
|
|
8
8
|
const evalMetaSchema = z.object({
|
|
@@ -10,6 +10,7 @@ const evalMetaSchema = z.object({
|
|
|
10
10
|
id: z.string(),
|
|
11
11
|
title: z.string().optional(),
|
|
12
12
|
filePath: z.string(),
|
|
13
|
+
tags: z.array(z.string()).default([]),
|
|
13
14
|
sourceFilePath: z.string(),
|
|
14
15
|
sourceFingerprint: z.string().nullable(),
|
|
15
16
|
columnDefs: z.array(columnDefSchema),
|
|
@@ -109,6 +110,7 @@ async function discoverRunEvals(params) {
|
|
|
109
110
|
id: meta.id,
|
|
110
111
|
title: meta.title,
|
|
111
112
|
filePath: relativeFilePath,
|
|
113
|
+
tags: [],
|
|
112
114
|
sourceFilePath: meta.filePath,
|
|
113
115
|
sourceFingerprint,
|
|
114
116
|
columnDefs: [],
|