@ls-stack/agent-eval 0.33.0 → 0.34.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-Dc6vvHRL.mjs → app-DOE-crd0.mjs} +4 -4
- package/dist/apps/web/dist/assets/index-BJpxc61J.css +1 -0
- package/dist/apps/web/dist/assets/index-ol64metU.js +140 -0
- package/dist/apps/web/dist/index.html +2 -2
- package/dist/bin.mjs +1 -1
- package/dist/{cli-huuJbDNb.mjs → cli-CG66f0GN.mjs} +3 -3
- package/dist/index.d.mts +102 -102
- package/dist/index.mjs +3 -3
- package/dist/runChild.mjs +1 -1
- package/dist/{runOrchestration-ZpN7xty_.mjs → runOrchestration-CYhn4DJ0.mjs} +19 -55
- package/dist/{runner-BPXPvinB.mjs → runner-D5i7HLcE.mjs} +1 -1
- package/dist/{runner-Dkol2ukD.mjs → runner-j9b6g0h0.mjs} +2 -2
- package/dist/src-B0b1vgk0.mjs +3 -0
- package/package.json +3 -3
- package/skills/agent-eval/SKILL.md +7 -4
- package/dist/apps/web/dist/assets/index-BPMMRktE.css +0 -1
- package/dist/apps/web/dist/assets/index-BV_DM8fZ.js +0 -118
- package/dist/src-1Qvuh0NH.mjs +0 -3
|
@@ -25,8 +25,8 @@
|
|
|
25
25
|
href="https://fonts.googleapis.com/css2?family=Geist:wght@400;500;600&family=JetBrains+Mono:wght@400;500&display=swap"
|
|
26
26
|
rel="stylesheet"
|
|
27
27
|
/>
|
|
28
|
-
<script type="module" crossorigin src="/assets/index-BV_DM8fZ.js"></script>
|
|
29
|
-
<link rel="stylesheet" crossorigin href="/assets/index-BPMMRktE.css">
|
|
28
|
+
<script type="module" crossorigin src="/assets/index-ol64metU.js"></script>
|
|
29
|
+
<link rel="stylesheet" crossorigin href="/assets/index-BJpxc61J.css">
|
|
30
30
|
</head>
|
|
31
31
|
<body>
|
|
32
32
|
<div id="root"></div>
|
package/dist/bin.mjs
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { C as loadConfig, D as createFsCacheStore, E as validateCharts, H as getEvalDisplayStatus, S as resolveEvalDefaultConfig, T as normalizeScoreDef, U as deriveScopedSummaryFromCases, V as getEvalTitle, _ as buildManualInputDescriptor, a as getLastRunStatuses, b as loadEvalModule, bt as getCaseRowEvalKey, c as loadPersistedRunSnapshots, d as persistRunState, f as recomputeEvalStatusesInRuns, g as resolveArtifactPath, h as resolveTracePresentation, i as generateRunId, l as nextShortIdFromSnapshots, m as runTouchesEval, mt as resolveLlmCallsConfig, n as getTargetEvalKeys, o as getLatestRunInfos, p as recomputePersistedCaseStatus, pr as getEvalRegistry, pt as resolveApiCallsConfig, q as runSummarySchema, s as loadPersistedRunSnapshot, u as persistCaseDetail, v as parseManualInputValues, vt as buildEvalKey, w as buildDeclaredColumnDefs, x as parseEvalDiscovery, y as deriveEvalFreshness, yt as getCaseRowCaseKey, z as applyDerivedCallAttributes } from "./runOrchestration-ZpN7xty_.mjs";
|
|
1
|
+
import { C as loadConfig, D as createFsCacheStore, E as validateCharts, H as getEvalDisplayStatus, S as resolveEvalDefaultConfig, T as normalizeScoreDef, U as deriveScopedSummaryFromCases, V as getEvalTitle, _ as buildManualInputDescriptor, a as getLastRunStatuses, b as loadEvalModule, bt as getCaseRowEvalKey, c as loadPersistedRunSnapshots, d as persistRunState, f as recomputeEvalStatusesInRuns, g as resolveArtifactPath, h as resolveTracePresentation, i as generateRunId, l as nextShortIdFromSnapshots, m as runTouchesEval, mt as resolveLlmCallsConfig, n as getTargetEvalKeys, o as getLatestRunInfos, p as recomputePersistedCaseStatus, pr as getEvalRegistry, pt as resolveApiCallsConfig, q as runSummarySchema, s as loadPersistedRunSnapshot, u as persistCaseDetail, v as parseManualInputValues, vt as buildEvalKey, w as buildDeclaredColumnDefs, x as parseEvalDiscovery, y as deriveEvalFreshness, yt as getCaseRowCaseKey, z as applyDerivedCallAttributes } from "./runOrchestration-CYhn4DJ0.mjs";
|
|
2
2
|
import { createHash, randomUUID } from "node:crypto";
|
|
3
3
|
import { copyFile, mkdir, readFile, rm, writeFile } from "node:fs/promises";
|
|
4
4
|
import { basename, dirname, extname, isAbsolute, join, relative, resolve, sep } from "node:path";
|
|
@@ -1940,8 +1940,8 @@ async function commandApp(args) {
|
|
|
1940
1940
|
const { serve } = await import("@hono/node-server");
|
|
1941
1941
|
const bundledWebDist = resolve(currentDir, "apps/web/dist");
|
|
1942
1942
|
if (existsSync(bundledWebDist)) process.env.AGENT_EVALS_WEB_DIST = bundledWebDist;
|
|
1943
|
-
const appModule = await import("./app-Dc6vvHRL.mjs");
|
|
1944
|
-
const runnerModule = await import("./runner-BPXPvinB.mjs");
|
|
1943
|
+
const appModule = await import("./app-DOE-crd0.mjs");
|
|
1944
|
+
const runnerModule = await import("./runner-D5i7HLcE.mjs");
|
|
1945
1945
|
if (!isHonoAppModule(appModule)) throw new Error("Server app module is invalid");
|
|
1946
1946
|
if (!isServerRunnerModule(runnerModule)) throw new Error("Server runner module is invalid");
|
|
1947
1947
|
await runnerModule.initRunner();
|