@ls-stack/agent-eval 0.17.0 → 0.18.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,2 +1,2 @@
1
- import { n as initRunner, t as getRunnerInstance } from "./runner-BSXZiQIi.mjs";
1
+ import { n as initRunner, t as getRunnerInstance } from "./runner-RmZPRz-h.mjs";
2
2
  export { getRunnerInstance, initRunner };
@@ -1,5 +1,5 @@
1
- import { n as createRunner } from "./cli-CULTt3Xp.mjs";
2
- import "./src-CNf3xwVw.mjs";
1
+ import { n as createRunner } from "./cli-3zANEAhG.mjs";
2
+ import "./src-BC4OrajN.mjs";
3
3
  //#region ../../apps/server/src/runner.ts
4
4
  let runnerInstance = null;
5
5
  function getRunnerInstance() {
@@ -0,0 +1,3 @@
1
+ import "./runOrchestration-BBg_VUH5.mjs";
2
+ import "./cli-3zANEAhG.mjs";
3
+ export {};
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@ls-stack/agent-eval",
3
- "version": "0.17.0",
3
+ "version": "0.18.0",
4
4
  "type": "module",
5
5
  "bin": {
6
6
  "agent-evals": "./dist/bin.mjs"
@@ -55,8 +55,9 @@ a per-case sequence number, and throws outside an eval case scope.
55
55
  Use `evalLog(level, ...args)` for intentional per-case logs. The runner also
56
56
  captures `console.log`, `console.info`, `console.warn`, and `console.error`
57
57
  during case-owned phases by default; log arguments are stored as JSON-safe
58
- values and rendered with the JSON viewer, collapsed previews are capped, and
59
- logs inside cached operations are not replayed from cache hits.
58
+ values and rendered with the JSON viewer, collapsed previews include best-effort
59
+ code locations when stack data is available, previews are capped, and logs
60
+ inside cached operations are not replayed from cache hits.
60
61
 
61
62
  ### Product code (instrumented once, reused everywhere)
62
63
 
@@ -341,7 +342,8 @@ Mental model:
341
342
  - Authored raw cache keys are stored for debugging under
342
343
  `.agent-evals/cache-debug/<owner>.json`. This folder may include prompts,
343
344
  user inputs, or other sensitive data, should be gitignored, and is not needed
344
- for cache reuse. The UI Cache hits tab shows the raw key when it is available.
345
+ for cache reuse. The UI Cache tab shows the raw key when it is available and
346
+ can be filtered to hits or new entries added by cache misses/refreshes.
345
347
  - Cached payloads use advanced serialization/deserialization with the Web API plugin set, so return values and
346
348
  recorded SDK effects preserve richer built-ins such as `Date`, `Map`, `Set`,
347
349
  typed arrays, `URL`, `Headers`, `Blob`, and `File` on hits. Cache keys still