@wix/evalforge-evaluator 0.154.0 → 0.156.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -9,6 +9,12 @@ export interface EvaluationLoopResult {
9
9
  completedExecutions: number;
10
10
  totalExecutions: number;
11
11
  erroredExecutions: number;
12
+ /**
13
+ * `outputText` of the first errored iteration (already prefixed with
14
+ * `"Execution error: "`). Captured so the entry-point can surface a
15
+ * representative error on the eval run row when every iteration errors.
16
+ */
17
+ firstErrorMessage?: string;
12
18
  }
13
19
  /**
14
20
  * Run all scenarios with iteration support.
@@ -0,0 +1,9 @@
1
+ export declare const UNLIMITED_RUN_TIMEOUT_MS: number;
2
+ /**
3
+ * Returns the wall-clock timeout for an agent execution.
4
+ *
5
+ * - Explicit `maxDurationMs` always wins.
6
+ * - Unlimited runs (`maxTurns === undefined`) get a 60-minute ceiling.
7
+ * - Capped runs get 1 minute per turn, floored at 5 minutes.
8
+ */
9
+ export declare function resolveTimeoutMs(maxTurns: number | undefined, maxDurationMs?: number): number;
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@wix/evalforge-evaluator",
3
- "version": "0.154.0",
3
+ "version": "0.156.0",
4
4
  "description": "EvalForge Evaluator",
5
5
  "bin": "./build/index.js",
6
6
  "files": [
@@ -63,5 +63,5 @@
63
63
  "artifactId": "evalforge-evaluator"
64
64
  }
65
65
  },
66
- "falconPackageHash": "c7af564ff189446a75e14e4d8053306774bcc500994454fec9ef687d"
66
+ "falconPackageHash": "b5977845c3a2e20a607b203191c76ab11f088863d7253b2235a29415"
67
67
  }