@wix/evalforge-evaluator 0.122.0 → 0.123.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those package versions as they appear in their respective public registries.
@@ -9,10 +9,15 @@ import type { OpenCodeExecutionOptions, OpenCodeExecutionResult } from './types.
9
9
  */
10
10
  export declare function prepareOpenCodeEnvironment(cwd: string, skills: SkillWithLatestVersion[], options: Pick<OpenCodeExecutionOptions, 'mcps' | 'subAgents' | 'rules'>): Promise<void>;
11
11
  /**
12
- * Execute skills using the OpenCode CLI.
12
+ * Execute skills using the OpenCode CLI with automatic retry on idle timeouts.
13
13
  *
14
- * Spawns `opencode run --format json` with the trigger prompt, parses the
15
- * NDJSON events from stdout, and builds the trace/conversation from them.
14
+ * When the OpenCode process stalls (no output for 120s), it is killed and
15
+ * retried with a recovery prompt that carries context about work already done.
16
+ * This works around known OpenCode hanging issues where the upstream LLM
17
+ * connection stalls mid-stream.
18
+ *
19
+ * @see https://github.com/anomalyco/opencode/issues/13230 - Memory leak causes OOM
20
+ * @see https://github.com/anomalyco/opencode/issues/13841 - LLM connection stalls
16
21
  */
17
22
  export declare function executeWithOpenCode(skills: SkillWithLatestVersion[], scenario: TestScenario, options: OpenCodeExecutionOptions): Promise<{
18
23
  result: OpenCodeExecutionResult;
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@wix/evalforge-evaluator",
3
- "version": "0.122.0",
3
+ "version": "0.123.0",
4
4
  "description": "EvalForge Evaluator",
5
5
  "bin": "./build/index.js",
6
6
  "files": [
@@ -62,5 +62,5 @@
62
62
  "artifactId": "evalforge-evaluator"
63
63
  }
64
64
  },
65
- "falconPackageHash": "723dce09677b21f37f8754eb54c9660ce559159542bb2d2a43ae49db"
65
+ "falconPackageHash": "909d0a5e5ceffeabc71d45e03e964c3d4a5b0466111f64147fb09d83"
66
66
  }