@wix/evalforge-evaluator 0.139.0 → 0.140.0

This diff shows the changes between publicly available versions of the package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between package versions as they appear in their respective public registries.
@@ -1,11 +1,11 @@
1
- import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage } from '@wix/evalforge-types';
1
+ import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage, TriggerPromptImage } from '@wix/evalforge-types';
2
2
  import type { ClaudeCodeExecutionOptions, ClaudeCodeExecutionResult } from './types.js';
3
3
  /**
4
4
  * Import SDK types directly from Claude Agent SDK.
5
5
  * Type-only imports are erased at compile time - zero runtime overhead.
6
6
  * The SDK is still dynamically imported at runtime in executeWithClaudeCode().
7
7
  */
8
- import type { SDKMessage } from '@anthropic-ai/claude-agent-sdk' with { 'resolution-mode': 'import' };
8
+ import type { SDKUserMessage, SDKMessage } from '@anthropic-ai/claude-agent-sdk' with { 'resolution-mode': 'import' };
9
9
  /**
10
10
  * Message with timestamp — tracks when each message was received.
11
11
  */
@@ -13,6 +13,16 @@ export interface TimestampedMessage {
13
13
  message: SDKMessage;
14
14
  receivedAt: Date;
15
15
  }
16
+ /**
17
+ * Build an async iterable that yields a user message with images.
18
+ * When images are attached to the trigger prompt, this allows multimodal input
19
+ * to the Claude Agent SDK via content blocks (text + image).
20
+ *
21
+ * @param triggerPrompt - The text prompt to send
22
+ * @param images - Array of images with base64 data and metadata
23
+ * @returns An async iterable yielding a single SDKUserMessage
24
+ */
25
+ export declare function buildPromptStream(triggerPrompt: string, images: TriggerPromptImage[]): AsyncIterable<SDKUserMessage>;
16
26
  /**
17
27
  * Write all infrastructure files (settings, MCPs, sub-agents, rules, skills)
18
28
  * to the working directory. Called by the adapter's `prepareEnvironment()` so
@@ -1,5 +1,17 @@
1
- import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage } from '@wix/evalforge-types';
1
+ import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage, TriggerPromptImage } from '@wix/evalforge-types';
2
2
  import type { OpenCodeExecutionOptions, OpenCodeExecutionResult } from './types.js';
3
+ /**
4
+ * Write trigger prompt images to disk so they can be passed via --file flags.
5
+ *
6
+ * Note: OpenCode CLI's --file flag currently has a known MIME-type detection bug
7
+ * (hardcodes text/plain for all files). Images are still written to the cwd so the
8
+ * agent can access them via its tools even if the CLI doesn't render them visually.
9
+ *
10
+ * @param cwd - Working directory where images will be written
11
+ * @param images - Array of images with base64 data and metadata
12
+ * @returns Array of absolute file paths for the written images
13
+ */
14
+ export declare function writePromptImages(cwd: string, images: TriggerPromptImage[]): Promise<string[]>;
3
15
  /**
4
16
  * Write all infrastructure files (sub-agents, rules, skills)
5
17
  * to the working directory. Called by the adapter's `prepareEnvironment()` so
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@wix/evalforge-evaluator",
3
- "version": "0.139.0",
3
+ "version": "0.140.0",
4
4
  "description": "EvalForge Evaluator",
5
5
  "bin": "./build/index.js",
6
6
  "files": [
@@ -21,9 +21,9 @@
21
21
  "@ai-sdk/openai": "^3.0.39",
22
22
  "@anthropic-ai/claude-agent-sdk": "^0.2.63",
23
23
  "@anthropic-ai/claude-code": "^2.1.63",
24
- "@wix/eval-assertions": "0.42.0",
25
- "@wix/evalforge-github-client": "0.46.0",
26
- "@wix/evalforge-types": "0.71.0",
24
+ "@wix/eval-assertions": "0.43.0",
25
+ "@wix/evalforge-github-client": "0.47.0",
26
+ "@wix/evalforge-types": "0.72.0",
27
27
  "ai": "^6.0.107",
28
28
  "diff": "^7.0.0",
29
29
  "tar": "^7.5.3",
@@ -62,5 +62,5 @@
62
62
  "artifactId": "evalforge-evaluator"
63
63
  }
64
64
  },
65
- "falconPackageHash": "5bb57c48b8bf1e552339edfe3952c4156ed91c946c2701fad8e2778f"
65
+ "falconPackageHash": "ff3677bd864b44dbb26d0cf845d0e17f4039fe8031366a11a13e2cf1"
66
66
  }