@wix/evalforge-evaluator 0.138.0 → 0.140.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
|
@@ -1,11 +1,11 @@
|
|
|
1
|
-
import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage } from '@wix/evalforge-types';
|
|
1
|
+
import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage, TriggerPromptImage } from '@wix/evalforge-types';
|
|
2
2
|
import type { ClaudeCodeExecutionOptions, ClaudeCodeExecutionResult } from './types.js';
|
|
3
3
|
/**
|
|
4
4
|
* Import SDK types directly from Claude Agent SDK.
|
|
5
5
|
* Type-only imports are erased at compile time - zero runtime overhead.
|
|
6
6
|
* The SDK is still dynamically imported at runtime in executeWithClaudeCode().
|
|
7
7
|
*/
|
|
8
|
-
import type { SDKMessage } from '@anthropic-ai/claude-agent-sdk' with { 'resolution-mode': 'import' };
|
|
8
|
+
import type { SDKUserMessage, SDKMessage } from '@anthropic-ai/claude-agent-sdk' with { 'resolution-mode': 'import' };
|
|
9
9
|
/**
|
|
10
10
|
* Message with timestamp — tracks when each message was received.
|
|
11
11
|
*/
|
|
@@ -13,6 +13,16 @@ export interface TimestampedMessage {
|
|
|
13
13
|
message: SDKMessage;
|
|
14
14
|
receivedAt: Date;
|
|
15
15
|
}
|
|
16
|
+
/**
|
|
17
|
+
* Build an async iterable that yields a user message with images.
|
|
18
|
+
* When images are attached to the trigger prompt, this allows multimodal input
|
|
19
|
+
* to the Claude Agent SDK via content blocks (text + image).
|
|
20
|
+
*
|
|
21
|
+
* @param triggerPrompt - The text prompt to send
|
|
22
|
+
* @param images - Array of images with base64 data and metadata
|
|
23
|
+
* @returns An async iterable yielding a single SDKUserMessage
|
|
24
|
+
*/
|
|
25
|
+
export declare function buildPromptStream(triggerPrompt: string, images: TriggerPromptImage[]): AsyncIterable<SDKUserMessage>;
|
|
16
26
|
/**
|
|
17
27
|
* Write all infrastructure files (settings, MCPs, sub-agents, rules, skills)
|
|
18
28
|
* to the working directory. Called by the adapter's `prepareEnvironment()` so
|
|
@@ -1,5 +1,17 @@
|
|
|
1
|
-
import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage } from '@wix/evalforge-types';
|
|
1
|
+
import type { SkillWithLatestVersion, TestScenario, LLMTrace, ConversationMessage, TriggerPromptImage } from '@wix/evalforge-types';
|
|
2
2
|
import type { OpenCodeExecutionOptions, OpenCodeExecutionResult } from './types.js';
|
|
3
|
+
/**
|
|
4
|
+
* Write trigger prompt images to disk so they can be passed via --file flags.
|
|
5
|
+
*
|
|
6
|
+
* Note: OpenCode CLI's --file flag currently has a known MIME-type detection bug
|
|
7
|
+
* (hardcodes text/plain for all files). Images are still written to the cwd so the
|
|
8
|
+
* agent can access them via its tools even if the CLI doesn't render them visually.
|
|
9
|
+
*
|
|
10
|
+
* @param cwd - Working directory where images will be written
|
|
11
|
+
* @param images - Array of images with base64 data and metadata
|
|
12
|
+
* @returns Array of absolute file paths for the written images
|
|
13
|
+
*/
|
|
14
|
+
export declare function writePromptImages(cwd: string, images: TriggerPromptImage[]): Promise<string[]>;
|
|
3
15
|
/**
|
|
4
16
|
* Write all infrastructure files (sub-agents, rules, skills)
|
|
5
17
|
* to the working directory. Called by the adapter's `prepareEnvironment()` so
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@wix/evalforge-evaluator",
|
|
3
|
-
"version": "0.138.0",
|
|
3
|
+
"version": "0.140.0",
|
|
4
4
|
"description": "EvalForge Evaluator",
|
|
5
5
|
"bin": "./build/index.js",
|
|
6
6
|
"files": [
|
|
@@ -21,9 +21,9 @@
|
|
|
21
21
|
"@ai-sdk/openai": "^3.0.39",
|
|
22
22
|
"@anthropic-ai/claude-agent-sdk": "^0.2.63",
|
|
23
23
|
"@anthropic-ai/claude-code": "^2.1.63",
|
|
24
|
-
"@wix/eval-assertions": "0.
|
|
25
|
-
"@wix/evalforge-github-client": "0.
|
|
26
|
-
"@wix/evalforge-types": "0.
|
|
24
|
+
"@wix/eval-assertions": "0.43.0",
|
|
25
|
+
"@wix/evalforge-github-client": "0.47.0",
|
|
26
|
+
"@wix/evalforge-types": "0.72.0",
|
|
27
27
|
"ai": "^6.0.107",
|
|
28
28
|
"diff": "^7.0.0",
|
|
29
29
|
"tar": "^7.5.3",
|
|
@@ -62,5 +62,5 @@
|
|
|
62
62
|
"artifactId": "evalforge-evaluator"
|
|
63
63
|
}
|
|
64
64
|
},
|
|
65
|
-
"falconPackageHash": "
|
|
65
|
+
"falconPackageHash": "ff3677bd864b44dbb26d0cf845d0e17f4039fe8031366a11a13e2cf1"
|
|
66
66
|
}
|