@wix/evalforge-types 0.54.0 → 0.56.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/index.js +59 -921
- package/build/index.js.map +4 -4
- package/build/index.mjs +57 -921
- package/build/index.mjs.map +4 -4
- package/build/types/common/models.d.ts +30 -22
- package/build/types/evaluation/eval-result.d.ts +4 -0
- package/build/types/evaluation/eval-run.d.ts +5 -0
- package/build/types/evaluation/metrics.d.ts +4 -0
- package/build/types/target/agent.d.ts +2 -1
- package/package.json +2 -3
|
@@ -1,34 +1,32 @@
|
|
|
1
1
|
import { z } from 'zod';
|
|
2
|
-
import { AnthropicModel as _AnthropicModel, Model as _OpenAIModel } from '@wix/ambassador-ds-wix-ai-gateway-v1-prompt/types';
|
|
3
2
|
/**
|
|
4
3
|
* Curated model sets — only models suitable for code generation.
|
|
5
|
-
*
|
|
6
|
-
* completion-only, and non-text models.
|
|
4
|
+
* Uses official/canonical model IDs (not internal gateway enums).
|
|
7
5
|
* Update these explicitly when new models become available.
|
|
8
6
|
*/
|
|
9
7
|
export declare const ClaudeModel: {
|
|
10
|
-
readonly CLAUDE_4_SONNET_1_0:
|
|
11
|
-
readonly CLAUDE_4_OPUS_1_0:
|
|
12
|
-
readonly CLAUDE_4_5_SONNET_1_0:
|
|
13
|
-
readonly CLAUDE_4_5_HAIKU_1_0:
|
|
14
|
-
readonly CLAUDE_4_5_OPUS_1_0:
|
|
15
|
-
readonly CLAUDE_4_6_SONNET_1_0:
|
|
16
|
-
readonly CLAUDE_4_6_OPUS_1_0:
|
|
8
|
+
readonly CLAUDE_4_SONNET_1_0: "claude-sonnet-4";
|
|
9
|
+
readonly CLAUDE_4_OPUS_1_0: "claude-opus-4";
|
|
10
|
+
readonly CLAUDE_4_5_SONNET_1_0: "claude-sonnet-4-5";
|
|
11
|
+
readonly CLAUDE_4_5_HAIKU_1_0: "claude-haiku-4-5";
|
|
12
|
+
readonly CLAUDE_4_5_OPUS_1_0: "claude-opus-4-5";
|
|
13
|
+
readonly CLAUDE_4_6_SONNET_1_0: "claude-sonnet-4-6";
|
|
14
|
+
readonly CLAUDE_4_6_OPUS_1_0: "claude-opus-4-6";
|
|
17
15
|
};
|
|
18
16
|
export type ClaudeModel = (typeof ClaudeModel)[keyof typeof ClaudeModel];
|
|
19
17
|
export declare const OpenAIModel: {
|
|
20
|
-
readonly GPT_4O_MINI_2024_07_18:
|
|
21
|
-
readonly GPT_4O_2024_11_20:
|
|
22
|
-
readonly O1_2024_12_17:
|
|
23
|
-
readonly O3_MINI_2025_01_31:
|
|
24
|
-
readonly GPT_4_1_2025_04_14:
|
|
25
|
-
readonly GPT_4_1_MINI_2025_04_14:
|
|
26
|
-
readonly GPT_4_1_NANO_2025_04_14:
|
|
27
|
-
readonly O3_2025_04_16:
|
|
28
|
-
readonly O4_MINI_2025_04_16:
|
|
29
|
-
readonly GPT_5_2025_08_07:
|
|
30
|
-
readonly GPT_5_MINI_2025_08_07:
|
|
31
|
-
readonly GPT_5_NANO_2025_08_07:
|
|
18
|
+
readonly GPT_4O_MINI_2024_07_18: "gpt-4o-mini";
|
|
19
|
+
readonly GPT_4O_2024_11_20: "gpt-4o";
|
|
20
|
+
readonly O1_2024_12_17: "o1";
|
|
21
|
+
readonly O3_MINI_2025_01_31: "o3-mini";
|
|
22
|
+
readonly GPT_4_1_2025_04_14: "gpt-4.1";
|
|
23
|
+
readonly GPT_4_1_MINI_2025_04_14: "gpt-4.1-mini";
|
|
24
|
+
readonly GPT_4_1_NANO_2025_04_14: "gpt-4.1-nano";
|
|
25
|
+
readonly O3_2025_04_16: "o3";
|
|
26
|
+
readonly O4_MINI_2025_04_16: "o4-mini";
|
|
27
|
+
readonly GPT_5_2025_08_07: "gpt-5";
|
|
28
|
+
readonly GPT_5_MINI_2025_08_07: "gpt-5-mini";
|
|
29
|
+
readonly GPT_5_NANO_2025_08_07: "gpt-5-nano";
|
|
32
30
|
};
|
|
33
31
|
export type OpenAIModel = (typeof OpenAIModel)[keyof typeof OpenAIModel];
|
|
34
32
|
export declare const AVAILABLE_CLAUDE_MODEL_IDS: ClaudeModel[];
|
|
@@ -50,6 +48,16 @@ export declare const ALL_AVAILABLE_MODEL_IDS: string[];
|
|
|
50
48
|
export declare const AnyModelSchema: z.ZodEnum<{
|
|
51
49
|
[x: string]: string;
|
|
52
50
|
}>;
|
|
51
|
+
/**
|
|
52
|
+
* Maps legacy Wix AI Gateway enum strings to official model IDs.
|
|
53
|
+
* Used for backward compatibility with stored data (DB, eval traces).
|
|
54
|
+
*/
|
|
55
|
+
export declare const LEGACY_MODEL_ID_MAP: Record<string, string>;
|
|
56
|
+
/**
|
|
57
|
+
* Normalize a model ID: translates legacy gateway enum strings to
|
|
58
|
+
* official model IDs. Returns the input unchanged if already canonical.
|
|
59
|
+
*/
|
|
60
|
+
export declare function normalizeModelId(modelId: string): string;
|
|
53
61
|
export declare const ModelConfigSchema: z.ZodObject<{
|
|
54
62
|
model: z.ZodEnum<{
|
|
55
63
|
[x: string]: string;
|
|
@@ -45,6 +45,7 @@ export declare const AssertionResultSchema: z.ZodObject<{
|
|
|
45
45
|
outputPreview: z.ZodOptional<z.ZodString>;
|
|
46
46
|
success: z.ZodBoolean;
|
|
47
47
|
error: z.ZodOptional<z.ZodString>;
|
|
48
|
+
turnIndex: z.ZodOptional<z.ZodNumber>;
|
|
48
49
|
}, z.core.$strip>>>;
|
|
49
50
|
}, z.core.$strip>;
|
|
50
51
|
export type AssertionResult = z.infer<typeof AssertionResultSchema>;
|
|
@@ -98,6 +99,7 @@ export declare const EvalRunResultSchema: z.ZodObject<{
|
|
|
98
99
|
outputPreview: z.ZodOptional<z.ZodString>;
|
|
99
100
|
success: z.ZodBoolean;
|
|
100
101
|
error: z.ZodOptional<z.ZodString>;
|
|
102
|
+
turnIndex: z.ZodOptional<z.ZodNumber>;
|
|
101
103
|
}, z.core.$strip>>>;
|
|
102
104
|
}, z.core.$strip>>;
|
|
103
105
|
metrics: z.ZodOptional<z.ZodObject<{
|
|
@@ -167,9 +169,11 @@ export declare const EvalRunResultSchema: z.ZodObject<{
|
|
|
167
169
|
outputPreview: z.ZodOptional<z.ZodString>;
|
|
168
170
|
success: z.ZodBoolean;
|
|
169
171
|
error: z.ZodOptional<z.ZodString>;
|
|
172
|
+
turnIndex: z.ZodOptional<z.ZodNumber>;
|
|
170
173
|
}, z.core.$strip>>;
|
|
171
174
|
summary: z.ZodObject<{
|
|
172
175
|
totalSteps: z.ZodNumber;
|
|
176
|
+
totalTurns: z.ZodOptional<z.ZodNumber>;
|
|
173
177
|
totalDurationMs: z.ZodNumber;
|
|
174
178
|
totalTokens: z.ZodObject<{
|
|
175
179
|
prompt: z.ZodNumber;
|
|
@@ -287,6 +287,7 @@ export declare const EvalRunSchema: z.ZodObject<{
|
|
|
287
287
|
outputPreview: z.ZodOptional<z.ZodString>;
|
|
288
288
|
success: z.ZodBoolean;
|
|
289
289
|
error: z.ZodOptional<z.ZodString>;
|
|
290
|
+
turnIndex: z.ZodOptional<z.ZodNumber>;
|
|
290
291
|
}, z.core.$strip>>>;
|
|
291
292
|
}, z.core.$strip>>;
|
|
292
293
|
metrics: z.ZodOptional<z.ZodObject<{
|
|
@@ -356,9 +357,11 @@ export declare const EvalRunSchema: z.ZodObject<{
|
|
|
356
357
|
outputPreview: z.ZodOptional<z.ZodString>;
|
|
357
358
|
success: z.ZodBoolean;
|
|
358
359
|
error: z.ZodOptional<z.ZodString>;
|
|
360
|
+
turnIndex: z.ZodOptional<z.ZodNumber>;
|
|
359
361
|
}, z.core.$strip>>;
|
|
360
362
|
summary: z.ZodObject<{
|
|
361
363
|
totalSteps: z.ZodNumber;
|
|
364
|
+
totalTurns: z.ZodOptional<z.ZodNumber>;
|
|
362
365
|
totalDurationMs: z.ZodNumber;
|
|
363
366
|
totalTokens: z.ZodObject<{
|
|
364
367
|
prompt: z.ZodNumber;
|
|
@@ -468,6 +471,7 @@ export declare const EvalRunSchema: z.ZodObject<{
|
|
|
468
471
|
}, z.core.$strip>>>;
|
|
469
472
|
llmTraceSummary: z.ZodOptional<z.ZodObject<{
|
|
470
473
|
totalSteps: z.ZodNumber;
|
|
474
|
+
totalTurns: z.ZodOptional<z.ZodNumber>;
|
|
471
475
|
totalDurationMs: z.ZodNumber;
|
|
472
476
|
totalTokens: z.ZodObject<{
|
|
473
477
|
prompt: z.ZodNumber;
|
|
@@ -597,6 +601,7 @@ export declare const CreateEvalRunInputSchema: z.ZodObject<{
|
|
|
597
601
|
}, z.core.$strip>>>;
|
|
598
602
|
llmTraceSummary: z.ZodOptional<z.ZodObject<{
|
|
599
603
|
totalSteps: z.ZodNumber;
|
|
604
|
+
totalTurns: z.ZodOptional<z.ZodNumber>;
|
|
600
605
|
totalDurationMs: z.ZodNumber;
|
|
601
606
|
totalTokens: z.ZodObject<{
|
|
602
607
|
prompt: z.ZodNumber;
|
|
@@ -65,6 +65,7 @@ export declare const LLMTraceStepSchema: z.ZodObject<{
|
|
|
65
65
|
outputPreview: z.ZodOptional<z.ZodString>;
|
|
66
66
|
success: z.ZodBoolean;
|
|
67
67
|
error: z.ZodOptional<z.ZodString>;
|
|
68
|
+
turnIndex: z.ZodOptional<z.ZodNumber>;
|
|
68
69
|
}, z.core.$strip>;
|
|
69
70
|
export type LLMTraceStep = z.infer<typeof LLMTraceStepSchema>;
|
|
70
71
|
/**
|
|
@@ -82,6 +83,7 @@ export type LLMBreakdownStats = z.infer<typeof LLMBreakdownStatsSchema>;
|
|
|
82
83
|
*/
|
|
83
84
|
export declare const LLMTraceSummarySchema: z.ZodObject<{
|
|
84
85
|
totalSteps: z.ZodNumber;
|
|
86
|
+
totalTurns: z.ZodOptional<z.ZodNumber>;
|
|
85
87
|
totalDurationMs: z.ZodNumber;
|
|
86
88
|
totalTokens: z.ZodObject<{
|
|
87
89
|
prompt: z.ZodNumber;
|
|
@@ -129,9 +131,11 @@ export declare const LLMTraceSchema: z.ZodObject<{
|
|
|
129
131
|
outputPreview: z.ZodOptional<z.ZodString>;
|
|
130
132
|
success: z.ZodBoolean;
|
|
131
133
|
error: z.ZodOptional<z.ZodString>;
|
|
134
|
+
turnIndex: z.ZodOptional<z.ZodNumber>;
|
|
132
135
|
}, z.core.$strip>>;
|
|
133
136
|
summary: z.ZodObject<{
|
|
134
137
|
totalSteps: z.ZodNumber;
|
|
138
|
+
totalTurns: z.ZodOptional<z.ZodNumber>;
|
|
135
139
|
totalDurationMs: z.ZodNumber;
|
|
136
140
|
totalTokens: z.ZodObject<{
|
|
137
141
|
prompt: z.ZodNumber;
|
|
@@ -28,7 +28,8 @@ export declare const AGENT_TYPE_LABELS: Record<AgentTypeValue, string>;
|
|
|
28
28
|
* When adding a new CLI agent adapter, add its command here first.
|
|
29
29
|
*/
|
|
30
30
|
export declare enum AgentRunCommand {
|
|
31
|
-
CLAUDE = "claude"
|
|
31
|
+
CLAUDE = "claude",
|
|
32
|
+
OPENCODE = "opencode"
|
|
32
33
|
}
|
|
33
34
|
/** All available run commands for use in dropdowns and validation. */
|
|
34
35
|
export declare const AVAILABLE_RUN_COMMANDS: AgentRunCommand[];
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@wix/evalforge-types",
|
|
3
|
-
"version": "0.54.0",
|
|
3
|
+
"version": "0.56.0",
|
|
4
4
|
"description": "Unified types for EvalForge agent evaluation system",
|
|
5
5
|
"files": [
|
|
6
6
|
"build"
|
|
@@ -20,7 +20,6 @@
|
|
|
20
20
|
"devDependencies": {
|
|
21
21
|
"@eslint/js": "^9.39.2",
|
|
22
22
|
"@types/node": "^22.19.3",
|
|
23
|
-
"@wix/ambassador-ds-wix-ai-gateway-v1-prompt": "^1.0.312",
|
|
24
23
|
"esbuild": "^0.27.2",
|
|
25
24
|
"eslint": "^9.39.2",
|
|
26
25
|
"eslint-config-prettier": "^10.1.8",
|
|
@@ -47,5 +46,5 @@
|
|
|
47
46
|
"artifactId": "evalforge-types"
|
|
48
47
|
}
|
|
49
48
|
},
|
|
50
|
-
"falconPackageHash": "
|
|
49
|
+
"falconPackageHash": "331ddbd68218e960214d7b75e497534e88fa193a082b6fd1fb9a922f"
|
|
51
50
|
}
|