@wix/evalforge-types 0.46.0 → 0.48.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/index.js +25 -13
- package/build/index.js.map +2 -2
- package/build/index.mjs +24 -12
- package/build/index.mjs.map +2 -2
- package/build/types/common/models.d.ts +1 -1
- package/build/types/evaluation/eval-run.d.ts +7 -1
- package/build/types/project/project.d.ts +3 -0
- package/build/types/scenario/test-scenario.d.ts +3 -0
- package/package.json +2 -2
package/build/index.js
CHANGED
|
@@ -22,7 +22,7 @@ var index_exports = {};
|
|
|
22
22
|
__export(index_exports, {
|
|
23
23
|
AGENT_TYPE_LABELS: () => AGENT_TYPE_LABELS,
|
|
24
24
|
ALL_AVAILABLE_MODEL_IDS: () => ALL_AVAILABLE_MODEL_IDS,
|
|
25
|
-
|
|
25
|
+
AVAILABLE_CLAUDE_MODEL_IDS: () => AVAILABLE_CLAUDE_MODEL_IDS,
|
|
26
26
|
AVAILABLE_OPENAI_MODEL_IDS: () => AVAILABLE_OPENAI_MODEL_IDS,
|
|
27
27
|
AVAILABLE_RUN_COMMANDS: () => AVAILABLE_RUN_COMMANDS,
|
|
28
28
|
AVAILABLE_TOOL_NAMES: () => AVAILABLE_TOOL_NAMES,
|
|
@@ -1119,17 +1119,17 @@ var WebhookIdentityType;
|
|
|
1119
1119
|
})(WebhookIdentityType || (WebhookIdentityType = {}));
|
|
1120
1120
|
|
|
1121
1121
|
// src/common/models.ts
|
|
1122
|
-
var
|
|
1122
|
+
var AVAILABLE_CLAUDE_MODEL_IDS = Object.values(
|
|
1123
1123
|
ClaudeModel
|
|
1124
1124
|
).filter(
|
|
1125
1125
|
(v) => typeof v === "string" && v !== ClaudeModel.UNKNOWN_CLAUDE_MODEL
|
|
1126
1126
|
);
|
|
1127
1127
|
var PREFERRED_JUDGE_MODEL = "CLAUDE_4_5_HAIKU_1_0";
|
|
1128
|
-
var DEFAULT_JUDGE_MODEL =
|
|
1128
|
+
var DEFAULT_JUDGE_MODEL = AVAILABLE_CLAUDE_MODEL_IDS.includes(
|
|
1129
1129
|
PREFERRED_JUDGE_MODEL
|
|
1130
|
-
) ? PREFERRED_JUDGE_MODEL :
|
|
1130
|
+
) ? PREFERRED_JUDGE_MODEL : AVAILABLE_CLAUDE_MODEL_IDS[0];
|
|
1131
1131
|
var ClaudeModelSchema = import_zod4.z.enum(
|
|
1132
|
-
|
|
1132
|
+
AVAILABLE_CLAUDE_MODEL_IDS
|
|
1133
1133
|
);
|
|
1134
1134
|
var AVAILABLE_OPENAI_MODEL_IDS = Object.values(
|
|
1135
1135
|
Model
|
|
@@ -1140,7 +1140,7 @@ var OpenAIModelSchema = import_zod4.z.enum(
|
|
|
1140
1140
|
AVAILABLE_OPENAI_MODEL_IDS
|
|
1141
1141
|
);
|
|
1142
1142
|
var ALL_AVAILABLE_MODEL_IDS = [
|
|
1143
|
-
...
|
|
1143
|
+
...AVAILABLE_CLAUDE_MODEL_IDS,
|
|
1144
1144
|
...AVAILABLE_OPENAI_MODEL_IDS
|
|
1145
1145
|
];
|
|
1146
1146
|
var AnyModelSchema = import_zod4.z.enum(
|
|
@@ -1791,7 +1791,9 @@ var TestScenarioSchema = TenantEntitySchema.extend({
|
|
|
1791
1791
|
/** IDs of saved assertions to evaluate (from assertions table) - legacy, use assertionLinks */
|
|
1792
1792
|
assertionIds: import_zod24.z.array(import_zod24.z.string()).optional(),
|
|
1793
1793
|
/** Linked assertions with per-scenario parameter values */
|
|
1794
|
-
assertionLinks: import_zod24.z.array(ScenarioAssertionLinkSchema).optional()
|
|
1794
|
+
assertionLinks: import_zod24.z.array(ScenarioAssertionLinkSchema).optional(),
|
|
1795
|
+
/** Tags for categorisation and filtering */
|
|
1796
|
+
tags: import_zod24.z.array(import_zod24.z.string()).optional()
|
|
1795
1797
|
});
|
|
1796
1798
|
var CreateTestScenarioInputSchema = TestScenarioSchema.omit({
|
|
1797
1799
|
id: true,
|
|
@@ -2060,7 +2062,7 @@ var EvalRunSchema = TenantEntitySchema.extend({
|
|
|
2060
2062
|
skillsGroupId: import_zod28.z.string().optional(),
|
|
2061
2063
|
/** Map of skillId to skillVersionId for this run */
|
|
2062
2064
|
skillVersions: import_zod28.z.record(import_zod28.z.string(), import_zod28.z.string()).optional(),
|
|
2063
|
-
/** Scenario IDs to run */
|
|
2065
|
+
/** Scenario IDs to run (always present — resolved server-side from tags when needed) */
|
|
2064
2066
|
scenarioIds: import_zod28.z.array(import_zod28.z.string()),
|
|
2065
2067
|
/** Current status */
|
|
2066
2068
|
status: EvalStatusSchema,
|
|
@@ -2095,7 +2097,9 @@ var EvalRunSchema = TenantEntitySchema.extend({
|
|
|
2095
2097
|
/** Sub-agent IDs to enable for this run (optional) */
|
|
2096
2098
|
subAgentIds: import_zod28.z.array(import_zod28.z.string()).optional(),
|
|
2097
2099
|
/** Rule IDs to enable for this run (optional) */
|
|
2098
|
-
ruleIds: import_zod28.z.array(import_zod28.z.string()).optional()
|
|
2100
|
+
ruleIds: import_zod28.z.array(import_zod28.z.string()).optional(),
|
|
2101
|
+
/** Tags used to select scenarios for this run (for traceability) */
|
|
2102
|
+
tags: import_zod28.z.array(import_zod28.z.string()).optional()
|
|
2099
2103
|
});
|
|
2100
2104
|
var CreateEvalRunInputSchema = EvalRunSchema.omit({
|
|
2101
2105
|
id: true,
|
|
@@ -2106,8 +2110,15 @@ var CreateEvalRunInputSchema = EvalRunSchema.omit({
|
|
|
2106
2110
|
results: true,
|
|
2107
2111
|
aggregateMetrics: true,
|
|
2108
2112
|
startedAt: true,
|
|
2109
|
-
completedAt: true
|
|
2110
|
-
|
|
2113
|
+
completedAt: true,
|
|
2114
|
+
scenarioIds: true
|
|
2115
|
+
}).extend({
|
|
2116
|
+
/** Optional on input — backend resolves from tags when not provided */
|
|
2117
|
+
scenarioIds: import_zod28.z.array(import_zod28.z.string()).optional()
|
|
2118
|
+
}).refine(
|
|
2119
|
+
(data) => data.scenarioIds && data.scenarioIds.length > 0 || data.tags && data.tags.length > 0,
|
|
2120
|
+
{ message: "Either scenarioIds or tags must be provided" }
|
|
2121
|
+
);
|
|
2111
2122
|
var EvaluationProgressSchema = import_zod28.z.object({
|
|
2112
2123
|
runId: import_zod28.z.string(),
|
|
2113
2124
|
targetId: import_zod28.z.string(),
|
|
@@ -2281,7 +2292,8 @@ var ProjectSchema = BaseEntitySchema.extend({
|
|
|
2281
2292
|
appId: import_zod31.z.string().optional().describe("The ID of the app in Dev Center"),
|
|
2282
2293
|
appSecret: import_zod31.z.string().optional().describe("The secret of the app in Dev Center"),
|
|
2283
2294
|
useWixAuth: import_zod31.z.boolean().optional().describe("Enable Wix CLI/MCP auth for evaluations"),
|
|
2284
|
-
useBase44Auth: import_zod31.z.boolean().optional().describe("Enable Base44 auth for evaluations")
|
|
2295
|
+
useBase44Auth: import_zod31.z.boolean().optional().describe("Enable Base44 auth for evaluations"),
|
|
2296
|
+
scenarioTags: import_zod31.z.array(import_zod31.z.string()).optional().describe("Project-level tag vocabulary for scenarios")
|
|
2285
2297
|
});
|
|
2286
2298
|
var CreateProjectInputSchema = ProjectSchema.omit({
|
|
2287
2299
|
id: true,
|
|
@@ -2456,7 +2468,7 @@ function getSystemAssertion(id) {
|
|
|
2456
2468
|
0 && (module.exports = {
|
|
2457
2469
|
AGENT_TYPE_LABELS,
|
|
2458
2470
|
ALL_AVAILABLE_MODEL_IDS,
|
|
2459
|
-
|
|
2471
|
+
AVAILABLE_CLAUDE_MODEL_IDS,
|
|
2460
2472
|
AVAILABLE_OPENAI_MODEL_IDS,
|
|
2461
2473
|
AVAILABLE_RUN_COMMANDS,
|
|
2462
2474
|
AVAILABLE_TOOL_NAMES,
|