@wix/evalforge-types 0.46.0 → 0.48.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
package/build/index.js CHANGED
@@ -22,7 +22,7 @@ var index_exports = {};
22
22
  __export(index_exports, {
23
23
  AGENT_TYPE_LABELS: () => AGENT_TYPE_LABELS,
24
24
  ALL_AVAILABLE_MODEL_IDS: () => ALL_AVAILABLE_MODEL_IDS,
25
- AVAILABLE_MODEL_IDS: () => AVAILABLE_MODEL_IDS,
25
+ AVAILABLE_CLAUDE_MODEL_IDS: () => AVAILABLE_CLAUDE_MODEL_IDS,
26
26
  AVAILABLE_OPENAI_MODEL_IDS: () => AVAILABLE_OPENAI_MODEL_IDS,
27
27
  AVAILABLE_RUN_COMMANDS: () => AVAILABLE_RUN_COMMANDS,
28
28
  AVAILABLE_TOOL_NAMES: () => AVAILABLE_TOOL_NAMES,
@@ -1119,17 +1119,17 @@ var WebhookIdentityType;
1119
1119
  })(WebhookIdentityType || (WebhookIdentityType = {}));
1120
1120
 
1121
1121
  // src/common/models.ts
1122
- var AVAILABLE_MODEL_IDS = Object.values(
1122
+ var AVAILABLE_CLAUDE_MODEL_IDS = Object.values(
1123
1123
  ClaudeModel
1124
1124
  ).filter(
1125
1125
  (v) => typeof v === "string" && v !== ClaudeModel.UNKNOWN_CLAUDE_MODEL
1126
1126
  );
1127
1127
  var PREFERRED_JUDGE_MODEL = "CLAUDE_4_5_HAIKU_1_0";
1128
- var DEFAULT_JUDGE_MODEL = AVAILABLE_MODEL_IDS.includes(
1128
+ var DEFAULT_JUDGE_MODEL = AVAILABLE_CLAUDE_MODEL_IDS.includes(
1129
1129
  PREFERRED_JUDGE_MODEL
1130
- ) ? PREFERRED_JUDGE_MODEL : AVAILABLE_MODEL_IDS[0];
1130
+ ) ? PREFERRED_JUDGE_MODEL : AVAILABLE_CLAUDE_MODEL_IDS[0];
1131
1131
  var ClaudeModelSchema = import_zod4.z.enum(
1132
- AVAILABLE_MODEL_IDS
1132
+ AVAILABLE_CLAUDE_MODEL_IDS
1133
1133
  );
1134
1134
  var AVAILABLE_OPENAI_MODEL_IDS = Object.values(
1135
1135
  Model
@@ -1140,7 +1140,7 @@ var OpenAIModelSchema = import_zod4.z.enum(
1140
1140
  AVAILABLE_OPENAI_MODEL_IDS
1141
1141
  );
1142
1142
  var ALL_AVAILABLE_MODEL_IDS = [
1143
- ...AVAILABLE_MODEL_IDS,
1143
+ ...AVAILABLE_CLAUDE_MODEL_IDS,
1144
1144
  ...AVAILABLE_OPENAI_MODEL_IDS
1145
1145
  ];
1146
1146
  var AnyModelSchema = import_zod4.z.enum(
@@ -1791,7 +1791,9 @@ var TestScenarioSchema = TenantEntitySchema.extend({
1791
1791
  /** IDs of saved assertions to evaluate (from assertions table) - legacy, use assertionLinks */
1792
1792
  assertionIds: import_zod24.z.array(import_zod24.z.string()).optional(),
1793
1793
  /** Linked assertions with per-scenario parameter values */
1794
- assertionLinks: import_zod24.z.array(ScenarioAssertionLinkSchema).optional()
1794
+ assertionLinks: import_zod24.z.array(ScenarioAssertionLinkSchema).optional(),
1795
+ /** Tags for categorisation and filtering */
1796
+ tags: import_zod24.z.array(import_zod24.z.string()).optional()
1795
1797
  });
1796
1798
  var CreateTestScenarioInputSchema = TestScenarioSchema.omit({
1797
1799
  id: true,
@@ -2060,7 +2062,7 @@ var EvalRunSchema = TenantEntitySchema.extend({
2060
2062
  skillsGroupId: import_zod28.z.string().optional(),
2061
2063
  /** Map of skillId to skillVersionId for this run */
2062
2064
  skillVersions: import_zod28.z.record(import_zod28.z.string(), import_zod28.z.string()).optional(),
2063
- /** Scenario IDs to run */
2065
+ /** Scenario IDs to run (always present — resolved server-side from tags when needed) */
2064
2066
  scenarioIds: import_zod28.z.array(import_zod28.z.string()),
2065
2067
  /** Current status */
2066
2068
  status: EvalStatusSchema,
@@ -2095,7 +2097,9 @@ var EvalRunSchema = TenantEntitySchema.extend({
2095
2097
  /** Sub-agent IDs to enable for this run (optional) */
2096
2098
  subAgentIds: import_zod28.z.array(import_zod28.z.string()).optional(),
2097
2099
  /** Rule IDs to enable for this run (optional) */
2098
- ruleIds: import_zod28.z.array(import_zod28.z.string()).optional()
2100
+ ruleIds: import_zod28.z.array(import_zod28.z.string()).optional(),
2101
+ /** Tags used to select scenarios for this run (for traceability) */
2102
+ tags: import_zod28.z.array(import_zod28.z.string()).optional()
2099
2103
  });
2100
2104
  var CreateEvalRunInputSchema = EvalRunSchema.omit({
2101
2105
  id: true,
@@ -2106,8 +2110,15 @@ var CreateEvalRunInputSchema = EvalRunSchema.omit({
2106
2110
  results: true,
2107
2111
  aggregateMetrics: true,
2108
2112
  startedAt: true,
2109
- completedAt: true
2110
- });
2113
+ completedAt: true,
2114
+ scenarioIds: true
2115
+ }).extend({
2116
+ /** Optional on input — backend resolves from tags when not provided */
2117
+ scenarioIds: import_zod28.z.array(import_zod28.z.string()).optional()
2118
+ }).refine(
2119
+ (data) => data.scenarioIds && data.scenarioIds.length > 0 || data.tags && data.tags.length > 0,
2120
+ { message: "Either scenarioIds or tags must be provided" }
2121
+ );
2111
2122
  var EvaluationProgressSchema = import_zod28.z.object({
2112
2123
  runId: import_zod28.z.string(),
2113
2124
  targetId: import_zod28.z.string(),
@@ -2281,7 +2292,8 @@ var ProjectSchema = BaseEntitySchema.extend({
2281
2292
  appId: import_zod31.z.string().optional().describe("The ID of the app in Dev Center"),
2282
2293
  appSecret: import_zod31.z.string().optional().describe("The secret of the app in Dev Center"),
2283
2294
  useWixAuth: import_zod31.z.boolean().optional().describe("Enable Wix CLI/MCP auth for evaluations"),
2284
- useBase44Auth: import_zod31.z.boolean().optional().describe("Enable Base44 auth for evaluations")
2295
+ useBase44Auth: import_zod31.z.boolean().optional().describe("Enable Base44 auth for evaluations"),
2296
+ scenarioTags: import_zod31.z.array(import_zod31.z.string()).optional().describe("Project-level tag vocabulary for scenarios")
2285
2297
  });
2286
2298
  var CreateProjectInputSchema = ProjectSchema.omit({
2287
2299
  id: true,
@@ -2456,7 +2468,7 @@ function getSystemAssertion(id) {
2456
2468
  0 && (module.exports = {
2457
2469
  AGENT_TYPE_LABELS,
2458
2470
  ALL_AVAILABLE_MODEL_IDS,
2459
- AVAILABLE_MODEL_IDS,
2471
+ AVAILABLE_CLAUDE_MODEL_IDS,
2460
2472
  AVAILABLE_OPENAI_MODEL_IDS,
2461
2473
  AVAILABLE_RUN_COMMANDS,
2462
2474
  AVAILABLE_TOOL_NAMES,