npm - @wix/evalforge-types - Versions diffs - 0.46.0 → 0.48.0 - Mend

@wix/evalforge-types 0.46.0 → 0.48.0

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Files changed (9)

package/build/index.js +25 -13
package/build/index.js.map +2 -2
package/build/index.mjs +24 -12
package/build/index.mjs.map +2 -2
package/build/types/common/models.d.ts +1 -1
package/build/types/evaluation/eval-run.d.ts +7 -1
package/build/types/project/project.d.ts +3 -0
package/build/types/scenario/test-scenario.d.ts +3 -0
package/package.json +2 -2

package/build/index.js CHANGED

@@ -22,7 +22,7 @@ var index_exports = {};
 __export(index_exports, {
   AGENT_TYPE_LABELS: () => AGENT_TYPE_LABELS,
   ALL_AVAILABLE_MODEL_IDS: () => ALL_AVAILABLE_MODEL_IDS,
-  AVAILABLE_MODEL_IDS: () => AVAILABLE_MODEL_IDS,
+  AVAILABLE_CLAUDE_MODEL_IDS: () => AVAILABLE_CLAUDE_MODEL_IDS,
   AVAILABLE_OPENAI_MODEL_IDS: () => AVAILABLE_OPENAI_MODEL_IDS,
   AVAILABLE_RUN_COMMANDS: () => AVAILABLE_RUN_COMMANDS,
   AVAILABLE_TOOL_NAMES: () => AVAILABLE_TOOL_NAMES,
@@ -1119,17 +1119,17 @@ var WebhookIdentityType;
 })(WebhookIdentityType || (WebhookIdentityType = {}));
 // src/common/models.ts
-var AVAILABLE_MODEL_IDS = Object.values(
+var AVAILABLE_CLAUDE_MODEL_IDS = Object.values(
   ClaudeModel
 ).filter(
   (v) => typeof v === "string" && v !== ClaudeModel.UNKNOWN_CLAUDE_MODEL
 );
 var PREFERRED_JUDGE_MODEL = "CLAUDE_4_5_HAIKU_1_0";
-var DEFAULT_JUDGE_MODEL = AVAILABLE_MODEL_IDS.includes(
+var DEFAULT_JUDGE_MODEL = AVAILABLE_CLAUDE_MODEL_IDS.includes(
   PREFERRED_JUDGE_MODEL
-) ? PREFERRED_JUDGE_MODEL : AVAILABLE_MODEL_IDS[0];
+) ? PREFERRED_JUDGE_MODEL : AVAILABLE_CLAUDE_MODEL_IDS[0];
 var ClaudeModelSchema = import_zod4.z.enum(
-  AVAILABLE_MODEL_IDS
+  AVAILABLE_CLAUDE_MODEL_IDS
 );
 var AVAILABLE_OPENAI_MODEL_IDS = Object.values(
   Model
@@ -1140,7 +1140,7 @@ var OpenAIModelSchema = import_zod4.z.enum(
   AVAILABLE_OPENAI_MODEL_IDS
 );
 var ALL_AVAILABLE_MODEL_IDS = [
-  ...AVAILABLE_MODEL_IDS,
+  ...AVAILABLE_CLAUDE_MODEL_IDS,
   ...AVAILABLE_OPENAI_MODEL_IDS
 ];
 var AnyModelSchema = import_zod4.z.enum(
@@ -1791,7 +1791,9 @@ var TestScenarioSchema = TenantEntitySchema.extend({
   /** IDs of saved assertions to evaluate (from assertions table) - legacy, use assertionLinks */
   assertionIds: import_zod24.z.array(import_zod24.z.string()).optional(),
   /** Linked assertions with per-scenario parameter values */
-  assertionLinks: import_zod24.z.array(ScenarioAssertionLinkSchema).optional()
+  assertionLinks: import_zod24.z.array(ScenarioAssertionLinkSchema).optional(),
+  /** Tags for categorisation and filtering */
+  tags: import_zod24.z.array(import_zod24.z.string()).optional()
 });
 var CreateTestScenarioInputSchema = TestScenarioSchema.omit({
   id: true,
@@ -2060,7 +2062,7 @@ var EvalRunSchema = TenantEntitySchema.extend({
   skillsGroupId: import_zod28.z.string().optional(),
   /** Map of skillId to skillVersionId for this run */
   skillVersions: import_zod28.z.record(import_zod28.z.string(), import_zod28.z.string()).optional(),
-  /** Scenario IDs to run */
+  /** Scenario IDs to run (always present — resolved server-side from tags when needed) */
   scenarioIds: import_zod28.z.array(import_zod28.z.string()),
   /** Current status */
   status: EvalStatusSchema,
@@ -2095,7 +2097,9 @@ var EvalRunSchema = TenantEntitySchema.extend({
   /** Sub-agent IDs to enable for this run (optional) */
   subAgentIds: import_zod28.z.array(import_zod28.z.string()).optional(),
   /** Rule IDs to enable for this run (optional) */
-  ruleIds: import_zod28.z.array(import_zod28.z.string()).optional()
+  ruleIds: import_zod28.z.array(import_zod28.z.string()).optional(),
+  /** Tags used to select scenarios for this run (for traceability) */
+  tags: import_zod28.z.array(import_zod28.z.string()).optional()
 });
 var CreateEvalRunInputSchema = EvalRunSchema.omit({
   id: true,
@@ -2106,8 +2110,15 @@ var CreateEvalRunInputSchema = EvalRunSchema.omit({
   results: true,
   aggregateMetrics: true,
   startedAt: true,
-  completedAt: true
-});
+  completedAt: true,
+  scenarioIds: true
+}).extend({
+  /** Optional on input — backend resolves from tags when not provided */
+  scenarioIds: import_zod28.z.array(import_zod28.z.string()).optional()
+}).refine(
+  (data) => data.scenarioIds && data.scenarioIds.length > 0 || data.tags && data.tags.length > 0,
+  { message: "Either scenarioIds or tags must be provided" }
+);
 var EvaluationProgressSchema = import_zod28.z.object({
   runId: import_zod28.z.string(),
   targetId: import_zod28.z.string(),
@@ -2281,7 +2292,8 @@ var ProjectSchema = BaseEntitySchema.extend({
   appId: import_zod31.z.string().optional().describe("The ID of the app in Dev Center"),
   appSecret: import_zod31.z.string().optional().describe("The secret of the app in Dev Center"),
   useWixAuth: import_zod31.z.boolean().optional().describe("Enable Wix CLI/MCP auth for evaluations"),
-  useBase44Auth: import_zod31.z.boolean().optional().describe("Enable Base44 auth for evaluations")
+  useBase44Auth: import_zod31.z.boolean().optional().describe("Enable Base44 auth for evaluations"),
+  scenarioTags: import_zod31.z.array(import_zod31.z.string()).optional().describe("Project-level tag vocabulary for scenarios")
 });
 var CreateProjectInputSchema = ProjectSchema.omit({
   id: true,
@@ -2456,7 +2468,7 @@ function getSystemAssertion(id) {
 0 && (module.exports = {
   AGENT_TYPE_LABELS,
   ALL_AVAILABLE_MODEL_IDS,
-  AVAILABLE_MODEL_IDS,
+  AVAILABLE_CLAUDE_MODEL_IDS,
   AVAILABLE_OPENAI_MODEL_IDS,
   AVAILABLE_RUN_COMMANDS,
   AVAILABLE_TOOL_NAMES,