npm - @wix/evalforge-types - Versions diffs - 0.54.0 → 0.56.0 - Mend

@wix/evalforge-types 0.54.0 → 0.56.0

This diff shows the differences between the contents of two publicly available package versions, each of which has been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (10)

package/build/index.js +59 -921
package/build/index.js.map +4 -4
package/build/index.mjs +57 -921
package/build/index.mjs.map +4 -4
package/build/types/common/models.d.ts +30 -22
package/build/types/evaluation/eval-result.d.ts +4 -0
package/build/types/evaluation/eval-run.d.ts +5 -0
package/build/types/evaluation/metrics.d.ts +4 -0
package/build/types/target/agent.d.ts +2 -1
package/package.json +2 -3

package/build/types/common/models.d.ts CHANGED Viewed

@@ -1,34 +1,32 @@
 import { z } from 'zod';
-import { AnthropicModel as _AnthropicModel, Model as _OpenAIModel } from '@wix/ambassador-ds-wix-ai-gateway-v1-prompt/types';
 /**
  * Curated model sets — only models suitable for code generation.
- * Excludes legacy/superseded snapshots, previews, experimental,
- * completion-only, and non-text models.
+ * Uses official/canonical model IDs (not internal gateway enums).
  * Update these explicitly when new models become available.
  */
 export declare const ClaudeModel: {
-    readonly CLAUDE_4_SONNET_1_0: _AnthropicModel.CLAUDE_4_SONNET_1_0;
-    readonly CLAUDE_4_OPUS_1_0: _AnthropicModel.CLAUDE_4_OPUS_1_0;
-    readonly CLAUDE_4_5_SONNET_1_0: _AnthropicModel.CLAUDE_4_5_SONNET_1_0;
-    readonly CLAUDE_4_5_HAIKU_1_0: _AnthropicModel.CLAUDE_4_5_HAIKU_1_0;
-    readonly CLAUDE_4_5_OPUS_1_0: _AnthropicModel.CLAUDE_4_5_OPUS_1_0;
-    readonly CLAUDE_4_6_SONNET_1_0: _AnthropicModel.CLAUDE_4_6_SONNET_1_0;
-    readonly CLAUDE_4_6_OPUS_1_0: _AnthropicModel.CLAUDE_4_6_OPUS_1_0;
+    readonly CLAUDE_4_SONNET_1_0: "claude-sonnet-4";
+    readonly CLAUDE_4_OPUS_1_0: "claude-opus-4";
+    readonly CLAUDE_4_5_SONNET_1_0: "claude-sonnet-4-5";
+    readonly CLAUDE_4_5_HAIKU_1_0: "claude-haiku-4-5";
+    readonly CLAUDE_4_5_OPUS_1_0: "claude-opus-4-5";
+    readonly CLAUDE_4_6_SONNET_1_0: "claude-sonnet-4-6";
+    readonly CLAUDE_4_6_OPUS_1_0: "claude-opus-4-6";
 };
 export type ClaudeModel = (typeof ClaudeModel)[keyof typeof ClaudeModel];
 export declare const OpenAIModel: {
-    readonly GPT_4O_MINI_2024_07_18: _OpenAIModel.GPT_4O_MINI_2024_07_18;
-    readonly GPT_4O_2024_11_20: _OpenAIModel.GPT_4O_2024_11_20;
-    readonly O1_2024_12_17: _OpenAIModel.O1_2024_12_17;
-    readonly O3_MINI_2025_01_31: _OpenAIModel.O3_MINI_2025_01_31;
-    readonly GPT_4_1_2025_04_14: _OpenAIModel.GPT_4_1_2025_04_14;
-    readonly GPT_4_1_MINI_2025_04_14: _OpenAIModel.GPT_4_1_MINI_2025_04_14;
-    readonly GPT_4_1_NANO_2025_04_14: _OpenAIModel.GPT_4_1_NANO_2025_04_14;
-    readonly O3_2025_04_16: _OpenAIModel.O3_2025_04_16;
-    readonly O4_MINI_2025_04_16: _OpenAIModel.O4_MINI_2025_04_16;
-    readonly GPT_5_2025_08_07: _OpenAIModel.GPT_5_2025_08_07;
-    readonly GPT_5_MINI_2025_08_07: _OpenAIModel.GPT_5_MINI_2025_08_07;
-    readonly GPT_5_NANO_2025_08_07: _OpenAIModel.GPT_5_NANO_2025_08_07;
+    readonly GPT_4O_MINI_2024_07_18: "gpt-4o-mini";
+    readonly GPT_4O_2024_11_20: "gpt-4o";
+    readonly O1_2024_12_17: "o1";
+    readonly O3_MINI_2025_01_31: "o3-mini";
+    readonly GPT_4_1_2025_04_14: "gpt-4.1";
+    readonly GPT_4_1_MINI_2025_04_14: "gpt-4.1-mini";
+    readonly GPT_4_1_NANO_2025_04_14: "gpt-4.1-nano";
+    readonly O3_2025_04_16: "o3";
+    readonly O4_MINI_2025_04_16: "o4-mini";
+    readonly GPT_5_2025_08_07: "gpt-5";
+    readonly GPT_5_MINI_2025_08_07: "gpt-5-mini";
+    readonly GPT_5_NANO_2025_08_07: "gpt-5-nano";
 };
 export type OpenAIModel = (typeof OpenAIModel)[keyof typeof OpenAIModel];
 export declare const AVAILABLE_CLAUDE_MODEL_IDS: ClaudeModel[];
@@ -50,6 +48,16 @@ export declare const ALL_AVAILABLE_MODEL_IDS: string[];
 export declare const AnyModelSchema: z.ZodEnum<{
     [x: string]: string;
 }>;
+/**
+ * Maps legacy Wix AI Gateway enum strings to official model IDs.
+ * Used for backward compatibility with stored data (DB, eval traces).
+ */
+export declare const LEGACY_MODEL_ID_MAP: Record<string, string>;
+/**
+ * Normalize a model ID: translates legacy gateway enum strings to
+ * official model IDs. Returns the input unchanged if already canonical.
+ */
+export declare function normalizeModelId(modelId: string): string;
 export declare const ModelConfigSchema: z.ZodObject<{
     model: z.ZodEnum<{
         [x: string]: string;

package/build/types/evaluation/eval-result.d.ts CHANGED Viewed

@@ -45,6 +45,7 @@ export declare const AssertionResultSchema: z.ZodObject<{
         outputPreview: z.ZodOptional<z.ZodString>;
         success: z.ZodBoolean;
         error: z.ZodOptional<z.ZodString>;
+        turnIndex: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>>>;
 }, z.core.$strip>;
 export type AssertionResult = z.infer<typeof AssertionResultSchema>;
@@ -98,6 +99,7 @@ export declare const EvalRunResultSchema: z.ZodObject<{
             outputPreview: z.ZodOptional<z.ZodString>;
             success: z.ZodBoolean;
             error: z.ZodOptional<z.ZodString>;
+            turnIndex: z.ZodOptional<z.ZodNumber>;
         }, z.core.$strip>>>;
     }, z.core.$strip>>;
     metrics: z.ZodOptional<z.ZodObject<{
@@ -167,9 +169,11 @@ export declare const EvalRunResultSchema: z.ZodObject<{
             outputPreview: z.ZodOptional<z.ZodString>;
             success: z.ZodBoolean;
             error: z.ZodOptional<z.ZodString>;
+            turnIndex: z.ZodOptional<z.ZodNumber>;
         }, z.core.$strip>>;
         summary: z.ZodObject<{
             totalSteps: z.ZodNumber;
+            totalTurns: z.ZodOptional<z.ZodNumber>;
             totalDurationMs: z.ZodNumber;
             totalTokens: z.ZodObject<{
                 prompt: z.ZodNumber;

package/build/types/evaluation/eval-run.d.ts CHANGED Viewed

@@ -287,6 +287,7 @@ export declare const EvalRunSchema: z.ZodObject<{
                 outputPreview: z.ZodOptional<z.ZodString>;
                 success: z.ZodBoolean;
                 error: z.ZodOptional<z.ZodString>;
+                turnIndex: z.ZodOptional<z.ZodNumber>;
             }, z.core.$strip>>>;
         }, z.core.$strip>>;
         metrics: z.ZodOptional<z.ZodObject<{
@@ -356,9 +357,11 @@ export declare const EvalRunSchema: z.ZodObject<{
                 outputPreview: z.ZodOptional<z.ZodString>;
                 success: z.ZodBoolean;
                 error: z.ZodOptional<z.ZodString>;
+                turnIndex: z.ZodOptional<z.ZodNumber>;
             }, z.core.$strip>>;
             summary: z.ZodObject<{
                 totalSteps: z.ZodNumber;
+                totalTurns: z.ZodOptional<z.ZodNumber>;
                 totalDurationMs: z.ZodNumber;
                 totalTokens: z.ZodObject<{
                     prompt: z.ZodNumber;
@@ -468,6 +471,7 @@ export declare const EvalRunSchema: z.ZodObject<{
     }, z.core.$strip>>>;
     llmTraceSummary: z.ZodOptional<z.ZodObject<{
         totalSteps: z.ZodNumber;
+        totalTurns: z.ZodOptional<z.ZodNumber>;
         totalDurationMs: z.ZodNumber;
         totalTokens: z.ZodObject<{
             prompt: z.ZodNumber;
@@ -597,6 +601,7 @@ export declare const CreateEvalRunInputSchema: z.ZodObject<{
     }, z.core.$strip>>>;
     llmTraceSummary: z.ZodOptional<z.ZodObject<{
         totalSteps: z.ZodNumber;
+        totalTurns: z.ZodOptional<z.ZodNumber>;
         totalDurationMs: z.ZodNumber;
         totalTokens: z.ZodObject<{
             prompt: z.ZodNumber;

package/build/types/evaluation/metrics.d.ts CHANGED Viewed

@@ -65,6 +65,7 @@ export declare const LLMTraceStepSchema: z.ZodObject<{
     outputPreview: z.ZodOptional<z.ZodString>;
     success: z.ZodBoolean;
     error: z.ZodOptional<z.ZodString>;
+    turnIndex: z.ZodOptional<z.ZodNumber>;
 }, z.core.$strip>;
 export type LLMTraceStep = z.infer<typeof LLMTraceStepSchema>;
 /**
@@ -82,6 +83,7 @@ export type LLMBreakdownStats = z.infer<typeof LLMBreakdownStatsSchema>;
  */
 export declare const LLMTraceSummarySchema: z.ZodObject<{
     totalSteps: z.ZodNumber;
+    totalTurns: z.ZodOptional<z.ZodNumber>;
     totalDurationMs: z.ZodNumber;
     totalTokens: z.ZodObject<{
         prompt: z.ZodNumber;
@@ -129,9 +131,11 @@ export declare const LLMTraceSchema: z.ZodObject<{
         outputPreview: z.ZodOptional<z.ZodString>;
         success: z.ZodBoolean;
         error: z.ZodOptional<z.ZodString>;
+        turnIndex: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>>;
     summary: z.ZodObject<{
         totalSteps: z.ZodNumber;
+        totalTurns: z.ZodOptional<z.ZodNumber>;
         totalDurationMs: z.ZodNumber;
         totalTokens: z.ZodObject<{
             prompt: z.ZodNumber;

package/build/types/target/agent.d.ts CHANGED Viewed

@@ -28,7 +28,8 @@ export declare const AGENT_TYPE_LABELS: Record<AgentTypeValue, string>;
  * When adding a new CLI agent adapter, add its command here first.
  */
 export declare enum AgentRunCommand {
-    CLAUDE = "claude"
+    CLAUDE = "claude",
+    OPENCODE = "opencode"
 }
 /** All available run commands for use in dropdowns and validation. */
 export declare const AVAILABLE_RUN_COMMANDS: AgentRunCommand[];

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@wix/evalforge-types",
-  "version": "0.54.0",
+  "version": "0.56.0",
   "description": "Unified types for EvalForge agent evaluation system",
   "files": [
     "build"
@@ -20,7 +20,6 @@
   "devDependencies": {
     "@eslint/js": "^9.39.2",
     "@types/node": "^22.19.3",
-    "@wix/ambassador-ds-wix-ai-gateway-v1-prompt": "^1.0.312",
     "esbuild": "^0.27.2",
     "eslint": "^9.39.2",
     "eslint-config-prettier": "^10.1.8",
@@ -47,5 +46,5 @@
       "artifactId": "evalforge-types"
     }
   },
-  "falconPackageHash": "2c3aab7cd9e412ed3299c7a914bc04abfee06a97965cc30794055f8e"
+  "falconPackageHash": "331ddbd68218e960214d7b75e497534e88fa193a082b6fd1fb9a922f"
 }