npm - @wix/evalforge-types - Versions diffs - 0.68.0 → 0.70.0 - Mend

@wix/evalforge-types 0.68.0 → 0.70.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (6)

package/build/index.js +27 -38
package/build/index.js.map +3 -3
package/build/index.mjs +25 -35
package/build/index.mjs.map +3 -3
package/build/types/evaluation/eval-run.d.ts +87 -169
package/package.json +2 -2

package/build/types/evaluation/eval-run.d.ts CHANGED Viewed

@@ -31,26 +31,6 @@ export declare const TriggerSchema: z.ZodObject<{
     type: z.ZodEnum<typeof TriggerType>;
 }, z.core.$strip>;
 export type Trigger = z.infer<typeof TriggerSchema>;
-/**
- * Failure category enum.
- */
-export declare enum FailureCategory {
-    MISSING_FILE = "missing_file",
-    WRONG_CONTENT = "wrong_content",
-    BUILD_ERROR = "build_error",
-    TEST_FAILURE = "test_failure",
-    RUNTIME_ERROR = "runtime_error",
-    PERFORMANCE = "performance"
-}
-/**
- * Failure severity enum.
- */
-export declare enum FailureSeverity {
-    CRITICAL = "critical",
-    HIGH = "high",
-    MEDIUM = "medium",
-    LOW = "low"
-}
 /**
  * Diff line type schema.
  */
@@ -173,59 +153,51 @@ export declare const ExecutionTraceSchema: z.ZodObject<{
 }, z.core.$strip>;
 export type ExecutionTrace = z.infer<typeof ExecutionTraceSchema>;
 /**
- * Failure analysis schema.
+ * A single finding from the LLM-generated run analysis.
  */
-export declare const FailureAnalysisSchema: z.ZodObject<{
-    category: z.ZodEnum<typeof FailureCategory>;
-    severity: z.ZodEnum<typeof FailureSeverity>;
+export declare const RunAnalysisFindingSchema: z.ZodObject<{
+    category: z.ZodEnum<{
+        failure_pattern: "failure_pattern";
+        cost_waste: "cost_waste";
+        flakiness: "flakiness";
+        inefficiency: "inefficiency";
+        positive: "positive";
+    }>;
+    severity: z.ZodEnum<{
+        low: "low";
+        medium: "medium";
+        high: "high";
+    }>;
+    description: z.ZodString;
+    affectedScenarios: z.ZodArray<z.ZodString>;
+    recommendation: z.ZodOptional<z.ZodString>;
+}, z.core.$strip>;
+export type RunAnalysisFinding = z.infer<typeof RunAnalysisFindingSchema>;
+/**
+ * LLM-generated analysis of a completed eval run.
+ */
+export declare const RunAnalysisSchema: z.ZodObject<{
+    generatedAt: z.ZodString;
     summary: z.ZodString;
-    details: z.ZodString;
-    rootCause: z.ZodString;
-    suggestedFix: z.ZodString;
-    relatedAssertions: z.ZodArray<z.ZodString>;
-    codeSnippet: z.ZodOptional<z.ZodString>;
-    similarIssues: z.ZodOptional<z.ZodArray<z.ZodString>>;
-    patternId: z.ZodOptional<z.ZodString>;
-    diff: z.ZodOptional<z.ZodObject<{
-        path: z.ZodString;
-        expected: z.ZodString;
-        actual: z.ZodString;
-        diffLines: z.ZodArray<z.ZodObject<{
-            type: z.ZodEnum<{
-                added: "added";
-                removed: "removed";
-                unchanged: "unchanged";
-            }>;
-            content: z.ZodString;
-            lineNumber: z.ZodNumber;
-        }, z.core.$strip>>;
-        renamedFrom: z.ZodOptional<z.ZodString>;
-        isInfrastructure: z.ZodOptional<z.ZodBoolean>;
-    }, z.core.$strip>>;
-    executionTrace: z.ZodOptional<z.ZodObject<{
-        commands: z.ZodArray<z.ZodObject<{
-            command: z.ZodString;
-            exitCode: z.ZodNumber;
-            output: z.ZodOptional<z.ZodString>;
-            duration: z.ZodNumber;
-        }, z.core.$strip>>;
-        filesModified: z.ZodArray<z.ZodObject<{
-            path: z.ZodString;
-            action: z.ZodEnum<{
-                deleted: "deleted";
-                created: "created";
-                modified: "modified";
-            }>;
-        }, z.core.$strip>>;
-        apiCalls: z.ZodArray<z.ZodObject<{
-            endpoint: z.ZodString;
-            tokensUsed: z.ZodNumber;
-            duration: z.ZodNumber;
-        }, z.core.$strip>>;
-        totalDuration: z.ZodNumber;
+    findings: z.ZodArray<z.ZodObject<{
+        category: z.ZodEnum<{
+            failure_pattern: "failure_pattern";
+            cost_waste: "cost_waste";
+            flakiness: "flakiness";
+            inefficiency: "inefficiency";
+            positive: "positive";
+        }>;
+        severity: z.ZodEnum<{
+            low: "low";
+            medium: "medium";
+            high: "high";
+        }>;
+        description: z.ZodString;
+        affectedScenarios: z.ZodArray<z.ZodString>;
+        recommendation: z.ZodOptional<z.ZodString>;
     }, z.core.$strip>>;
 }, z.core.$strip>;
-export type FailureAnalysis = z.infer<typeof FailureAnalysisSchema>;
+export type RunAnalysis = z.infer<typeof RunAnalysisSchema>;
 /**
  * Evaluation run schema.
  *
@@ -430,56 +402,6 @@ export declare const EvalRunSchema: z.ZodObject<{
         avgDuration: z.ZodNumber;
         totalDuration: z.ZodNumber;
     }, z.core.$strip>;
-    failureAnalyses: z.ZodOptional<z.ZodArray<z.ZodObject<{
-        category: z.ZodEnum<typeof FailureCategory>;
-        severity: z.ZodEnum<typeof FailureSeverity>;
-        summary: z.ZodString;
-        details: z.ZodString;
-        rootCause: z.ZodString;
-        suggestedFix: z.ZodString;
-        relatedAssertions: z.ZodArray<z.ZodString>;
-        codeSnippet: z.ZodOptional<z.ZodString>;
-        similarIssues: z.ZodOptional<z.ZodArray<z.ZodString>>;
-        patternId: z.ZodOptional<z.ZodString>;
-        diff: z.ZodOptional<z.ZodObject<{
-            path: z.ZodString;
-            expected: z.ZodString;
-            actual: z.ZodString;
-            diffLines: z.ZodArray<z.ZodObject<{
-                type: z.ZodEnum<{
-                    added: "added";
-                    removed: "removed";
-                    unchanged: "unchanged";
-                }>;
-                content: z.ZodString;
-                lineNumber: z.ZodNumber;
-            }, z.core.$strip>>;
-            renamedFrom: z.ZodOptional<z.ZodString>;
-            isInfrastructure: z.ZodOptional<z.ZodBoolean>;
-        }, z.core.$strip>>;
-        executionTrace: z.ZodOptional<z.ZodObject<{
-            commands: z.ZodArray<z.ZodObject<{
-                command: z.ZodString;
-                exitCode: z.ZodNumber;
-                output: z.ZodOptional<z.ZodString>;
-                duration: z.ZodNumber;
-            }, z.core.$strip>>;
-            filesModified: z.ZodArray<z.ZodObject<{
-                path: z.ZodString;
-                action: z.ZodEnum<{
-                    deleted: "deleted";
-                    created: "created";
-                    modified: "modified";
-                }>;
-            }, z.core.$strip>>;
-            apiCalls: z.ZodArray<z.ZodObject<{
-                endpoint: z.ZodString;
-                tokensUsed: z.ZodNumber;
-                duration: z.ZodNumber;
-            }, z.core.$strip>>;
-            totalDuration: z.ZodNumber;
-        }, z.core.$strip>>;
-    }, z.core.$strip>>>;
     llmTraceSummary: z.ZodOptional<z.ZodObject<{
         totalSteps: z.ZodNumber;
         totalTurns: z.ZodOptional<z.ZodNumber>;
@@ -558,6 +480,29 @@ export declare const EvalRunSchema: z.ZodObject<{
             maxTurns: z.ZodPipe<z.ZodTransform<{} | undefined, unknown>, z.ZodOptional<z.ZodNumber>>;
         }, z.core.$strip>>;
     }, z.core.$strip>>;
+    comparisonGroupId: z.ZodOptional<z.ZodString>;
+    comparisonLabel: z.ZodOptional<z.ZodString>;
+    runAnalysis: z.ZodOptional<z.ZodObject<{
+        generatedAt: z.ZodString;
+        summary: z.ZodString;
+        findings: z.ZodArray<z.ZodObject<{
+            category: z.ZodEnum<{
+                failure_pattern: "failure_pattern";
+                cost_waste: "cost_waste";
+                flakiness: "flakiness";
+                inefficiency: "inefficiency";
+                positive: "positive";
+            }>;
+            severity: z.ZodEnum<{
+                low: "low";
+                medium: "medium";
+                high: "high";
+            }>;
+            description: z.ZodString;
+            affectedScenarios: z.ZodArray<z.ZodString>;
+            recommendation: z.ZodOptional<z.ZodString>;
+        }, z.core.$strip>>;
+    }, z.core.$strip>>;
 }, z.core.$strip>;
 export type EvalRun = z.infer<typeof EvalRunSchema>;
 /**
@@ -580,56 +525,6 @@ export declare const CreateEvalRunInputSchema: z.ZodObject<{
     ruleIds: z.ZodOptional<z.ZodArray<z.ZodString>>;
     tags: z.ZodOptional<z.ZodArray<z.ZodString>>;
     presetId: z.ZodOptional<z.ZodString>;
-    failureAnalyses: z.ZodOptional<z.ZodArray<z.ZodObject<{
-        category: z.ZodEnum<typeof FailureCategory>;
-        severity: z.ZodEnum<typeof FailureSeverity>;
-        summary: z.ZodString;
-        details: z.ZodString;
-        rootCause: z.ZodString;
-        suggestedFix: z.ZodString;
-        relatedAssertions: z.ZodArray<z.ZodString>;
-        codeSnippet: z.ZodOptional<z.ZodString>;
-        similarIssues: z.ZodOptional<z.ZodArray<z.ZodString>>;
-        patternId: z.ZodOptional<z.ZodString>;
-        diff: z.ZodOptional<z.ZodObject<{
-            path: z.ZodString;
-            expected: z.ZodString;
-            actual: z.ZodString;
-            diffLines: z.ZodArray<z.ZodObject<{
-                type: z.ZodEnum<{
-                    added: "added";
-                    removed: "removed";
-                    unchanged: "unchanged";
-                }>;
-                content: z.ZodString;
-                lineNumber: z.ZodNumber;
-            }, z.core.$strip>>;
-            renamedFrom: z.ZodOptional<z.ZodString>;
-            isInfrastructure: z.ZodOptional<z.ZodBoolean>;
-        }, z.core.$strip>>;
-        executionTrace: z.ZodOptional<z.ZodObject<{
-            commands: z.ZodArray<z.ZodObject<{
-                command: z.ZodString;
-                exitCode: z.ZodNumber;
-                output: z.ZodOptional<z.ZodString>;
-                duration: z.ZodNumber;
-            }, z.core.$strip>>;
-            filesModified: z.ZodArray<z.ZodObject<{
-                path: z.ZodString;
-                action: z.ZodEnum<{
-                    deleted: "deleted";
-                    created: "created";
-                    modified: "modified";
-                }>;
-            }, z.core.$strip>>;
-            apiCalls: z.ZodArray<z.ZodObject<{
-                endpoint: z.ZodString;
-                tokensUsed: z.ZodNumber;
-                duration: z.ZodNumber;
-            }, z.core.$strip>>;
-            totalDuration: z.ZodNumber;
-        }, z.core.$strip>>;
-    }, z.core.$strip>>>;
     llmTraceSummary: z.ZodOptional<z.ZodObject<{
         totalSteps: z.ZodNumber;
         totalTurns: z.ZodOptional<z.ZodNumber>;
@@ -685,6 +580,29 @@ export declare const CreateEvalRunInputSchema: z.ZodObject<{
     jobError: z.ZodOptional<z.ZodString>;
     jobStatusCheckedAt: z.ZodOptional<z.ZodString>;
     runsPerScenario: z.ZodOptional<z.ZodNumber>;
+    comparisonGroupId: z.ZodOptional<z.ZodString>;
+    comparisonLabel: z.ZodOptional<z.ZodString>;
+    runAnalysis: z.ZodOptional<z.ZodObject<{
+        generatedAt: z.ZodString;
+        summary: z.ZodString;
+        findings: z.ZodArray<z.ZodObject<{
+            category: z.ZodEnum<{
+                failure_pattern: "failure_pattern";
+                cost_waste: "cost_waste";
+                flakiness: "flakiness";
+                inefficiency: "inefficiency";
+                positive: "positive";
+            }>;
+            severity: z.ZodEnum<{
+                low: "low";
+                medium: "medium";
+                high: "high";
+            }>;
+            description: z.ZodString;
+            affectedScenarios: z.ZodArray<z.ZodString>;
+            recommendation: z.ZodOptional<z.ZodString>;
+        }, z.core.$strip>>;
+    }, z.core.$strip>>;
     scenarioIds: z.ZodOptional<z.ZodArray<z.ZodString>>;
 }, z.core.$strip>;
 export type CreateEvalRunInput = z.infer<typeof CreateEvalRunInputSchema>;

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@wix/evalforge-types",
-  "version": "0.68.0",
+  "version": "0.70.0",
   "description": "Unified types for EvalForge agent evaluation system",
   "files": [
     "build"
@@ -46,5 +46,5 @@
       "artifactId": "evalforge-types"
     }
   },
-  "falconPackageHash": "e4412ad763ca9d048b11048eb13e0ac4f7c76f33cdc5573edf47ff05"
+  "falconPackageHash": "63ddf4c9491b8c912b2320516eb657a97b85d1ee43a35d9ea94553f7"
 }