npm - @wix/evalforge-evaluator - Versions diffs - 0.13.0 → 0.15.0 - Mend

@wix/evalforge-evaluator 0.13.0 → 0.15.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7)

package/build/index.js +624 -93
package/build/index.js.map +4 -4
package/build/index.mjs +620 -89
package/build/index.mjs.map +4 -4
package/build/types/diagnostics.d.ts +52 -0
package/build/types/error-reporter.d.ts +2 -0
package/package.json +3 -3

package/build/types/diagnostics.d.ts ADDED

@@ -0,0 +1,52 @@
+/**
+ * Diagnostics Module
+ *
+ * Runs comprehensive environment diagnostics before executing evaluations.
+ * All results are reported via trace events for visibility in the UI.
+ *
+ * This helps debug issues on remote machines (Dev Machines) where we can't
+ * easily access logs.
+ */
+import type { EvaluatorConfig } from './config.js';
+/**
+ * Result of a single diagnostic test; collected in `DiagnosticReport.tests`.
+ */
+export interface DiagnosticResult {
+    /** Name of the test */
+    name: string;
+    /** Whether the test passed */
+    passed: boolean;
+    /** Detailed result information; values are typed `unknown`, so narrow before use */
+    details: Record<string, unknown>;
+    /** Error message if the test failed; optional, so it may be absent */
+    error?: string;
+    /** Duration of the test in milliseconds */
+    durationMs: number;
+}
+/**
+ * All diagnostic results from a run; the resolved value of `runDiagnostics`.
+ */
+export interface DiagnosticReport {
+    /** Timestamp when diagnostics started (string; presumably ISO 8601 - TODO confirm) */
+    startedAt: string;
+    /** Timestamp when diagnostics completed (string; presumably ISO 8601 - TODO confirm) */
+    completedAt: string;
+    /** Total duration in milliseconds */
+    totalDurationMs: number;
+    /** Individual test results, one `DiagnosticResult` per test */
+    tests: DiagnosticResult[];
+    /** Summary counts (presumably total = passed + failed - TODO confirm against implementation) */
+    summary: {
+        total: number;
+        passed: number;
+        failed: number;
+    };
+}
+/**
+ * Run all diagnostics and return a comprehensive report.
+ *
+ * @param config - Evaluator configuration
+ * @param evalRunId - The eval run ID for trace events
+ * @returns Promise resolving to the diagnostic report with all test results
+ */
+export declare function runDiagnostics(config: EvaluatorConfig, evalRunId: string): Promise<DiagnosticReport>;

package/build/types/error-reporter.d.ts CHANGED

@@ -60,6 +60,8 @@ export declare function reportError(config: Partial<EvaluatorConfig> | null, pro
  * Execution phases for error context.
  */
 export declare const ExecutionPhase: {
+    /** Environment diagnostics phase (runs before execution) */
+    readonly DIAGNOSTICS: "diagnostics";
     readonly CONFIG: "config-loading";
     readonly API_CLIENT: "api-client-creation";
     readonly FETCH_EVAL_RUN: "fetch-eval-run";

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@wix/evalforge-evaluator",
-  "version": "0.13.0",
+  "version": "0.15.0",
   "description": "EvalForge Evaluator",
   "bin": "./build/index.js",
   "files": [
@@ -19,7 +19,7 @@
     "@ai-sdk/anthropic": "^3.0.2",
     "@anthropic-ai/claude-agent-sdk": "^0.2.12",
     "@anthropic-ai/claude-code": "^2.0.76",
-    "@wix/evalforge-types": "0.4.0",
+    "@wix/evalforge-types": "0.5.0",
     "ai": "^6.0.6",
     "tar": "^7.5.3",
     "zod": "^4.3.5"
@@ -56,5 +56,5 @@
       "artifactId": "evalforge-evaluator"
     }
   },
-  "falconPackageHash": "b3ce91898c7759199a30ec3fbe1f1eb5d6107ef3c6268acbf377e51c"
+  "falconPackageHash": "2fa7adc6b9b22ef16e175101994266c21244a702ece07d027d38f44d"
 }