npm - evalsense - Versions diffs - 0.2.0 → 0.3.0 - Mend

evalsense 0.2.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37)

package/LICENSE +190 -0
package/README.md +99 -82
package/dist/{chunk-HDJID3GC.cjs → chunk-DFC6FRTG.cjs} +8 -26
package/dist/chunk-DFC6FRTG.cjs.map +1 -0
package/dist/chunk-DGUM43GV.js +10 -0
package/dist/chunk-DGUM43GV.js.map +1 -0
package/dist/chunk-JEQ2X3Z6.cjs +12 -0
package/dist/chunk-JEQ2X3Z6.cjs.map +1 -0
package/dist/{chunk-5P7LNNO6.js → chunk-JPVZL45G.js} +8 -26
package/dist/chunk-JPVZL45G.js.map +1 -0
package/dist/{chunk-Y23VHTD3.cjs → chunk-RZFLCWTW.cjs} +2 -2
package/dist/chunk-RZFLCWTW.cjs.map +1 -0
package/dist/{chunk-BRPM6AB6.js → chunk-Z3U6AUWX.js} +2 -2
package/dist/chunk-Z3U6AUWX.js.map +1 -0
package/dist/cli.cjs +39 -36
package/dist/cli.cjs.map +1 -1
package/dist/cli.js +37 -34
package/dist/cli.js.map +1 -1
package/dist/index.cjs +300 -101
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +76 -6
package/dist/index.d.ts +76 -6
package/dist/index.js +222 -23
package/dist/index.js.map +1 -1
package/dist/metrics/index.cjs +257 -17
package/dist/metrics/index.cjs.map +1 -1
package/dist/metrics/index.d.cts +252 -1
package/dist/metrics/index.d.ts +252 -1
package/dist/metrics/index.js +240 -2
package/dist/metrics/index.js.map +1 -1
package/dist/metrics/opinionated/index.cjs +6 -5
package/dist/metrics/opinionated/index.js +2 -1
package/package.json +8 -6
package/dist/chunk-5P7LNNO6.js.map +0 -1
package/dist/chunk-BRPM6AB6.js.map +0 -1
package/dist/chunk-HDJID3GC.cjs.map +0 -1
package/dist/chunk-Y23VHTD3.cjs.map +0 -1

package/dist/index.cjs CHANGED

@@ -1,12 +1,13 @@
 'use strict';
-var chunkHDJID3GC_cjs = require('./chunk-HDJID3GC.cjs');
+var chunkDFC6FRTG_cjs = require('./chunk-DFC6FRTG.cjs');
+require('./chunk-JEQ2X3Z6.cjs');
 var fs = require('fs');
 var path = require('path');
 // src/core/describe.ts
 function describe(name, fn) {
-  const parentSuite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const parentSuite = chunkDFC6FRTG_cjs.getCurrentSuite();
   const suite = {
     name,
     tests: [],
@@ -15,37 +16,37 @@ function describe(name, fn) {
     beforeEach: [],
     afterEach: []
   };
-  chunkHDJID3GC_cjs.setCurrentSuite(suite);
+  chunkDFC6FRTG_cjs.setCurrentSuite(suite);
   try {
     fn();
   } finally {
-    chunkHDJID3GC_cjs.setCurrentSuite(parentSuite);
+    chunkDFC6FRTG_cjs.setCurrentSuite(parentSuite);
   }
-  chunkHDJID3GC_cjs.addSuite(suite);
+  chunkDFC6FRTG_cjs.addSuite(suite);
 }
 function beforeAll(fn) {
-  const suite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const suite = chunkDFC6FRTG_cjs.getCurrentSuite();
   if (!suite) {
     throw new Error("beforeAll() must be called inside a describe() block");
   }
   suite.beforeAll?.push(fn);
 }
 function afterAll(fn) {
-  const suite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const suite = chunkDFC6FRTG_cjs.getCurrentSuite();
   if (!suite) {
     throw new Error("afterAll() must be called inside a describe() block");
   }
   suite.afterAll?.push(fn);
 }
 function beforeEach(fn) {
-  const suite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const suite = chunkDFC6FRTG_cjs.getCurrentSuite();
   if (!suite) {
     throw new Error("beforeEach() must be called inside a describe() block");
   }
   suite.beforeEach?.push(fn);
 }
 function afterEach(fn) {
-  const suite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const suite = chunkDFC6FRTG_cjs.getCurrentSuite();
   if (!suite) {
     throw new Error("afterEach() must be called inside a describe() block");
   }
@@ -54,7 +55,7 @@ function afterEach(fn) {
 // src/core/eval-test.ts
 function evalTest(name, fn) {
-  const currentSuite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const currentSuite = chunkDFC6FRTG_cjs.getCurrentSuite();
   if (!currentSuite) {
     throw new Error("evalTest() must be called inside a describe() block");
   }
@@ -62,12 +63,12 @@ function evalTest(name, fn) {
     name,
     fn
   };
-  chunkHDJID3GC_cjs.addTestToCurrentSuite(test2);
+  chunkDFC6FRTG_cjs.addTestToCurrentSuite(test2);
 }
 var test = evalTest;
 var it = evalTest;
 function evalTestSkip(name, _fn) {
-  const currentSuite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const currentSuite = chunkDFC6FRTG_cjs.getCurrentSuite();
   if (!currentSuite) {
     throw new Error("evalTest.skip() must be called inside a describe() block");
   }
@@ -76,10 +77,10 @@ function evalTestSkip(name, _fn) {
     fn: async () => {
     }
   };
-  chunkHDJID3GC_cjs.addTestToCurrentSuite(test2);
+  chunkDFC6FRTG_cjs.addTestToCurrentSuite(test2);
 }
 function evalTestOnly(name, fn) {
-  const currentSuite = chunkHDJID3GC_cjs.getCurrentSuite();
+  const currentSuite = chunkDFC6FRTG_cjs.getCurrentSuite();
   if (!currentSuite) {
     throw new Error("evalTest.only() must be called inside a describe() block");
   }
@@ -87,7 +88,7 @@ function evalTestOnly(name, fn) {
     name: `[ONLY] ${name}`,
     fn
   };
-  chunkHDJID3GC_cjs.addTestToCurrentSuite(test2);
+  chunkDFC6FRTG_cjs.addTestToCurrentSuite(test2);
 }
 evalTest.skip = evalTestSkip;
 evalTest.only = evalTestOnly;
@@ -102,17 +103,17 @@ function loadDataset(path$1) {
     } else if (ext === ".json") {
       records = parseJSON(content);
     } else {
-      throw new chunkHDJID3GC_cjs.DatasetError(
+      throw new chunkDFC6FRTG_cjs.DatasetError(
         `Unsupported file format: ${ext}. Use .json, .ndjson, or .jsonl`,
         path$1
       );
     }
   } catch (error) {
-    if (error instanceof chunkHDJID3GC_cjs.DatasetError) {
+    if (error instanceof chunkDFC6FRTG_cjs.DatasetError) {
       throw error;
     }
     const message = error instanceof Error ? error.message : String(error);
-    throw new chunkHDJID3GC_cjs.DatasetError(`Failed to load dataset from ${path$1}: ${message}`, path$1);
+    throw new chunkDFC6FRTG_cjs.DatasetError(`Failed to load dataset from ${path$1}: ${message}`, path$1);
   }
   return {
     records,
@@ -126,7 +127,7 @@ function loadDataset(path$1) {
 function parseJSON(content) {
   const parsed = JSON.parse(content);
   if (!Array.isArray(parsed)) {
-    throw new chunkHDJID3GC_cjs.DatasetError("JSON dataset must be an array of records");
+    throw new chunkDFC6FRTG_cjs.DatasetError("JSON dataset must be an array of records");
   }
   return parsed;
 }
@@ -139,7 +140,7 @@ function parseNDJSON(content) {
     try {
       records.push(JSON.parse(line));
     } catch {
-      throw new chunkHDJID3GC_cjs.DatasetError(`Invalid JSON at line ${i + 1} in NDJSON file`);
+      throw new chunkDFC6FRTG_cjs.DatasetError(`Invalid JSON at line ${i + 1} in NDJSON file`);
     }
   }
   return records;
@@ -164,7 +165,7 @@ async function runModel(dataset, modelFn) {
     const id = getRecordId(record);
     const prediction = await modelFn(record);
     if (prediction.id !== id) {
-      throw new chunkHDJID3GC_cjs.DatasetError(
+      throw new chunkDFC6FRTG_cjs.DatasetError(
         `Prediction ID mismatch: expected "${id}", got "${prediction.id}". Model function must return the same ID as the input record.`
       );
     }
@@ -184,9 +185,7 @@ async function runModel(dataset, modelFn) {
 function getRecordId(record) {
   const id = record.id ?? record._id;
   if (id === void 0 || id === null) {
-    throw new chunkHDJID3GC_cjs.DatasetError(
-      'Dataset records must have an "id" or "_id" field for alignment'
-    );
+    throw new chunkDFC6FRTG_cjs.DatasetError('Dataset records must have an "id" or "_id" field for alignment');
   }
   return String(id);
 }
@@ -208,9 +207,7 @@ async function runModelParallel(dataset, modelFn, concurrency = 10) {
   for (const { prediction, record } of results) {
     const id = getRecordId(record);
     if (prediction.id !== id) {
-      throw new chunkHDJID3GC_cjs.DatasetError(
-        `Prediction ID mismatch: expected "${id}", got "${prediction.id}".`
-      );
+      throw new chunkDFC6FRTG_cjs.DatasetError(`Prediction ID mismatch: expected "${id}", got "${prediction.id}".`);
     }
     predictions.push(prediction);
     aligned.push({
@@ -258,7 +255,7 @@ function alignByKey(predictions, expected, options = {}) {
     }
   }
   if (strict && missingIds.length > 0) {
-    throw new chunkHDJID3GC_cjs.IntegrityError(
+    throw new chunkDFC6FRTG_cjs.IntegrityError(
       `${missingIds.length} prediction(s) have no matching expected record`,
       missingIds
     );
@@ -307,9 +304,7 @@ function checkIntegrity(dataset, options = {}) {
       }
     }
     if (requiredFields.length > 0) {
-      const missing = requiredFields.filter(
-        (field) => record[field] === void 0
-      );
+      const missing = requiredFields.filter((field) => record[field] === void 0);
       if (missing.length > 0) {
         missingFields.push({
           id: String(id ?? `record[${i}]`),
@@ -332,12 +327,14 @@ function checkIntegrity(dataset, options = {}) {
       issues.push(`${missingIds.length} record(s) missing ID`);
     }
     if (duplicateIds.length > 0) {
-      issues.push(`${duplicateIds.length} duplicate ID(s): ${duplicateIds.slice(0, 3).join(", ")}${duplicateIds.length > 3 ? "..." : ""}`);
+      issues.push(
+        `${duplicateIds.length} duplicate ID(s): ${duplicateIds.slice(0, 3).join(", ")}${duplicateIds.length > 3 ? "..." : ""}`
+      );
     }
     if (missingFields.length > 0) {
       issues.push(`${missingFields.length} record(s) missing required fields`);
     }
-    throw new chunkHDJID3GC_cjs.IntegrityError(`Dataset integrity check failed: ${issues.join("; ")}`);
+    throw new chunkDFC6FRTG_cjs.IntegrityError(`Dataset integrity check failed: ${issues.join("; ")}`);
   }
   return result;
 }
@@ -355,7 +352,7 @@ function validatePredictions(predictions, expectedIds) {
 // src/statistics/classification.ts
 function computeClassificationMetrics(actual, expected) {
-  const confusionMatrix = chunkHDJID3GC_cjs.buildConfusionMatrix(actual, expected);
+  const confusionMatrix = chunkDFC6FRTG_cjs.buildConfusionMatrix(actual, expected);
   return computeMetricsFromMatrix(confusionMatrix);
 }
 function computeMetricsFromMatrix(cm) {
@@ -363,10 +360,10 @@ function computeMetricsFromMatrix(cm) {
   let totalSupport = 0;
   let correctPredictions = 0;
   for (const label of cm.labels) {
-    const tp = chunkHDJID3GC_cjs.getTruePositives(cm, label);
-    const fp = chunkHDJID3GC_cjs.getFalsePositives(cm, label);
-    const fn = chunkHDJID3GC_cjs.getFalseNegatives(cm, label);
-    const support = chunkHDJID3GC_cjs.getSupport(cm, label);
+    const tp = chunkDFC6FRTG_cjs.getTruePositives(cm, label);
+    const fp = chunkDFC6FRTG_cjs.getFalsePositives(cm, label);
+    const fn = chunkDFC6FRTG_cjs.getFalseNegatives(cm, label);
+    const support = chunkDFC6FRTG_cjs.getSupport(cm, label);
     const precision = tp + fp > 0 ? tp / (tp + fp) : 0;
     const recall = tp + fn > 0 ? tp / (tp + fn) : 0;
     const f1 = precision + recall > 0 ? 2 * precision * recall / (precision + recall) : 0;
@@ -395,15 +392,15 @@ function computeMetricsFromMatrix(cm) {
   };
 }
 function computePrecision(actual, expected, targetClass) {
-  const cm = chunkHDJID3GC_cjs.buildConfusionMatrix(actual, expected);
-  const tp = chunkHDJID3GC_cjs.getTruePositives(cm, targetClass);
-  const fp = chunkHDJID3GC_cjs.getFalsePositives(cm, targetClass);
+  const cm = chunkDFC6FRTG_cjs.buildConfusionMatrix(actual, expected);
+  const tp = chunkDFC6FRTG_cjs.getTruePositives(cm, targetClass);
+  const fp = chunkDFC6FRTG_cjs.getFalsePositives(cm, targetClass);
   return tp + fp > 0 ? tp / (tp + fp) : 0;
 }
 function computeRecall(actual, expected, targetClass) {
-  const cm = chunkHDJID3GC_cjs.buildConfusionMatrix(actual, expected);
-  const tp = chunkHDJID3GC_cjs.getTruePositives(cm, targetClass);
-  const fn = chunkHDJID3GC_cjs.getFalseNegatives(cm, targetClass);
+  const cm = chunkDFC6FRTG_cjs.buildConfusionMatrix(actual, expected);
+  const tp = chunkDFC6FRTG_cjs.getTruePositives(cm, targetClass);
+  const fn = chunkDFC6FRTG_cjs.getFalseNegatives(cm, targetClass);
   return tp + fn > 0 ? tp / (tp + fn) : 0;
 }
 function computeF1(actual, expected, targetClass) {
@@ -430,6 +427,67 @@ function computeAccuracy(actual, expected) {
   return total > 0 ? correct / total : 0;
 }
+// src/statistics/regression.ts
+function computeRegressionMetrics(actual, expected) {
+  if (actual.length !== expected.length) {
+    throw new Error(
+      `Array length mismatch: actual has ${actual.length} elements, expected has ${expected.length}`
+    );
+  }
+  const n = actual.length;
+  if (n === 0) {
+    return { mae: 0, mse: 0, rmse: 0, r2: 0 };
+  }
+  const mae = computeMAE(actual, expected);
+  const mse = computeMSE(actual, expected);
+  const rmse = Math.sqrt(mse);
+  const r2 = computeR2(actual, expected);
+  return { mae, mse, rmse, r2 };
+}
+function computeMAE(actual, expected) {
+  if (actual.length !== expected.length || actual.length === 0) {
+    return 0;
+  }
+  let sum = 0;
+  for (let i = 0; i < actual.length; i++) {
+    sum += Math.abs((actual[i] ?? 0) - (expected[i] ?? 0));
+  }
+  return sum / actual.length;
+}
+function computeMSE(actual, expected) {
+  if (actual.length !== expected.length || actual.length === 0) {
+    return 0;
+  }
+  let sum = 0;
+  for (let i = 0; i < actual.length; i++) {
+    const diff = (actual[i] ?? 0) - (expected[i] ?? 0);
+    sum += diff * diff;
+  }
+  return sum / actual.length;
+}
+function computeR2(actual, expected) {
+  if (actual.length !== expected.length || actual.length === 0) {
+    return 0;
+  }
+  let meanExpected = 0;
+  for (const val of expected) {
+    meanExpected += val ?? 0;
+  }
+  meanExpected /= expected.length;
+  let ssTotal = 0;
+  let ssResidual = 0;
+  for (let i = 0; i < actual.length; i++) {
+    const exp = expected[i] ?? 0;
+    const act = actual[i] ?? 0;
+    ssTotal += (exp - meanExpected) ** 2;
+    ssResidual += (exp - act) ** 2;
+  }
+  if (ssTotal === 0) {
+    return ssResidual === 0 ? 1 : 0;
+  }
+  return 1 - ssResidual / ssTotal;
+}
 // src/statistics/distribution.ts
 function filterNumericValues(values) {
   return values.filter(
@@ -497,9 +555,9 @@ var BinarizeSelector = class {
       field: this.fieldName
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, threshold, metrics.accuracy, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, threshold, metrics.accuracy, this.fieldName);
     }
     return this;
   }
@@ -521,7 +579,7 @@ var BinarizeSelector = class {
       actualThreshold = threshold;
       const classMetrics = metrics.perClass[targetClass];
       if (!classMetrics) {
-        throw new chunkHDJID3GC_cjs.AssertionError(
+        throw new chunkDFC6FRTG_cjs.AssertionError(
           `Class "${targetClass}" not found in binarized predictions`,
           targetClass,
           Object.keys(metrics.perClass),
@@ -541,9 +599,9 @@ var BinarizeSelector = class {
       class: targetClass
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, actualThreshold, actualPrecision, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, actualThreshold, actualPrecision, this.fieldName);
     }
     return this;
   }
@@ -565,7 +623,7 @@ var BinarizeSelector = class {
       actualThreshold = threshold;
       const classMetrics = metrics.perClass[targetClass];
       if (!classMetrics) {
-        throw new chunkHDJID3GC_cjs.AssertionError(
+        throw new chunkDFC6FRTG_cjs.AssertionError(
           `Class "${targetClass}" not found in binarized predictions`,
           targetClass,
           Object.keys(metrics.perClass),
@@ -585,9 +643,9 @@ var BinarizeSelector = class {
       class: targetClass
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, actualThreshold, actualRecall, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, actualThreshold, actualRecall, this.fieldName);
     }
     return this;
   }
@@ -607,7 +665,7 @@ var BinarizeSelector = class {
       actualThreshold = threshold;
       const classMetrics = metrics.perClass[targetClass];
       if (!classMetrics) {
-        throw new chunkHDJID3GC_cjs.AssertionError(
+        throw new chunkDFC6FRTG_cjs.AssertionError(
           `Class "${targetClass}" not found in binarized predictions`,
           targetClass,
           Object.keys(metrics.perClass),
@@ -627,9 +685,9 @@ var BinarizeSelector = class {
       class: targetClass
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, actualThreshold, actualF1, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, actualThreshold, actualF1, this.fieldName);
     }
     return this;
   }
@@ -644,7 +702,7 @@ var BinarizeSelector = class {
       binarized: true,
       binarizeThreshold: this.threshold
     };
-    chunkHDJID3GC_cjs.recordFieldMetrics(fieldResult);
+    chunkDFC6FRTG_cjs.recordFieldMetrics(fieldResult);
     const result = {
       type: "confusionMatrix",
       passed: true,
@@ -652,7 +710,7 @@ var BinarizeSelector = class {
       field: this.fieldName
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     return this;
   }
   /**
@@ -694,11 +752,9 @@ var FieldSelector = class {
    * Throws a clear error if expected values are missing.
    */
   validateGroundTruth() {
-    const hasExpected = this.expectedValues.some(
-      (v) => v !== void 0 && v !== null
-    );
+    const hasExpected = this.expectedValues.some((v) => v !== void 0 && v !== null);
     if (!hasExpected) {
-      throw new chunkHDJID3GC_cjs.AssertionError(
+      throw new chunkDFC6FRTG_cjs.AssertionError(
         `Classification metric requires ground truth, but field "${this.fieldName}" has no expected values. Use expectStats(predictions, groundTruth) to provide expected values.`,
         void 0,
         void 0,
@@ -722,9 +778,9 @@ var FieldSelector = class {
       field: this.fieldName
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, threshold, metrics.accuracy, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, threshold, metrics.accuracy, this.fieldName);
     }
     return this;
   }
@@ -747,7 +803,7 @@ var FieldSelector = class {
       actualThreshold = threshold;
       const classMetrics = metrics.perClass[targetClass];
       if (!classMetrics) {
-        throw new chunkHDJID3GC_cjs.AssertionError(
+        throw new chunkDFC6FRTG_cjs.AssertionError(
           `Class "${targetClass}" not found in predictions`,
           targetClass,
           Object.keys(metrics.perClass),
@@ -767,9 +823,9 @@ var FieldSelector = class {
       class: targetClass
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, actualThreshold, actualPrecision, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, actualThreshold, actualPrecision, this.fieldName);
     }
     return this;
   }
@@ -792,7 +848,7 @@ var FieldSelector = class {
       actualThreshold = threshold;
       const classMetrics = metrics.perClass[targetClass];
       if (!classMetrics) {
-        throw new chunkHDJID3GC_cjs.AssertionError(
+        throw new chunkDFC6FRTG_cjs.AssertionError(
           `Class "${targetClass}" not found in predictions`,
           targetClass,
           Object.keys(metrics.perClass),
@@ -812,9 +868,9 @@ var FieldSelector = class {
       class: targetClass
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, actualThreshold, actualRecall, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, actualThreshold, actualRecall, this.fieldName);
     }
     return this;
   }
@@ -837,7 +893,7 @@ var FieldSelector = class {
       actualThreshold = threshold;
       const classMetrics = metrics.perClass[targetClass];
       if (!classMetrics) {
-        throw new chunkHDJID3GC_cjs.AssertionError(
+        throw new chunkDFC6FRTG_cjs.AssertionError(
           `Class "${targetClass}" not found in predictions`,
           targetClass,
           Object.keys(metrics.perClass),
@@ -857,9 +913,9 @@ var FieldSelector = class {
       class: targetClass
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, actualThreshold, actualF1, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, actualThreshold, actualF1, this.fieldName);
     }
     return this;
   }
@@ -873,7 +929,7 @@ var FieldSelector = class {
       metrics,
       binarized: false
     };
-    chunkHDJID3GC_cjs.recordFieldMetrics(fieldResult);
+    chunkDFC6FRTG_cjs.recordFieldMetrics(fieldResult);
     const result = {
       type: "confusionMatrix",
       passed: true,
@@ -881,7 +937,7 @@ var FieldSelector = class {
       field: this.fieldName
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     return this;
   }
   /**
@@ -901,7 +957,7 @@ var FieldSelector = class {
   toHavePercentageBelow(valueThreshold, percentageThreshold) {
     const numericActual = filterNumericValues(this.actualValues);
     if (numericActual.length === 0) {
-      throw new chunkHDJID3GC_cjs.AssertionError(
+      throw new chunkDFC6FRTG_cjs.AssertionError(
         `Field '${this.fieldName}' contains no numeric values (found 0 numeric out of ${this.actualValues.length} total values)`,
         percentageThreshold,
         void 0,
@@ -919,9 +975,14 @@ var FieldSelector = class {
       field: this.fieldName
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, percentageThreshold, actualPercentage, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(
+        result.message,
+        percentageThreshold,
+        actualPercentage,
+        this.fieldName
+      );
     }
     return this;
   }
@@ -942,7 +1003,7 @@ var FieldSelector = class {
   toHavePercentageAbove(valueThreshold, percentageThreshold) {
     const numericActual = filterNumericValues(this.actualValues);
     if (numericActual.length === 0) {
-      throw new chunkHDJID3GC_cjs.AssertionError(
+      throw new chunkDFC6FRTG_cjs.AssertionError(
         `Field '${this.fieldName}' contains no numeric values (found 0 numeric out of ${this.actualValues.length} total values)`,
         percentageThreshold,
         void 0,
@@ -960,9 +1021,146 @@ var FieldSelector = class {
       field: this.fieldName
     };
     this.assertions.push(result);
-    chunkHDJID3GC_cjs.recordAssertion(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
     if (!passed) {
-      throw new chunkHDJID3GC_cjs.AssertionError(result.message, percentageThreshold, actualPercentage, this.fieldName);
+      throw new chunkDFC6FRTG_cjs.AssertionError(
+        result.message,
+        percentageThreshold,
+        actualPercentage,
+        this.fieldName
+      );
+    }
+    return this;
+  }
+  // ============================================================================
+  // Regression Assertions
+  // ============================================================================
+  /**
+   * Validates that ground truth exists and both arrays contain numeric values.
+   * Returns the filtered numeric arrays for regression metrics.
+   */
+  validateRegressionInputs() {
+    this.validateGroundTruth();
+    const numericActual = filterNumericValues(this.actualValues);
+    const numericExpected = filterNumericValues(this.expectedValues);
+    if (numericActual.length === 0) {
+      throw new chunkDFC6FRTG_cjs.AssertionError(
+        `Regression metric requires numeric values, but field "${this.fieldName}" has no numeric actual values.`,
+        void 0,
+        void 0,
+        this.fieldName
+      );
+    }
+    if (numericExpected.length === 0) {
+      throw new chunkDFC6FRTG_cjs.AssertionError(
+        `Regression metric requires numeric values, but field "${this.fieldName}" has no numeric expected values.`,
+        void 0,
+        void 0,
+        this.fieldName
+      );
+    }
+    if (numericActual.length !== numericExpected.length) {
+      throw new chunkDFC6FRTG_cjs.AssertionError(
+        `Regression metric requires equal-length arrays, but got ${numericActual.length} actual and ${numericExpected.length} expected values.`,
+        numericExpected.length,
+        numericActual.length,
+        this.fieldName
+      );
+    }
+    return { actual: numericActual, expected: numericExpected };
+  }
+  /**
+   * Asserts that Mean Absolute Error is below a threshold.
+   * Requires numeric values in both actual and expected.
+   *
+   * @param threshold - Maximum allowed MAE
+   * @returns this for method chaining
+   *
+   * @example
+   * expectStats(predictions, groundTruth)
+   *   .field("score")
+   *   .toHaveMAEBelow(0.1)
+   */
+  toHaveMAEBelow(threshold) {
+    const { actual, expected } = this.validateRegressionInputs();
+    const metrics = computeRegressionMetrics(actual, expected);
+    const passed = metrics.mae <= threshold;
+    const result = {
+      type: "mae",
+      passed,
+      message: passed ? `MAE ${metrics.mae.toFixed(4)} is below ${threshold}` : `MAE ${metrics.mae.toFixed(4)} exceeds threshold ${threshold}`,
+      expected: threshold,
+      actual: metrics.mae,
+      field: this.fieldName
+    };
+    this.assertions.push(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
+    if (!passed) {
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, threshold, metrics.mae, this.fieldName);
+    }
+    return this;
+  }
+  /**
+   * Asserts that Root Mean Squared Error is below a threshold.
+   * Requires numeric values in both actual and expected.
+   *
+   * @param threshold - Maximum allowed RMSE
+   * @returns this for method chaining
+   *
+   * @example
+   * expectStats(predictions, groundTruth)
+   *   .field("score")
+   *   .toHaveRMSEBelow(0.15)
+   */
+  toHaveRMSEBelow(threshold) {
+    const { actual, expected } = this.validateRegressionInputs();
+    const metrics = computeRegressionMetrics(actual, expected);
+    const passed = metrics.rmse <= threshold;
+    const result = {
+      type: "rmse",
+      passed,
+      message: passed ? `RMSE ${metrics.rmse.toFixed(4)} is below ${threshold}` : `RMSE ${metrics.rmse.toFixed(4)} exceeds threshold ${threshold}`,
+      expected: threshold,
+      actual: metrics.rmse,
+      field: this.fieldName
+    };
+    this.assertions.push(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
+    if (!passed) {
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, threshold, metrics.rmse, this.fieldName);
+    }
+    return this;
+  }
+  /**
+   * Asserts that R-squared (coefficient of determination) is above a threshold.
+   * R² measures how well the predictions explain the variance in expected values.
+   * R² = 1.0 means perfect prediction, R² = 0 means prediction is no better than mean.
+   * Requires numeric values in both actual and expected.
+   *
+   * @param threshold - Minimum required R² value (0-1)
+   * @returns this for method chaining
+   *
+   * @example
+   * expectStats(predictions, groundTruth)
+   *   .field("score")
+   *   .toHaveR2Above(0.8)
+   */
+  toHaveR2Above(threshold) {
+    const { actual, expected } = this.validateRegressionInputs();
+    const metrics = computeRegressionMetrics(actual, expected);
+    const passed = metrics.r2 >= threshold;
+    const result = {
+      type: "r2",
+      passed,
+      message: passed ? `R\xB2 ${metrics.r2.toFixed(4)} is above ${threshold}` : `R\xB2 ${metrics.r2.toFixed(4)} is below threshold ${threshold}`,
+      expected: threshold,
+      actual: metrics.r2,
+      field: this.fieldName
+    };
+    this.assertions.push(result);
+    chunkDFC6FRTG_cjs.recordAssertion(result);
+    if (!passed) {
+      throw new chunkDFC6FRTG_cjs.AssertionError(result.message, threshold, metrics.r2, this.fieldName);
     }
     return this;
   }
@@ -999,16 +1197,17 @@ function normalizeInput(input) {
       expected: {}
     }));
   }
-  throw new Error("Invalid input to expectStats(): expected ModelRunResult, Prediction[], or AlignedRecord[]");
+  throw new Error(
+    "Invalid input to expectStats(): expected ModelRunResult, Prediction[], or AlignedRecord[]"
+  );
 }
-function expectStats(inputOrActual, expected) {
+function expectStats(inputOrActual, expected, options) {
   if (expected !== void 0) {
     if (!Array.isArray(inputOrActual)) {
-      throw new Error(
-        "When using two-argument expectStats(), first argument must be Prediction[]"
-      );
+      throw new Error("When using two-argument expectStats(), first argument must be Prediction[]");
     }
-    const aligned2 = alignByKey(inputOrActual, expected);
+    const alignOptions = options ? { idField: options.idField, strict: options.strict } : void 0;
+    const aligned2 = alignByKey(inputOrActual, expected, alignOptions);
     return new ExpectStats(aligned2);
   }
   const aligned = normalizeInput(inputOrActual);
@@ -1041,63 +1240,63 @@ var ExpectStats = class {
 Object.defineProperty(exports, "AssertionError", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.AssertionError; }
+  get: function () { return chunkDFC6FRTG_cjs.AssertionError; }
 });
 Object.defineProperty(exports, "ConfigurationError", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.ConfigurationError; }
+  get: function () { return chunkDFC6FRTG_cjs.ConfigurationError; }
 });
 Object.defineProperty(exports, "ConsoleReporter", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.ConsoleReporter; }
+  get: function () { return chunkDFC6FRTG_cjs.ConsoleReporter; }
 });
 Object.defineProperty(exports, "DatasetError", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.DatasetError; }
+  get: function () { return chunkDFC6FRTG_cjs.DatasetError; }
 });
 Object.defineProperty(exports, "EvalSenseError", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.EvalSenseError; }
+  get: function () { return chunkDFC6FRTG_cjs.EvalSenseError; }
 });
 Object.defineProperty(exports, "ExitCodes", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.ExitCodes; }
+  get: function () { return chunkDFC6FRTG_cjs.ExitCodes; }
 });
 Object.defineProperty(exports, "IntegrityError", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.IntegrityError; }
+  get: function () { return chunkDFC6FRTG_cjs.IntegrityError; }
 });
 Object.defineProperty(exports, "JsonReporter", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.JsonReporter; }
+  get: function () { return chunkDFC6FRTG_cjs.JsonReporter; }
 });
 Object.defineProperty(exports, "TestExecutionError", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.TestExecutionError; }
+  get: function () { return chunkDFC6FRTG_cjs.TestExecutionError; }
 });
 Object.defineProperty(exports, "buildConfusionMatrix", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.buildConfusionMatrix; }
+  get: function () { return chunkDFC6FRTG_cjs.buildConfusionMatrix; }
 });
 Object.defineProperty(exports, "discoverEvalFiles", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.discoverEvalFiles; }
+  get: function () { return chunkDFC6FRTG_cjs.discoverEvalFiles; }
 });
 Object.defineProperty(exports, "executeEvalFiles", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.executeEvalFiles; }
+  get: function () { return chunkDFC6FRTG_cjs.executeEvalFiles; }
 });
 Object.defineProperty(exports, "formatConfusionMatrix", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.formatConfusionMatrix; }
+  get: function () { return chunkDFC6FRTG_cjs.formatConfusionMatrix; }
 });
 Object.defineProperty(exports, "getExitCode", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.getExitCode; }
+  get: function () { return chunkDFC6FRTG_cjs.getExitCode; }
 });
 Object.defineProperty(exports, "parseReport", {
   enumerable: true,
-  get: function () { return chunkHDJID3GC_cjs.parseReport; }
+  get: function () { return chunkDFC6FRTG_cjs.parseReport; }
 });
 exports.afterAll = afterAll;
 exports.afterEach = afterEach;