npm - @evalgate/sdk - Versions diffs - 2.2.4 → 2.3.0 - Mend

@evalgate/sdk 2.2.4 → 2.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

package/CHANGELOG.md CHANGED Viewed

@@ -5,6 +5,32 @@ All notable changes to the @evalgate/sdk package will be documented in this file
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
+## [2.3.0] - 2026-03-04
+### Breaking
+- **`hasConsistency` / `hasConsistencyAsync` return `{ score, passed }` instead of `{ score, consistent }`** — aligns with every other assertion in the SDK that returns a `passed` field. If you were destructuring `consistent`, rename it to `passed`:
+  ```ts
+  // Before:
+  const { score, consistent } = hasConsistency(outputs);
+  // After:
+  const { score, passed } = hasConsistency(outputs);
+  ```
+- **`respondedWithinDuration` / `respondedWithinTimeSince` return `AssertionResult` instead of `boolean`** — these now return `{ name, passed, expected, actual, message }` like all other assertions, enabling uniform pipeline usage and failure messages. The deprecated `respondedWithinTime` alias also returns `AssertionResult`.
+  ```ts
+  // Before:
+  const ok = respondedWithinDuration(250, 500); // boolean
+  // After:
+  const { passed } = respondedWithinDuration(250, 500); // AssertionResult
+  ```
+### Added
+- **`computeBaselineChecksum` / `verifyBaselineChecksum` in main barrel** — previously only reachable via `@evalgate/sdk/cli/baseline` subpath. Now importable directly from `@evalgate/sdk`.
+- **`resetSentimentDeprecationWarning` in main barrel** — the one-time deprecation reset utility for `hasSentimentAsync` is now importable from the main entry point, making it easier to test deprecation behavior. `SentimentAsyncResult` type was already exported.
+---
 ## [2.2.3] - 2026-03-03
 ### Breaking

package/README.md CHANGED Viewed

@@ -3,7 +3,7 @@
 [![npm version](https://img.shields.io/npm/v/@evalgate/sdk.svg)](https://www.npmjs.com/package/@evalgate/sdk)
 [![npm downloads](https://img.shields.io/npm/dm/@evalgate/sdk.svg)](https://www.npmjs.com/package/@evalgate/sdk)
 [![TypeScript](https://img.shields.io/badge/TypeScript-strict-blue.svg)](https://www.typescriptlang.org/)
-[![SDK Tests](https://img.shields.io/badge/tests-159%20passed-brightgreen.svg)](#)
+[![SDK Tests](https://img.shields.io/badge/tests-541%20passed-brightgreen.svg)](#)
 [![Contract Version](https://img.shields.io/badge/report%20schema-v1-blue.svg)](#)
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)

package/dist/assertions.d.ts CHANGED Viewed

@@ -238,21 +238,21 @@ export declare function similarTo(text1: string, text2: string, threshold?: numb
  *
  * @param outputs - Array of LLM outputs to compare (minimum 2)
  * @param threshold - Optional minimum consistency score to return true (default 0.7)
- * @returns `{ score, consistent }` where `consistent` is `score >= threshold`
+ * @returns `{ score, passed }` where `passed` is `score >= threshold`
  *
  * @example
  * ```ts
- * const { score, consistent } = hasConsistency([
+ * const { score, passed } = hasConsistency([
  *   "The capital of France is Paris.",
  *   "Paris is the capital of France.",
  *   "France's capital city is Paris.",
  * ]);
- * // score ≈ 0.6-0.8, consistent = true at default threshold
+ * // score ≈ 0.6-0.8, passed = true at default threshold
  * ```
  */
 export declare function hasConsistency(outputs: string[], threshold?: number): {
     score: number;
-    consistent: boolean;
+    passed: boolean;
 };
 /**
  * LLM-backed consistency check. **Slow and accurate** — asks the LLM to
@@ -263,7 +263,7 @@ export declare function hasConsistency(outputs: string[], threshold?: number): {
  */
 export declare function hasConsistencyAsync(outputs: string[], config?: AssertionLLMConfig): Promise<{
     score: number;
-    consistent: boolean;
+    passed: boolean;
 }>;
 export declare function withinRange(value: number, min: number, max: number): boolean;
 export declare function isValidEmail(email: string): boolean;
@@ -298,19 +298,19 @@ export declare function hasFactualAccuracy(text: string, facts: string[]): boole
  * @param durationMs - The actual elapsed time in milliseconds
  * @param maxMs - Maximum allowed duration in milliseconds
  */
-export declare function respondedWithinDuration(durationMs: number, maxMs: number): boolean;
+export declare function respondedWithinDuration(durationMs: number, maxMs: number): AssertionResult;
 /**
  * Check if elapsed time since a start timestamp is within the allowed limit.
  * @param startTime - Timestamp from Date.now() captured before the operation
  * @param maxMs - Maximum allowed duration in milliseconds
  */
-export declare function respondedWithinTimeSince(startTime: number, maxMs: number): boolean;
+export declare function respondedWithinTimeSince(startTime: number, maxMs: number): AssertionResult;
 /**
  * @deprecated Use {@link respondedWithinDuration} (takes measured duration)
  * or {@link respondedWithinTimeSince} (takes start timestamp) instead.
  * This function takes a start timestamp, not a duration — the name is misleading.
  */
-export declare function respondedWithinTime(startTime: number, maxMs: number): boolean;
+export declare function respondedWithinTime(startTime: number, maxMs: number): AssertionResult;
 /**
  * Blocklist-based toxicity check (~80 terms across 9 categories).
  * **Fast and approximate** — catches explicit harmful language but has

package/dist/assertions.js CHANGED Viewed

@@ -884,24 +884,24 @@ function meanPairwiseJaccard(texts) {
  *
  * @param outputs - Array of LLM outputs to compare (minimum 2)
  * @param threshold - Optional minimum consistency score to return true (default 0.7)
- * @returns `{ score, consistent }` where `consistent` is `score >= threshold`
+ * @returns `{ score, passed }` where `passed` is `score >= threshold`
  *
  * @example
  * ```ts
- * const { score, consistent } = hasConsistency([
+ * const { score, passed } = hasConsistency([
  *   "The capital of France is Paris.",
  *   "Paris is the capital of France.",
  *   "France's capital city is Paris.",
  * ]);
- * // score ≈ 0.6-0.8, consistent = true at default threshold
+ * // score ≈ 0.6-0.8, passed = true at default threshold
  * ```
  */
 function hasConsistency(outputs, threshold = 0.7) {
     if (outputs.length < 2) {
-        return { score: 1, consistent: true };
+        return { score: 1, passed: true };
     }
     const score = meanPairwiseJaccard(outputs);
-    return { score, consistent: score >= threshold };
+    return { score, passed: score >= threshold };
 }
 /**
  * LLM-backed consistency check. **Slow and accurate** — asks the LLM to
@@ -912,7 +912,7 @@ function hasConsistency(outputs, threshold = 0.7) {
  */
 async function hasConsistencyAsync(outputs, config) {
     if (outputs.length < 2) {
-        return { score: 1, consistent: true };
+        return { score: 1, passed: true };
     }
     const numbered = outputs.map((o, i) => `Output ${i + 1}: "${o}"`).join("\n");
     const prompt = `Rate the semantic consistency of the following ${outputs.length} outputs on a scale from 0 to 100, where 100 means they all convey exactly the same meaning and 0 means they completely contradict each other. Reply with ONLY a number.\n\n${numbered}`;
@@ -921,7 +921,7 @@ async function hasConsistencyAsync(outputs, config) {
     const score = Number.isNaN(parsed)
         ? 0
         : Math.min(100, Math.max(0, parsed)) / 100;
-    return { score, consistent: score >= 0.7 };
+    return { score, passed: score >= 0.7 };
 }
 function withinRange(value, min, max) {
     return value >= min && value <= max;
@@ -1218,7 +1218,16 @@ function hasFactualAccuracy(text, facts) {
  * @param maxMs - Maximum allowed duration in milliseconds
  */
 function respondedWithinDuration(durationMs, maxMs) {
-    return durationMs <= maxMs;
+    const passed = durationMs <= maxMs;
+    return {
+        name: "respondedWithinDuration",
+        passed,
+        expected: `<= ${maxMs}ms`,
+        actual: `${durationMs}ms`,
+        message: passed
+            ? `Response time ${durationMs}ms is within ${maxMs}ms limit`
+            : `Response time ${durationMs}ms exceeded ${maxMs}ms limit`,
+    };
 }
 /**
  * Check if elapsed time since a start timestamp is within the allowed limit.
@@ -1226,7 +1235,17 @@ function respondedWithinDuration(durationMs, maxMs) {
  * @param maxMs - Maximum allowed duration in milliseconds
  */
 function respondedWithinTimeSince(startTime, maxMs) {
-    return Date.now() - startTime <= maxMs;
+    const elapsed = Date.now() - startTime;
+    const passed = elapsed <= maxMs;
+    return {
+        name: "respondedWithinTimeSince",
+        passed,
+        expected: `<= ${maxMs}ms`,
+        actual: `${elapsed}ms`,
+        message: passed
+            ? `Elapsed time ${elapsed}ms is within ${maxMs}ms limit`
+            : `Elapsed time ${elapsed}ms exceeded ${maxMs}ms limit`,
+    };
 }
 /**
  * @deprecated Use {@link respondedWithinDuration} (takes measured duration)

package/dist/cli/index.js CHANGED Viewed

File without changes

package/dist/index.d.ts CHANGED Viewed

@@ -9,7 +9,7 @@
 export { AIEvalClient } from "./client";
 import { AuthenticationError, EvalGateError, NetworkError, RateLimitError, ValidationError } from "./errors";
 export { EvalGateError, RateLimitError, AuthenticationError, ValidationError, NetworkError, };
-export { type AssertionLLMConfig, configureAssertions, containsAllRequiredFields, containsJSON, containsKeywords, containsLanguage, containsLanguageAsync, expect, followsInstructions, getAssertionConfig, hasConsistency, hasConsistencyAsync, hasFactualAccuracy, hasFactualAccuracyAsync, hasLength, hasNoHallucinations, hasNoHallucinationsAsync, hasNoToxicity, hasNoToxicityAsync, hasPII, hasReadabilityScore, hasSentiment, hasSentimentAsync, hasSentimentWithScore, hasValidCodeSyntax, hasValidCodeSyntaxAsync, isValidEmail, isValidURL, matchesPattern, matchesSchema, notContainsPII, respondedWithinDuration, respondedWithinTime, respondedWithinTimeSince, type SentimentAsyncResult, similarTo, toSemanticallyContain, withinRange, } from "./assertions";
+export { type AssertionLLMConfig, configureAssertions, containsAllRequiredFields, containsJSON, containsKeywords, containsLanguage, containsLanguageAsync, expect, followsInstructions, getAssertionConfig, hasConsistency, hasConsistencyAsync, hasFactualAccuracy, hasFactualAccuracyAsync, hasLength, hasNoHallucinations, hasNoHallucinationsAsync, hasNoToxicity, hasNoToxicityAsync, hasPII, hasReadabilityScore, hasSentiment, hasSentimentAsync, hasSentimentWithScore, hasValidCodeSyntax, hasValidCodeSyntaxAsync, isValidEmail, isValidURL, matchesPattern, matchesSchema, notContainsPII, resetSentimentDeprecationWarning, respondedWithinDuration, respondedWithinTime, respondedWithinTimeSince, type SentimentAsyncResult, similarTo, toSemanticallyContain, withinRange, } from "./assertions";
 export { EvalGateError as SDKError } from "./errors";
 import { createContext, EvalContext, getCurrentContext, withContext } from "./context";
 export { createContext, getCurrentContext as getContext, withContext, EvalContext as ContextManager, };
@@ -28,6 +28,7 @@ export { exportData, importData };
 export type { ExportFormat, ExportFormat as ExportType };
 export { RequestBatcher } from "./batch";
 export { CacheTTL } from "./cache";
+export { computeBaselineChecksum, verifyBaselineChecksum, } from "./cli/baseline";
 export { type CheckArgs, EXIT, parseArgs, runCheck } from "./cli/check";
 export { traceAnthropic } from "./integrations/anthropic";
 export { traceOpenAI } from "./integrations/openai";

package/dist/index.js CHANGED Viewed

@@ -8,9 +8,9 @@
  * @packageDocumentation
  */
 Object.defineProperty(exports, "__esModule", { value: true });
-exports.validateContext = exports.mergeContexts = exports.cloneContext = exports.ContextManager = exports.withContext = exports.getContext = exports.createContext = exports.SDKError = exports.withinRange = exports.toSemanticallyContain = exports.similarTo = exports.respondedWithinTimeSince = exports.respondedWithinTime = exports.respondedWithinDuration = exports.notContainsPII = exports.matchesSchema = exports.matchesPattern = exports.isValidURL = exports.isValidEmail = exports.hasValidCodeSyntaxAsync = exports.hasValidCodeSyntax = exports.hasSentimentWithScore = exports.hasSentimentAsync = exports.hasSentiment = exports.hasReadabilityScore = exports.hasPII = exports.hasNoToxicityAsync = exports.hasNoToxicity = exports.hasNoHallucinationsAsync = exports.hasNoHallucinations = exports.hasLength = exports.hasFactualAccuracyAsync = exports.hasFactualAccuracy = exports.hasConsistencyAsync = exports.hasConsistency = exports.getAssertionConfig = exports.followsInstructions = exports.expect = exports.containsLanguageAsync = exports.containsLanguage = exports.containsKeywords = exports.containsJSON = exports.containsAllRequiredFields = exports.configureAssertions = exports.NetworkError = exports.ValidationError = exports.AuthenticationError = exports.RateLimitError = exports.EvalGateError = exports.AIEvalClient = void 0;
-exports.streamEvaluation = exports.RateLimiter = exports.batchRead = exports.batchProcess = exports.REPORT_SCHEMA_VERSION = exports.GATE_EXIT = exports.GATE_CATEGORY = exports.ARTIFACTS = exports.PaginatedIterator = exports.encodeCursor = exports.decodeCursor = exports.createPaginatedIterator = exports.autoPaginateGenerator = exports.autoPaginate = exports.OTelExporter = exports.createOTelExporter = exports.extendExpectWithToPassGate = exports.Logger = exports.openAIChatEval = exports.traceOpenAI = exports.traceAnthropic = exports.runCheck = exports.parseArgs = exports.EXIT = exports.CacheTTL = exports.RequestBatcher = exports.importData = exports.exportData = exports.saveSnapshot = exports.compareSnapshots = exports.compareWithSnapshot = exports.snapshot = exports.TestSuite = exports.createTestSuite = exports.SpecRegistrationError = exports.SpecExecutionError = exports.RuntimeError = exports.EvalRuntimeError = exports.setActiveRuntime = exports.getActiveRuntime = exports.disposeActiveRuntime = exports.createEvalRuntime = exports.defaultLocalExecutor = exports.createLocalExecutor = exports.getFilteredSpecs = exports.evalai = exports.defineSuite = exports.defineEval = exports.createResult = exports.createEvalContext = void 0;
-exports.WorkflowTracer = exports.traceWorkflowStep = exports.traceLangChainAgent = exports.traceCrewAI = exports.traceAutoGen = exports.createWorkflowTracer = exports.EvaluationTemplates = void 0;
+exports.mergeContexts = exports.cloneContext = exports.ContextManager = exports.withContext = exports.getContext = exports.createContext = exports.SDKError = exports.withinRange = exports.toSemanticallyContain = exports.similarTo = exports.respondedWithinTimeSince = exports.respondedWithinTime = exports.respondedWithinDuration = exports.resetSentimentDeprecationWarning = exports.notContainsPII = exports.matchesSchema = exports.matchesPattern = exports.isValidURL = exports.isValidEmail = exports.hasValidCodeSyntaxAsync = exports.hasValidCodeSyntax = exports.hasSentimentWithScore = exports.hasSentimentAsync = exports.hasSentiment = exports.hasReadabilityScore = exports.hasPII = exports.hasNoToxicityAsync = exports.hasNoToxicity = exports.hasNoHallucinationsAsync = exports.hasNoHallucinations = exports.hasLength = exports.hasFactualAccuracyAsync = exports.hasFactualAccuracy = exports.hasConsistencyAsync = exports.hasConsistency = exports.getAssertionConfig = exports.followsInstructions = exports.expect = exports.containsLanguageAsync = exports.containsLanguage = exports.containsKeywords = exports.containsJSON = exports.containsAllRequiredFields = exports.configureAssertions = exports.NetworkError = exports.ValidationError = exports.AuthenticationError = exports.RateLimitError = exports.EvalGateError = exports.AIEvalClient = void 0;
+exports.batchProcess = exports.REPORT_SCHEMA_VERSION = exports.GATE_EXIT = exports.GATE_CATEGORY = exports.ARTIFACTS = exports.PaginatedIterator = exports.encodeCursor = exports.decodeCursor = exports.createPaginatedIterator = exports.autoPaginateGenerator = exports.autoPaginate = exports.OTelExporter = exports.createOTelExporter = exports.extendExpectWithToPassGate = exports.Logger = exports.openAIChatEval = exports.traceOpenAI = exports.traceAnthropic = exports.runCheck = exports.parseArgs = exports.EXIT = exports.verifyBaselineChecksum = exports.computeBaselineChecksum = exports.CacheTTL = exports.RequestBatcher = exports.importData = exports.exportData = exports.saveSnapshot = exports.compareSnapshots = exports.compareWithSnapshot = exports.snapshot = exports.TestSuite = exports.createTestSuite = exports.SpecRegistrationError = exports.SpecExecutionError = exports.RuntimeError = exports.EvalRuntimeError = exports.setActiveRuntime = exports.getActiveRuntime = exports.disposeActiveRuntime = exports.createEvalRuntime = exports.defaultLocalExecutor = exports.createLocalExecutor = exports.getFilteredSpecs = exports.evalai = exports.defineSuite = exports.defineEval = exports.createResult = exports.createEvalContext = exports.validateContext = void 0;
+exports.WorkflowTracer = exports.traceWorkflowStep = exports.traceLangChainAgent = exports.traceCrewAI = exports.traceAutoGen = exports.createWorkflowTracer = exports.EvaluationTemplates = exports.streamEvaluation = exports.RateLimiter = exports.batchRead = void 0;
 // Main SDK exports
 var client_1 = require("./client");
 Object.defineProperty(exports, "AIEvalClient", { enumerable: true, get: function () { return client_1.AIEvalClient; } });
@@ -55,6 +55,7 @@ Object.defineProperty(exports, "isValidURL", { enumerable: true, get: function (
 Object.defineProperty(exports, "matchesPattern", { enumerable: true, get: function () { return assertions_1.matchesPattern; } });
 Object.defineProperty(exports, "matchesSchema", { enumerable: true, get: function () { return assertions_1.matchesSchema; } });
 Object.defineProperty(exports, "notContainsPII", { enumerable: true, get: function () { return assertions_1.notContainsPII; } });
+Object.defineProperty(exports, "resetSentimentDeprecationWarning", { enumerable: true, get: function () { return assertions_1.resetSentimentDeprecationWarning; } });
 Object.defineProperty(exports, "respondedWithinDuration", { enumerable: true, get: function () { return assertions_1.respondedWithinDuration; } });
 Object.defineProperty(exports, "respondedWithinTime", { enumerable: true, get: function () { return assertions_1.respondedWithinTime; } });
 Object.defineProperty(exports, "respondedWithinTimeSince", { enumerable: true, get: function () { return assertions_1.respondedWithinTimeSince; } });
@@ -122,6 +123,9 @@ Object.defineProperty(exports, "RequestBatcher", { enumerable: true, get: functi
 var cache_1 = require("./cache");
 Object.defineProperty(exports, "CacheTTL", { enumerable: true, get: function () { return cache_1.CacheTTL; } });
 // CLI (programmatic use)
+var baseline_1 = require("./cli/baseline");
+Object.defineProperty(exports, "computeBaselineChecksum", { enumerable: true, get: function () { return baseline_1.computeBaselineChecksum; } });
+Object.defineProperty(exports, "verifyBaselineChecksum", { enumerable: true, get: function () { return baseline_1.verifyBaselineChecksum; } });
 var check_1 = require("./cli/check");
 Object.defineProperty(exports, "EXIT", { enumerable: true, get: function () { return check_1.EXIT; } });
 Object.defineProperty(exports, "parseArgs", { enumerable: true, get: function () { return check_1.parseArgs; } });

package/dist/otel.js CHANGED Viewed

@@ -70,7 +70,7 @@ class OTelExporter {
             endpoint: options.endpoint ?? "http://localhost:4318/v1/traces",
             serviceName: options.serviceName ?? "evalgate",
             resourceAttributes: options.resourceAttributes ?? {},
-            sdkVersion: options.sdkVersion ?? "2.2.4",
+            sdkVersion: options.sdkVersion ?? "2.3.0",
             headers: options.headers ?? {},
         };
     }

package/dist/version.d.ts CHANGED Viewed

@@ -3,5 +3,5 @@
  * X-EvalGate-SDK-Version: SDK package version
  * X-EvalGate-Spec-Version: OpenAPI spec version (docs/openapi.json info.version)
  */
-export declare const SDK_VERSION = "2.2.4";
-export declare const SPEC_VERSION = "2.2.3";
+export declare const SDK_VERSION = "2.3.0";
+export declare const SPEC_VERSION = "2.3.0";

package/dist/version.js CHANGED Viewed

@@ -6,5 +6,5 @@ exports.SPEC_VERSION = exports.SDK_VERSION = void 0;
  * X-EvalGate-SDK-Version: SDK package version
  * X-EvalGate-Spec-Version: OpenAPI spec version (docs/openapi.json info.version)
  */
-exports.SDK_VERSION = "2.2.4";
-exports.SPEC_VERSION = "2.2.3";
+exports.SDK_VERSION = "2.3.0";
+exports.SPEC_VERSION = "2.3.0";

package/package.json CHANGED Viewed

@@ -1,125 +1,125 @@
 {
-	"name": "@evalgate/sdk",
-	"version": "2.2.4",
-	"publishConfig": {
-		"access": "public",
-		"registry": "https://registry.npmjs.org/"
-	},
-	"description": "EvalGate SDK - Complete API Coverage with Performance Optimizations",
-	"main": "dist/index.js",
-	"module": "dist/index.js",
-	"types": "dist/index.d.ts",
-	"sideEffects": false,
-	"files": [
-		"dist",
-		"README.md",
-		"CHANGELOG.md"
-	],
-	"bin": {
-		"evalgate": "dist/cli/index.js"
-	},
-	"engines": {
-		"node": ">=16.0.0"
-	},
-	"scripts": {
-		"build": "tsc",
-		"dev": "tsc --watch",
-		"test": "vitest run",
-		"test:dist": "tsc && vitest run src/__tests__/dist-smoke.test.ts",
-		"otel:test": "bash otel-integration/run-test.sh",
-		"test:watch": "vitest"
-	},
-	"keywords": [
-		"ai",
-		"evaluation",
-		"llm",
-		"testing",
-		"observability",
-		"tracing",
-		"monitoring",
-		"annotations",
-		"webhooks",
-		"developer-tools",
-		"openai",
-		"anthropic"
-	],
-	"author": "EvalGate Team",
-	"license": "MIT",
-	"repository": {
-		"type": "git",
-		"url": "git+https://github.com/pauly7610/ai-evaluation-platform.git",
-		"directory": "src/packages/sdk"
-	},
-	"homepage": "https://evalgate.com",
-	"bugs": {
-		"url": "https://github.com/pauly7610/ai-evaluation-platform/issues"
-	},
-	"dependencies": {
-		"commander": "^14.0.0"
-	},
-	"peerDependencies": {
-		"@anthropic-ai/sdk": "^0.20.0",
-		"openai": "^4.0.0"
-	},
-	"peerDependenciesMeta": {
-		"openai": {
-			"optional": true
-		},
-		"@anthropic-ai/sdk": {
-			"optional": true
-		}
-	},
-	"devDependencies": {
-		"@types/node": "^20.0.0",
-		"ts-node": "^10.9.2",
-		"typescript": "^5.0.0",
-		"vitest": "^1.0.0"
-	},
-	"exports": {
-		".": {
-			"import": "./dist/index.js",
-			"require": "./dist/index.js",
-			"types": "./dist/index.d.ts"
-		},
-		"./assertions": {
-			"import": "./dist/assertions.js",
-			"require": "./dist/assertions.js",
-			"types": "./dist/assertions.d.ts"
-		},
-		"./testing": {
-			"import": "./dist/testing.js",
-			"require": "./dist/testing.js",
-			"types": "./dist/testing.d.ts"
-		},
-		"./integrations/openai": {
-			"import": "./dist/integrations/openai.js",
-			"require": "./dist/integrations/openai.js",
-			"types": "./dist/integrations/openai.d.ts"
-		},
-		"./integrations/anthropic": {
-			"import": "./dist/integrations/anthropic.js",
-			"require": "./dist/integrations/anthropic.js",
-			"types": "./dist/integrations/anthropic.d.ts"
-		},
-		"./integrations/openai-eval": {
-			"import": "./dist/integrations/openai-eval.js",
-			"require": "./dist/integrations/openai-eval.js",
-			"types": "./dist/integrations/openai-eval.d.ts"
-		},
-		"./matchers": {
-			"import": "./dist/matchers/index.js",
-			"require": "./dist/matchers/index.js",
-			"types": "./dist/matchers/index.d.ts"
-		},
-		"./regression": {
-			"import": "./dist/regression.js",
-			"require": "./dist/regression.js",
-			"types": "./dist/regression.d.ts"
-		},
-		"./otel": {
-			"import": "./dist/otel.js",
-			"require": "./dist/otel.js",
-			"types": "./dist/otel.d.ts"
-		}
-	}
-}
+  "name": "@evalgate/sdk",
+  "version": "2.3.0",
+  "publishConfig": {
+    "access": "public",
+    "registry": "https://registry.npmjs.org/"
+  },
+  "description": "EvalGate SDK - Complete API Coverage with Performance Optimizations",
+  "main": "dist/index.js",
+  "module": "dist/index.js",
+  "types": "dist/index.d.ts",
+  "sideEffects": false,
+  "files": [
+    "dist",
+    "README.md",
+    "CHANGELOG.md"
+  ],
+  "bin": {
+    "evalgate": "dist/cli/index.js"
+  },
+  "engines": {
+    "node": ">=16.0.0"
+  },
+  "keywords": [
+    "ai",
+    "evaluation",
+    "llm",
+    "testing",
+    "observability",
+    "tracing",
+    "monitoring",
+    "annotations",
+    "webhooks",
+    "developer-tools",
+    "openai",
+    "anthropic"
+  ],
+  "author": "EvalGate Team",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/pauly7610/ai-evaluation-platform.git",
+    "directory": "src/packages/sdk"
+  },
+  "homepage": "https://evalgate.com",
+  "bugs": {
+    "url": "https://github.com/pauly7610/ai-evaluation-platform/issues"
+  },
+  "dependencies": {
+    "commander": "^14.0.0"
+  },
+  "peerDependencies": {
+    "@anthropic-ai/sdk": "^0.20.0",
+    "openai": "^4.0.0"
+  },
+  "peerDependenciesMeta": {
+    "openai": {
+      "optional": true
+    },
+    "@anthropic-ai/sdk": {
+      "optional": true
+    }
+  },
+  "devDependencies": {
+    "@types/node": "^20.0.0",
+    "ts-node": "^10.9.2",
+    "typescript": "^5.0.0",
+    "vitest": "^1.0.0"
+  },
+  "exports": {
+    ".": {
+      "import": "./dist/index.js",
+      "require": "./dist/index.js",
+      "types": "./dist/index.d.ts"
+    },
+    "./assertions": {
+      "import": "./dist/assertions.js",
+      "require": "./dist/assertions.js",
+      "types": "./dist/assertions.d.ts"
+    },
+    "./testing": {
+      "import": "./dist/testing.js",
+      "require": "./dist/testing.js",
+      "types": "./dist/testing.d.ts"
+    },
+    "./integrations/openai": {
+      "import": "./dist/integrations/openai.js",
+      "require": "./dist/integrations/openai.js",
+      "types": "./dist/integrations/openai.d.ts"
+    },
+    "./integrations/anthropic": {
+      "import": "./dist/integrations/anthropic.js",
+      "require": "./dist/integrations/anthropic.js",
+      "types": "./dist/integrations/anthropic.d.ts"
+    },
+    "./integrations/openai-eval": {
+      "import": "./dist/integrations/openai-eval.js",
+      "require": "./dist/integrations/openai-eval.js",
+      "types": "./dist/integrations/openai-eval.d.ts"
+    },
+    "./matchers": {
+      "import": "./dist/matchers/index.js",
+      "require": "./dist/matchers/index.js",
+      "types": "./dist/matchers/index.d.ts"
+    },
+    "./regression": {
+      "import": "./dist/regression.js",
+      "require": "./dist/regression.js",
+      "types": "./dist/regression.d.ts"
+    },
+    "./otel": {
+      "import": "./dist/otel.js",
+      "require": "./dist/otel.js",
+      "types": "./dist/otel.d.ts"
+    }
+  },
+  "scripts": {
+    "build": "tsc",
+    "dev": "tsc --watch",
+    "test": "vitest run",
+    "test:dist": "tsc && vitest run src/__tests__/dist-smoke.test.ts",
+    "otel:test": "bash otel-integration/run-test.sh",
+    "test:watch": "vitest"
+  }
+}