npm - @evalgate/sdk - Versions diffs - 2.0.0 - Mend

@evalgate/sdk 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (141) hide show

package/CHANGELOG.md +638 -0
package/README.md +398 -0
package/dist/assertions.d.ts +189 -0
package/dist/assertions.js +662 -0
package/dist/batch.d.ts +68 -0
package/dist/batch.js +179 -0
package/dist/cache.d.ts +65 -0
package/dist/cache.js +131 -0
package/dist/cli/api.d.ts +108 -0
package/dist/cli/api.js +132 -0
package/dist/cli/baseline.d.ts +10 -0
package/dist/cli/baseline.js +172 -0
package/dist/cli/check.d.ts +73 -0
package/dist/cli/check.js +355 -0
package/dist/cli/ci-context.d.ts +6 -0
package/dist/cli/ci-context.js +112 -0
package/dist/cli/ci.d.ts +45 -0
package/dist/cli/ci.js +192 -0
package/dist/cli/config.d.ts +30 -0
package/dist/cli/config.js +230 -0
package/dist/cli/constants.d.ts +15 -0
package/dist/cli/constants.js +18 -0
package/dist/cli/diff.d.ts +173 -0
package/dist/cli/diff.js +685 -0
package/dist/cli/discover.d.ts +84 -0
package/dist/cli/discover.js +419 -0
package/dist/cli/doctor.d.ts +88 -0
package/dist/cli/doctor.js +675 -0
package/dist/cli/env.d.ts +21 -0
package/dist/cli/env.js +42 -0
package/dist/cli/explain.d.ts +58 -0
package/dist/cli/explain.js +561 -0
package/dist/cli/formatters/github.d.ts +8 -0
package/dist/cli/formatters/github.js +135 -0
package/dist/cli/formatters/human.d.ts +6 -0
package/dist/cli/formatters/human.js +110 -0
package/dist/cli/formatters/json.d.ts +6 -0
package/dist/cli/formatters/json.js +10 -0
package/dist/cli/formatters/pr-comment.d.ts +12 -0
package/dist/cli/formatters/pr-comment.js +103 -0
package/dist/cli/formatters/types.d.ts +103 -0
package/dist/cli/formatters/types.js +8 -0
package/dist/cli/gate.d.ts +21 -0
package/dist/cli/gate.js +179 -0
package/dist/cli/impact-analysis.d.ts +63 -0
package/dist/cli/impact-analysis.js +252 -0
package/dist/cli/index.d.ts +9 -0
package/dist/cli/index.js +332 -0
package/dist/cli/init.d.ts +16 -0
package/dist/cli/init.js +292 -0
package/dist/cli/manifest.d.ts +103 -0
package/dist/cli/manifest.js +282 -0
package/dist/cli/migrate.d.ts +41 -0
package/dist/cli/migrate.js +349 -0
package/dist/cli/policy-packs.d.ts +23 -0
package/dist/cli/policy-packs.js +89 -0
package/dist/cli/print-config.d.ts +29 -0
package/dist/cli/print-config.js +270 -0
package/dist/cli/profiles.d.ts +28 -0
package/dist/cli/profiles.js +30 -0
package/dist/cli/reason-codes.d.ts +17 -0
package/dist/cli/reason-codes.js +19 -0
package/dist/cli/regression-gate.d.ts +15 -0
package/dist/cli/regression-gate.js +341 -0
package/dist/cli/render/snippet.d.ts +5 -0
package/dist/cli/render/snippet.js +15 -0
package/dist/cli/render/sort.d.ts +10 -0
package/dist/cli/render/sort.js +24 -0
package/dist/cli/report/build-check-report.d.ts +19 -0
package/dist/cli/report/build-check-report.js +132 -0
package/dist/cli/run.d.ts +101 -0
package/dist/cli/run.js +395 -0
package/dist/cli/share.d.ts +17 -0
package/dist/cli/share.js +91 -0
package/dist/cli/upgrade.d.ts +15 -0
package/dist/cli/upgrade.js +492 -0
package/dist/cli/workspace.d.ts +31 -0
package/dist/cli/workspace.js +68 -0
package/dist/client.d.ts +368 -0
package/dist/client.js +893 -0
package/dist/client.request.test.d.ts +1 -0
package/dist/client.request.test.js +232 -0
package/dist/context.d.ts +134 -0
package/dist/context.js +215 -0
package/dist/errors.d.ts +82 -0
package/dist/errors.js +298 -0
package/dist/export.d.ts +195 -0
package/dist/export.js +344 -0
package/dist/index.d.ts +44 -0
package/dist/index.js +153 -0
package/dist/integrations/anthropic.d.ts +91 -0
package/dist/integrations/anthropic.js +163 -0
package/dist/integrations/openai-eval.d.ts +57 -0
package/dist/integrations/openai-eval.js +232 -0
package/dist/integrations/openai.d.ts +92 -0
package/dist/integrations/openai.js +160 -0
package/dist/local.d.ts +39 -0
package/dist/local.js +148 -0
package/dist/logger.d.ts +128 -0
package/dist/logger.js +227 -0
package/dist/matchers/index.d.ts +1 -0
package/dist/matchers/index.js +6 -0
package/dist/matchers/to-pass-gate.d.ts +29 -0
package/dist/matchers/to-pass-gate.js +35 -0
package/dist/pagination.d.ts +74 -0
package/dist/pagination.js +139 -0
package/dist/regression.d.ts +100 -0
package/dist/regression.js +44 -0
package/dist/runtime/adapters/config-to-dsl.d.ts +33 -0
package/dist/runtime/adapters/config-to-dsl.js +400 -0
package/dist/runtime/adapters/testsuite-to-dsl.d.ts +63 -0
package/dist/runtime/adapters/testsuite-to-dsl.js +276 -0
package/dist/runtime/context.d.ts +26 -0
package/dist/runtime/context.js +74 -0
package/dist/runtime/eval.d.ts +46 -0
package/dist/runtime/eval.js +244 -0
package/dist/runtime/execution-mode.d.ts +80 -0
package/dist/runtime/execution-mode.js +357 -0
package/dist/runtime/executor.d.ts +16 -0
package/dist/runtime/executor.js +152 -0
package/dist/runtime/registry.d.ts +78 -0
package/dist/runtime/registry.js +403 -0
package/dist/runtime/run-report.d.ts +200 -0
package/dist/runtime/run-report.js +222 -0
package/dist/runtime/types.d.ts +356 -0
package/dist/runtime/types.js +76 -0
package/dist/snapshot.d.ts +176 -0
package/dist/snapshot.js +322 -0
package/dist/streaming.d.ts +173 -0
package/dist/streaming.js +268 -0
package/dist/testing.d.ts +273 -0
package/dist/testing.js +317 -0
package/dist/types.d.ts +754 -0
package/dist/types.js +54 -0
package/dist/utils/input-hash.d.ts +8 -0
package/dist/utils/input-hash.js +41 -0
package/dist/version.d.ts +7 -0
package/dist/version.js +10 -0
package/dist/workflows.d.ts +389 -0
package/dist/workflows.js +671 -0
package/package.json +117 -0

package/dist/runtime/adapters/config-to-dsl.js ADDED Viewed

@@ -0,0 +1,400 @@
+"use strict";
+/**
+ * Config → DSL Adapter - LAYER 2 Compatibility Bridge
+ *
+ * Migrates existing evalgate.config.json and TestSuite configurations
+ * to the new defineEval() DSL without breaking user workflows.
+ */
+var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) { // reuse a helper already present on `this`; otherwise define one that exposes m[k] on o under the key k2
+    if (k2 === undefined) k2 = k; // target key defaults to the source key
+    var desc = Object.getOwnPropertyDescriptor(m, k);
+    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) { // no descriptor, an accessor on a non-__esModule source, or a writable/configurable data property: bind through a getter that reads m[k] on every access
+      desc = { enumerable: true, get: function() { return m[k]; } };
+    }
+    Object.defineProperty(o, k2, desc);
+}) : (function(o, m, k, k2) { // fallback when Object.create is unavailable: copy the current value
+    if (k2 === undefined) k2 = k;
+    o[k2] = m[k];
+}));
+var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) { // reuse a helper already present on `this`; otherwise define one that stores v as o["default"]
+    Object.defineProperty(o, "default", { enumerable: true, value: v });
+}) : function(o, v) { // fallback when Object.create is unavailable: plain assignment
+    o["default"] = v;
+});
+var __importStar = (this && this.__importStar) || (function () { // reuse a helper already present on `this`; otherwise build one
+    var ownKeys = function(o) { // replaces itself on first call with the implementation chosen below
+        ownKeys = Object.getOwnPropertyNames || function (o) {
+            var ar = [];
+            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
+            return ar;
+        };
+        return ownKeys(o);
+    };
+    return function (mod) {
+        if (mod && mod.__esModule) return mod; // modules flagged __esModule are returned untouched
+        var result = {};
+        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]); // bind every own key except "default" onto the wrapper
+        __setModuleDefault(result, mod); // the original module value becomes result.default
+        return result;
+    };
+})();
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.migrateTestSuiteToDSL = migrateTestSuiteToDSL;
+exports.migrateConfigToDSL = migrateConfigToDSL;
+exports.migrateProjectToDSL = migrateProjectToDSL;
+const fs = __importStar(require("node:fs"));
+const path = __importStar(require("node:path"));
+const registry_1 = require("../registry");
+/**
+ * Convert TestSuite to defineEval() specifications
+ */
+function migrateTestSuiteToDSL(testSuite, outputPath) {
+    const result = {
+        success: true,
+        specsGenerated: 0,
+        errors: [],
+        warnings: [],
+        outputPath,
+    };
+    try {
+        // Create isolated runtime for migration
+        const _runtime = (0, registry_1.createEvalRuntime)();
+        // Use the runtime handle to define specs
+        const _boundDefineEval = (nameOrConfig, executor, options) => {
+            // The runtime handle manages the active runtime internally
+            const { defineEval } = require("../eval");
+            return defineEval(nameOrConfig, executor, options);
+        };
+        // Get test suite data via public methods
+        // Note: We need to access the internal data structure for migration
+        // This is a limitation of the current TestSuite design
+        const suiteData = extractTestSuiteData(testSuite);
+        // Generate DSL file content
+        const dslContent = generateDSLFromTestSuiteData(suiteData);
+        // Write DSL file
+        fs.writeFileSync(outputPath, dslContent, "utf-8");
+        result.specsGenerated = suiteData.cases.length;
+        result.warnings.push(`Migrated ${suiteData.cases.length} test cases from TestSuite to defineEval() DSL`);
+        // Cleanup runtime
+        (0, registry_1.disposeActiveRuntime)();
+    }
+    catch (error) {
+        result.success = false;
+        result.errors.push(`Migration failed: ${error instanceof Error ? error.message : String(error)}`);
+    }
+    return result;
+}
+/**
+ * Extract data from TestSuite instance
+ * This is a workaround for the private properties
+ *
+ * The argument is currently ignored: every call returns the same placeholder
+ * structure with an empty case list and fixed config values.
+ *
+ * @param _testSuite - TestSuite instance (unused)
+ * @returns Object with `name`, `cases` and `config` fields
+ */
+function extractTestSuiteData(_testSuite) {
+    // Since TestSuite properties are private, we need to reconstruct from usage
+    // This is a limitation that should be addressed in a future version
+    // For now, we'll create a basic structure and warn the user
+    return {
+        name: "test-suite", // Can't access private name
+        cases: [], // Can't access private config
+        config: {
+            cases: [],
+            timeout: 30000,
+            parallel: true,
+            stopOnFailure: false,
+            retries: 0,
+        },
+    };
+}
+/**
+ * Convert evalgate.config.json to DSL specifications
+ */
+function migrateConfigToDSL(configPath, outputPath) {
+    const result = {
+        success: true,
+        specsGenerated: 0,
+        errors: [],
+        warnings: [],
+        outputPath,
+    };
+    try {
+        if (!fs.existsSync(configPath)) {
+            result.success = false;
+            result.errors.push(`Configuration file not found: ${configPath}`);
+            return result;
+        }
+        const configContent = fs.readFileSync(configPath, "utf-8");
+        const config = JSON.parse(configContent);
+        // Create isolated runtime for migration
+        const _runtime = (0, registry_1.createEvalRuntime)();
+        // Use the runtime handle to define specs
+        const _boundDefineEval = (nameOrConfig, executor, options) => {
+            // The runtime handle manages the active runtime internally
+            const { defineEval } = require("../eval");
+            return defineEval(nameOrConfig, executor, options);
+        };
+        // Generate basic DSL structure from config
+        const dslContent = generateDSLFromConfig(config);
+        // Write DSL file
+        fs.writeFileSync(outputPath, dslContent, "utf-8");
+        result.specsGenerated = 1; // Basic structure generated
+        result.warnings.push("Generated basic DSL structure from evalgate.config.json. Manual completion required.");
+        // Cleanup runtime
+        (0, registry_1.disposeActiveRuntime)();
+    }
+    catch (error) {
+        result.success = false;
+        result.errors.push(`Config migration failed: ${error instanceof Error ? error.message : String(error)}`);
+    }
+    return result;
+}
+/**
+ * Generate DSL code from TestSuite data
+ */
+function generateDSLFromTestSuiteData(suiteData) {
+    const imports = [
+        `// Auto-generated from TestSuite: ${suiteData.name}`,
+        `// Generated at: ${new Date().toISOString()}`,
+        `// This file replaces the old TestSuite configuration`,
+        "",
+        `import { defineEval, createResult } from '@evalgate/sdk';`,
+        "",
+    ];
+    const specs = suiteData.cases.map((testCase, index) => {
+        const specName = testCase.id || `${suiteData.name}-case-${index + 1}`;
+        // Generate assertion code
+        const assertionCode = testCase.assertions
+            ? generateAssertionCode(testCase.assertions)
+            : "// No assertions defined";
+        return [
+            `defineEval("${specName}", async (context) => {`,
+            `  // Original input: ${testCase.input}`,
+            `  const input = context.input;`,
+            `  `,
+            `  // TODO: Replace with your actual agent/LLM call`,
+            `  const output = await simulateAgent(input);`,
+            `  `,
+            `  // Assertions:`,
+            assertionCode,
+            `  `,
+            `  return createResult({`,
+            `    pass: allAssertionsPassed,`,
+            `    score: allAssertionsPassed ? 100 : 0,`,
+            `    assertions: assertionResults,`,
+            `    metadata: {`,
+            `      originalInput: ${JSON.stringify(testCase.input)},`,
+            `      originalExpected: ${testCase.expected ? JSON.stringify(testCase.expected) : "undefined"},`,
+            `    },`,
+            `  });`,
+            `}, {`,
+            `  description: "Migrated from TestSuite case",`,
+            `  tags: ["migrated", "testsuite"],`,
+            `});`,
+            "",
+        ].join("\n");
+    });
+    const helperFunctions = [
+        `// Helper function to simulate your agent/LLM`,
+        `// Replace this with your actual implementation`,
+        `async function simulateAgent(input: string): Promise<string> {`,
+        `  // TODO: Implement your actual agent/LLM call here`,
+        `  // For now, return a simple echo as placeholder`,
+        `  return \`Agent response to: \${input}\`;`,
+        `}`,
+        "",
+    ];
+    return [...imports, ...helperFunctions, ...specs].join("\n");
+}
+/**
+ * Generate DSL code from configuration
+ *
+ * Returns the text of a TypeScript file with a single "basic-evaluation"
+ * defineEval() call and a `simulateAgent` placeholder helper. The only value
+ * read from `config` is `evaluationId`, which is embedded in the metadata.
+ *
+ * @param config - Parsed configuration object
+ * @returns Generated source code as a single string
+ */
+function generateDSLFromConfig(config) {
+    return [
+        `// Auto-generated from evalgate.config.json`,
+        `// Generated at: ${new Date().toISOString()}`,
+        `// This is a basic DSL structure - complete with your actual evaluations`,
+        "",
+        `import { defineEval, createResult } from '@evalgate/sdk';`,
+        "",
+        `defineEval("basic-evaluation", async (context) => {`,
+        `  const input = context.input;`,
+        `  `,
+        `  // TODO: Replace with your actual agent/LLM call`,
+        `  const output = await simulateAgent(input);`,
+        `  `,
+        `  // TODO: Add your actual evaluation logic`,
+        `  const pass = output.length > 0;`,
+        `  const score = pass ? 100 : 0;`,
+        `  `,
+        `  return createResult({`,
+        `    pass,`,
+        `    score,`,
+        `    metadata: {`,
+        `      evaluationId: ${config.evaluationId ? JSON.stringify(config.evaluationId) : "undefined"},`, // a falsy evaluationId is emitted as the bare identifier undefined
+        `      input,`,
+        `      output,`,
+        `    },`,
+        `  });`,
+        `}, {`,
+        `  description: "Basic evaluation migrated from evalgate.config.json",`,
+        `  tags: ["migrated", "config"],`,
+        `});`,
+        "",
+        `// Helper function to simulate your agent/LLM`,
+        `// Replace this with your actual implementation`,
+        `async function simulateAgent(input: string): Promise<string> {`,
+        `  // TODO: Implement your actual agent/LLM call here`,
+        `  return \`Agent response to: \${input}\`;`,
+        `}`,
+        "",
+    ].join("\n");
+}
+/**
+ * Generate assertion code from TestSuite assertions
+ *
+ * Emits placeholder source only: one TODO comment line per assertion, the
+ * declarations of `assertionResults` and `allAssertionsPassed`, and a
+ * commented-out example. The assertions themselves are never inspected
+ * beyond their count.
+ *
+ * @param assertions - Array of assertions from a test case
+ * @returns Generated source lines joined with newlines
+ */
+function generateAssertionCode(assertions) {
+    // Since we can't analyze the assertion functions at runtime,
+    // we generate placeholder code that users need to complete
+    return [
+        `  // Original assertions: ${assertions.length} defined`,
+        `  // TODO: Manually convert these assertions to evaluation logic:`,
+        ...assertions.map((_, index) => `  // assertion ${index + 1}: <convert to evaluation logic>`),
+        `  `,
+        `  const assertionResults = [];`,
+        `  let allAssertionsPassed = true;`,
+        `  `,
+        `  // TODO: Add your actual assertion logic here`,
+        `  // Example:`,
+        `  // const containsExpected = output.includes(expected);`,
+        `  // assertionResults.push({ name: "contains-expected", passed: containsExpected });`,
+        `  // if (!containsExpected) allAssertionsPassed = false;`,
+    ].join("\n");
+}
+/**
+ * Discover and migrate all TestSuite configurations in a project
+ */
+function migrateProjectToDSL(projectRoot, options = {}) {
+    const result = {
+        success: true,
+        specsGenerated: 0,
+        errors: [],
+        warnings: [],
+        outputPath: options.outputDir || path.join(projectRoot, ".evalgate", "migrated"),
+    };
+    try {
+        // Find evalgate.config.json or evalai.config.json
+        const evalgatePath = path.join(projectRoot, "evalgate.config.json");
+        const legacyPath = path.join(projectRoot, "evalai.config.json");
+        const configPath = fs.existsSync(evalgatePath)
+            ? evalgatePath
+            : fs.existsSync(legacyPath)
+                ? legacyPath
+                : null;
+        if (configPath) {
+            const outputPath = path.join(result.outputPath, "evalgate.config.migrated.ts");
+            if (!options.dryRun) {
+                fs.mkdirSync(path.dirname(outputPath), { recursive: true });
+                const configResult = migrateConfigToDSL(configPath, outputPath);
+                result.specsGenerated += configResult.specsGenerated;
+                result.errors.push(...configResult.errors);
+                result.warnings.push(...configResult.warnings);
+            }
+            else {
+                result.warnings.push(`Would migrate evalgate.config.json to ${outputPath}`);
+            }
+        }
+        // Look for TestSuite usage in TypeScript/JavaScript files
+        const testFiles = findTestSuiteFiles(projectRoot);
+        for (const testFile of testFiles) {
+            const outputPath = path.join(result.outputPath, path.basename(testFile).replace(/\.(ts|js)$/, ".migrated.ts"));
+            if (!options.dryRun) {
+                fs.mkdirSync(path.dirname(outputPath), { recursive: true });
+                // Note: Actual TestSuite parsing would require AST analysis
+                // For now, we create placeholder files
+                const placeholderContent = generatePlaceholderDSL(testFile);
+                fs.writeFileSync(outputPath, placeholderContent, "utf-8");
+                result.specsGenerated += 1;
+                result.warnings.push(`Created migration placeholder for ${testFile}`);
+            }
+            else {
+                result.warnings.push(`Would migrate ${testFile} to ${outputPath}`);
+            }
+        }
+        if (result.specsGenerated === 0) {
+            result.warnings.push("No TestSuite configurations found to migrate");
+        }
+    }
+    catch (error) {
+        result.success = false;
+        result.errors.push(`Project migration failed: ${error instanceof Error ? error.message : String(error)}`);
+    }
+    return result;
+}
+/**
+ * Find files that might contain TestSuite usage
+ *
+ * Walks `projectRoot` recursively and returns the paths of all `.ts`/`.js`
+ * files whose text contains "TestSuite". Directories named `node_modules`
+ * or starting with "." are not entered. This is a plain substring match, so
+ * comments and unrelated identifiers containing the word also count.
+ *
+ * @param projectRoot - Directory to start scanning from
+ * @returns Paths of matching files, in traversal order
+ */
+function findTestSuiteFiles(projectRoot) {
+    const testFiles = [];
+    function scanDirectory(dir) {
+        if (!fs.existsSync(dir))
+            return;
+        const entries = fs.readdirSync(dir, { withFileTypes: true }); // not wrapped in try/catch: an unreadable directory throws to the caller
+        for (const entry of entries) {
+            const fullPath = path.join(dir, entry.name);
+            if (entry.isDirectory() &&
+                !entry.name.startsWith(".") &&
+                entry.name !== "node_modules") {
+                scanDirectory(fullPath);
+            }
+            else if (entry.isFile() && /\.(ts|js)$/.test(entry.name)) { // the pattern also matches .d.ts files
+                try {
+                    const content = fs.readFileSync(fullPath, "utf-8");
+                    if (content.includes("createTestSuite") || // NOTE(review): redundant, any text containing "createTestSuite" also contains "TestSuite"
+                        content.includes("TestSuite")) {
+                        testFiles.push(fullPath);
+                    }
+                }
+                catch {
+                    // Skip files that can't be read
+                }
+            }
+        }
+    }
+    scanDirectory(projectRoot);
+    return testFiles;
+}
+/**
+ * Generate placeholder DSL for files that need manual migration
+ *
+ * Returns the text of a TypeScript file with one defineEval() call named
+ * after the original file's base name, plus a `simulateAgent` stub. Nothing
+ * is read from the original file; only its path is embedded.
+ *
+ * @param originalFile - Path of the file that contains TestSuite usage
+ * @returns Generated source code as a single string
+ */
+function generatePlaceholderDSL(originalFile) {
+    return [
+        `// Migration placeholder for: ${originalFile}`,
+        `// Generated at: ${new Date().toISOString()}`,
+        `// This file contains TestSuite usage that needs manual migration`,
+        "",
+        `import { defineEval, createResult } from '@evalgate/sdk';`,
+        "",
+        `defineEval("placeholder-from-${path.basename(originalFile)}", async (context) => {`, // NOTE(review): the base name is interpolated unescaped, so a file name containing a double quote or backslash would yield invalid generated code
+        `  // TODO: Manually migrate TestSuite from ${originalFile}`,
+        `  const input = context.input;`,
+        `  `,
+        `  // Replace with your actual evaluation logic`,
+        `  const output = await simulateAgent(input);`,
+        `  `,
+        `  return createResult({`,
+        `    pass: output.length > 0,`,
+        `    score: output.length > 0 ? 100 : 0,`,
+        `    metadata: {`,
+        `      migratedFrom: ${JSON.stringify(originalFile)},`, // JSON.stringify yields a correctly escaped string literal here
+        `    },`,
+        `  });`,
+        `}, {`,
+        `  description: "Placeholder - complete migration manually",`,
+        `  tags: ["placeholder", "needs-migration"],`,
+        `});`,
+        "",
+        `async function simulateAgent(input: string): Promise<string> {`,
+        `  // TODO: Implement your actual agent/LLM call`,
+        `  return \`Response to: \${input}\`;`,
+        `}`,
+        "",
+    ].join("\n");
+}

package/dist/runtime/adapters/testsuite-to-dsl.d.ts ADDED Viewed

@@ -0,0 +1,63 @@
+/**
+ * COMPAT-202: Legacy TestSuite → defineEval adapter
+ *
+ * Converts legacy TestSuite instances to defineEval specifications
+ * without forcing migration. Enables lossless where possible.
+ */
+import type { TestSuite } from "../../testing";
+import type { EvalSpec } from "../types";
+/**
+ * Adapter configuration options
+ *
+ * All fields are optional.
+ * NOTE(review): none of the function declarations in this file reference
+ * this interface; they take Partial<TestSuiteOptions>, which redeclares the
+ * same three fields. Confirm whether this type is still needed.
+ */
+export interface TestSuiteAdapterOptions {
+    /** Include provenance metadata in generated specs */
+    includeProvenance?: boolean;
+    /** Preserve original test IDs */
+    preserveIds?: boolean;
+    /** Generate helper functions for assertions */
+    generateHelpers?: boolean;
+}
+/**
+ * Convert TestSuite to defineEval specifications
+ *
+ * @param suite - Legacy TestSuite instance
+ * @param options - Optional adapter settings; any subset of TestSuiteOptions
+ *                  (suite configuration fields plus the adapter flags)
+ * @returns Array of EvalSpec definitions
+ */
+export declare function adaptTestSuite(suite: TestSuite, options?: Partial<TestSuiteOptions>): EvalSpec[];
+/**
+ * Generate defineEval code from TestSuite
+ *
+ * @param suite - Legacy TestSuite instance
+ * @param options - Optional code generation settings; any subset of
+ *                  TestSuiteOptions
+ * @returns Generated TypeScript code
+ */
+export declare function generateDefineEvalCode(suite: TestSuite, options?: Partial<TestSuiteOptions>): string;
+/**
+ * Configuration shape of a legacy TestSuite as seen by the adapter
+ *
+ * Only `cases` is required; the remaining fields are optional.
+ */
+export interface TestSuiteConfig {
+    /** Test cases to run */
+    cases: unknown[];
+    /** Function that generates output from input */
+    executor?: (input: string) => Promise<string>;
+    /** Run tests in parallel (default: true) */
+    parallel?: boolean;
+    /** Stop on first failure (default: false) */
+    stopOnFailure?: boolean;
+    /** Timeout per test case in ms (default: 30000) */
+    timeout?: number;
+    /** Retry failing cases N times (default: 0) */
+    retries?: number;
+}
+/**
+ * TestSuite options (kept for compatibility)
+ *
+ * Extends TestSuiteConfig with three optional adapter flags, so it is a
+ * superset of the suite configuration rather than a plain alias.
+ */
+export interface TestSuiteOptions extends TestSuiteConfig {
+    /** Include provenance metadata in generated specs */
+    includeProvenance?: boolean;
+    /** Preserve original test IDs */
+    preserveIds?: boolean;
+    /** Generate helper functions for assertions */
+    generateHelpers?: boolean;
+}