npm - @pauly4010/evalai-sdk - Versions diffs - 1.9.0 → 1.9.1 - Mend

@pauly4010/evalai-sdk 1.9.0 → 1.9.1

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (57)

package/README.md +136 -23
package/dist/assertions.js +51 -18
package/dist/batch.js +8 -2
package/dist/cli/api.js +3 -1
package/dist/cli/check.js +19 -6
package/dist/cli/ci-context.js +3 -1
package/dist/cli/config.js +28 -8
package/dist/cli/diff.js +14 -9
package/dist/cli/discover.js +18 -7
package/dist/cli/doctor.js +43 -9
package/dist/cli/explain.js +37 -11
package/dist/cli/formatters/human.js +4 -1
package/dist/cli/formatters/pr-comment.js +3 -1
package/dist/cli/gate.js +6 -2
package/dist/cli/impact-analysis.js +6 -5
package/dist/cli/index.js +18 -6
package/dist/cli/manifest.d.ts +3 -5
package/dist/cli/manifest.js +21 -14
package/dist/cli/migrate.js +4 -4
package/dist/cli/policy-packs.js +8 -2
package/dist/cli/print-config.js +19 -4
package/dist/cli/regression-gate.js +8 -2
package/dist/cli/report/build-check-report.js +8 -2
package/dist/cli/run.js +11 -5
package/dist/cli/share.js +3 -1
package/dist/cli/upgrade.js +2 -1
package/dist/client.d.ts +16 -19
package/dist/client.js +60 -43
package/dist/client.request.test.d.ts +1 -1
package/dist/client.request.test.js +222 -147
package/dist/context.js +3 -1
package/dist/errors.js +11 -4
package/dist/export.js +3 -1
package/dist/index.d.ts +8 -8
package/dist/index.js +19 -19
package/dist/integrations/anthropic.d.ts +20 -1
package/dist/integrations/openai-eval.js +4 -2
package/dist/integrations/openai.d.ts +24 -1
package/dist/local.js +3 -1
package/dist/logger.js +6 -2
package/dist/pagination.js +6 -2
package/dist/runtime/adapters/config-to-dsl.js +12 -9
package/dist/runtime/adapters/testsuite-to-dsl.d.ts +1 -1
package/dist/runtime/adapters/testsuite-to-dsl.js +11 -6
package/dist/runtime/eval.d.ts +1 -1
package/dist/runtime/eval.js +12 -5
package/dist/runtime/execution-mode.js +13 -9
package/dist/runtime/registry.js +8 -21
package/dist/runtime/run-report.d.ts +0 -2
package/dist/runtime/run-report.js +12 -10
package/dist/testing.js +7 -2
package/dist/types.d.ts +100 -69
package/dist/utils/input-hash.js +4 -1
package/dist/version.d.ts +1 -1
package/dist/version.js +1 -1
package/dist/workflows.js +62 -14
package/package.json +115 -111

package/dist/cli/discover.js CHANGED Viewed

@@ -123,7 +123,7 @@ async function getProjectMetadata(projectRoot) {
         hasPackageJson = true;
         projectName = parsed.name || "unknown";
     }
-    catch (error) {
+    catch (_error) {
         // No package.json
     }
     const hasGit = await fs
@@ -173,9 +173,13 @@ function analyzeSpecFile(filePath, content) {
         content.includes("model=") ||
         content.includes("openai") ||
         content.includes("anthropic");
-    const usesTools = content.includes("tool:") || content.includes("function.") || content.includes("call(");
+    const usesTools = content.includes("tool:") ||
+        content.includes("function.") ||
+        content.includes("call(");
     // Check for assertions
-    const hasAssertions = content.includes("assert") || content.includes("expect") || content.includes("should");
+    const hasAssertions = content.includes("assert") ||
+        content.includes("expect") ||
+        content.includes("should");
     // Generate ID from file path
     const id = generateSpecId(filePath);
     return {
@@ -234,7 +238,9 @@ function analyzeComplexity(content) {
     const hasLoops = content.includes("for") || content.includes("while");
     const hasConditionals = content.includes("if") || content.includes("switch");
     const hasTryCatch = content.includes("try") || content.includes("catch");
-    const hasExternalCalls = content.includes("fetch") || content.includes("http") || content.includes("api");
+    const hasExternalCalls = content.includes("fetch") ||
+        content.includes("http") ||
+        content.includes("api");
     let complexityScore = 0;
     if (lines > 50)
         complexityScore += 2;
@@ -261,7 +267,10 @@ function analyzeComplexity(content) {
  */
 function generateSpecId(filePath) {
     const relativePath = path.relative(process.cwd(), filePath);
-    const hash = Buffer.from(relativePath).toString("base64").replace(/[+/=]/g, "").slice(0, 8);
+    const hash = Buffer.from(relativePath)
+        .toString("base64")
+        .replace(/[+/=]/g, "")
+        .slice(0, 8);
     return hash;
 }
 /**
@@ -381,10 +390,12 @@ function printRecommendations(stats) {
     else {
         console.log(`   🏆 Excellent coverage! Consider running evalai run`);
     }
-    if (!stats.executionMode.hasSpecRuntime && !stats.executionMode.hasLegacyRuntime) {
+    if (!stats.executionMode.hasSpecRuntime &&
+        !stats.executionMode.hasLegacyRuntime) {
         console.log(`   🆕 New project? Try 'evalai init' to get started`);
     }
-    if (stats.executionMode.hasLegacyRuntime && !stats.executionMode.hasSpecRuntime) {
+    if (stats.executionMode.hasLegacyRuntime &&
+        !stats.executionMode.hasSpecRuntime) {
         console.log(`   🔄 Legacy project detected. Try 'evalai migrate config' to upgrade`);
     }
     if (stats.executionMode.hasSpecRuntime) {

package/dist/cli/doctor.js CHANGED Viewed

@@ -113,7 +113,15 @@ function parseFlags(argv) {
             evaluationId = String(merged.evaluationId);
     }
     const strict = raw.strict === "true" || raw.strict === "1";
-    return { report, format: report ? "json" : fmt, strict, baseUrl, apiKey, evaluationId, baseline };
+    return {
+        report,
+        format: report ? "json" : fmt,
+        strict,
+        baseUrl,
+        apiKey,
+        evaluationId,
+        baseline,
+    };
 }
 // ── Individual checks ──
 function checkProject(cwd) {
@@ -224,7 +232,10 @@ function checkBaseline(cwd) {
         };
     }
     const schemaVersion = typeof data.schemaVersion === "number" ? data.schemaVersion : undefined;
-    const hash = (0, node_crypto_1.createHash)("sha256").update(JSON.stringify(data)).digest("hex").slice(0, 12);
+    const hash = (0, node_crypto_1.createHash)("sha256")
+        .update(JSON.stringify(data))
+        .digest("hex")
+        .slice(0, 12);
     const updatedAt = typeof data.updatedAt === "string" ? data.updatedAt : undefined;
     // Staleness: warn if baseline older than 30 days
     let stale = false;
@@ -239,7 +250,12 @@ function checkBaseline(cwd) {
             status: "fail",
             message: `Unsupported baseline schemaVersion: ${schemaVersion ?? "missing"}`,
             remediation: "Run: npx evalai baseline init  (creates schemaVersion 1)",
-            baselineInfo: { path: "evals/baseline.json", exists: true, hash, schemaVersion },
+            baselineInfo: {
+                path: "evals/baseline.json",
+                exists: true,
+                hash,
+                schemaVersion,
+            },
         };
     }
     if (stale) {
@@ -249,7 +265,13 @@ function checkBaseline(cwd) {
             status: "warn",
             message: `Baseline is stale (last updated ${updatedAt})`,
             remediation: "Run: npx evalai baseline update",
-            baselineInfo: { path: "evals/baseline.json", exists: true, hash, schemaVersion, stale },
+            baselineInfo: {
+                path: "evals/baseline.json",
+                exists: true,
+                hash,
+                schemaVersion,
+                stale,
+            },
         };
     }
     return {
@@ -257,7 +279,13 @@ function checkBaseline(cwd) {
         label: "Baseline file",
         status: "pass",
         message: `schemaVersion ${schemaVersion}, hash ${hash}`,
-        baselineInfo: { path: "evals/baseline.json", exists: true, hash, schemaVersion, stale },
+        baselineInfo: {
+            path: "evals/baseline.json",
+            exists: true,
+            hash,
+            schemaVersion,
+            stale,
+        },
     };
 }
 function checkAuth(apiKey) {
@@ -437,7 +465,8 @@ function checkCiWiring(cwd) {
             ciInfo: { workflowPath, exists: true },
         };
     }
-    if (!content.includes("evalai") && !content.includes("@pauly4010/evalai-sdk")) {
+    if (!content.includes("evalai") &&
+        !content.includes("@pauly4010/evalai-sdk")) {
         return {
             id: "ci_wiring",
             label: "CI wiring",
@@ -551,7 +580,9 @@ async function runDoctor(argv) {
         };
     }
     // 7. Eval access (async, depends on auth + connectivity)
-    if (flags.apiKey && flags.evaluationId && connectivityResult.status !== "fail") {
+    if (flags.apiKey &&
+        flags.evaluationId &&
+        connectivityResult.status !== "fail") {
         try {
             const accessResult = await checkEvalAccess(flags.baseUrl, flags.apiKey, flags.evaluationId, flags.baseline);
             checks.push(accessResult);
@@ -592,7 +623,9 @@ async function runDoctor(argv) {
     if (flags.report || flags.format === "json") {
         const redactedConfig = {
             ...(configResult.config ?? {}),
-            path: configResult.configPath ? path.relative(cwd, configResult.configPath) : null,
+            path: configResult.configPath
+                ? path.relative(cwd, configResult.configPath)
+                : null,
         };
         const bundle = {
             timestamp: new Date().toISOString(),
@@ -604,7 +637,8 @@ async function runDoctor(argv) {
             config: redactedConfig,
             baseline: baselineResult.baselineInfo,
             api: {
-                reachable: connectivityResult.status === "pass" || connectivityResult.status === "warn",
+                reachable: connectivityResult.status === "pass" ||
+                    connectivityResult.status === "warn",
                 latencyMs: connectivityResult.latencyMs,
             },
             ci: ciResult.ciInfo,

package/dist/cli/explain.js CHANGED Viewed

@@ -87,7 +87,9 @@ const REPORT_SEARCH_PATHS = [
 ];
 function findReport(cwd, explicitPath) {
     if (explicitPath) {
-        const abs = path.isAbsolute(explicitPath) ? explicitPath : path.join(cwd, explicitPath);
+        const abs = path.isAbsolute(explicitPath)
+            ? explicitPath
+            : path.join(cwd, explicitPath);
         return fs.existsSync(abs) ? abs : null;
     }
     for (const rel of REPORT_SEARCH_PATHS) {
@@ -115,16 +117,20 @@ function classifyRootCauses(report) {
         causes.push("cost_regression");
     }
     // Latency regression
-    if (reasonCode === "LATENCY_BUDGET_EXCEEDED" || reasonCode === "LATENCY_RISK") {
+    if (reasonCode === "LATENCY_BUDGET_EXCEEDED" ||
+        reasonCode === "LATENCY_RISK") {
         causes.push("latency_regression");
     }
     // Coverage drop (test count decreased)
-    if (reasonCode === "LOW_SAMPLE_SIZE" || reasonCode === "INSUFFICIENT_EVIDENCE") {
+    if (reasonCode === "LOW_SAMPLE_SIZE" ||
+        reasonCode === "INSUFFICIENT_EVIDENCE") {
         causes.push("coverage_drop");
     }
     // Analyze failed cases for drift patterns
     if (failedCases.length > 0) {
-        const outputs = failedCases.map((fc) => (fc.output ?? "").toLowerCase()).filter(Boolean);
+        const outputs = failedCases
+            .map((fc) => (fc.output ?? "").toLowerCase())
+            .filter(Boolean);
         const expectedOutputs = failedCases
             .map((fc) => (fc.expectedOutput ?? "").toLowerCase())
             .filter(Boolean);
@@ -136,7 +142,9 @@ function classifyRootCauses(report) {
             causes.push("formatting_drift");
         }
         // Tool use drift: output mentions tool calls or function calls
-        const hasToolIssue = outputs.some((o) => o.includes("tool_call") || o.includes("function_call") || o.includes("tool_use"));
+        const hasToolIssue = outputs.some((o) => o.includes("tool_call") ||
+            o.includes("function_call") ||
+            o.includes("tool_use"));
         if (hasToolIssue) {
             causes.push("tool_use_drift");
         }
@@ -356,7 +364,9 @@ function buildExplainOutput(report, reportPath) {
 function buildFromCheckReport(report, reportPath) {
     const failedCases = report.failedCases ?? [];
     // Top failures (up to 3)
-    const topFailures = failedCases.slice(0, 3).map((fc, i) => ({
+    const topFailures = failedCases
+        .slice(0, 3)
+        .map((fc, i) => ({
         rank: i + 1,
         name: fc.name,
         input: fc.inputSnippet || fc.input,
@@ -444,7 +454,11 @@ function buildFromBuiltinReport(report, reportPath) {
 }
 // ── Output formatting ──
 function printHuman(output) {
-    const verdictIcon = output.verdict === "pass" ? "\u2705" : output.verdict === "warn" ? "\u26A0\uFE0F" : "\u274C";
+    const verdictIcon = output.verdict === "pass"
+        ? "\u2705"
+        : output.verdict === "warn"
+            ? "\u26A0\uFE0F"
+            : "\u274C";
     console.log(`\n  evalai explain\n`);
     console.log(`  ${verdictIcon} Verdict: ${output.verdict.toUpperCase()}`);
     if (output.score != null) {
@@ -460,7 +474,11 @@ function printHuman(output) {
     if (output.changes.length > 0) {
         console.log("\n  What changed:");
         for (const c of output.changes) {
-            const arrow = c.direction === "worse" ? "\u2193" : c.direction === "better" ? "\u2191" : "\u2192";
+            const arrow = c.direction === "worse"
+                ? "\u2193"
+                : c.direction === "better"
+                    ? "\u2191"
+                    : "\u2192";
             console.log(`    ${arrow} ${c.metric}: ${c.baseline} \u2192 ${c.current}`);
         }
     }
@@ -490,7 +508,11 @@ function printHuman(output) {
     if (output.suggestedFixes.length > 0) {
         console.log("\n  Suggested fixes:");
         for (const fix of output.suggestedFixes) {
-            const pIcon = fix.priority === "high" ? "\u203C\uFE0F" : fix.priority === "medium" ? "\u2757" : "\u2022";
+            const pIcon = fix.priority === "high"
+                ? "\u203C\uFE0F"
+                : fix.priority === "medium"
+                    ? "\u2757"
+                    : "\u2022";
             console.log(`    ${pIcon} ${fix.action}`);
             console.log(`      ${fix.detail}`);
         }
@@ -503,7 +525,9 @@ async function runExplain(argv) {
     const cwd = process.cwd();
     const reportPath = findReport(cwd, flags.reportPath);
     if (!reportPath) {
-        const searched = flags.reportPath ? flags.reportPath : REPORT_SEARCH_PATHS.join(", ");
+        const searched = flags.reportPath
+            ? flags.reportPath
+            : REPORT_SEARCH_PATHS.join(", ");
         console.error(`\n  \u274C No report found. Searched: ${searched}`);
         console.error("  Run a gate first:");
         console.error("    npx evalai gate --format json");
@@ -519,7 +543,9 @@ async function runExplain(argv) {
         return 1;
     }
     // Schema version compatibility check
-    const reportSchema = typeof reportData.schemaVersion === "number" ? reportData.schemaVersion : undefined;
+    const reportSchema = typeof reportData.schemaVersion === "number"
+        ? reportData.schemaVersion
+        : undefined;
     if (reportSchema != null && reportSchema > types_1.CHECK_REPORT_SCHEMA_VERSION) {
         console.error(`\n  \u26A0\uFE0F  Report schema version ${reportSchema} is newer than this CLI supports (v${types_1.CHECK_REPORT_SCHEMA_VERSION}).`);
         console.error("  Update your SDK: npm install @pauly4010/evalai-sdk@latest\n");

package/dist/cli/formatters/human.js CHANGED Viewed

@@ -43,7 +43,10 @@ function formatHuman(report) {
         lines.push("Next: View full report above, fix failing cases, or adjust gate with --minScore / --maxDrop / --warnDrop");
     }
     if (report.explain &&
-        (report.breakdown01 || report.contribPts || report.flags?.length || report.policyEvidence)) {
+        (report.breakdown01 ||
+            report.contribPts ||
+            report.flags?.length ||
+            report.policyEvidence)) {
         lines.push("");
         lines.push("--- Explain ---");
         if (report.contribPts) {

package/dist/cli/formatters/pr-comment.js CHANGED Viewed

@@ -34,7 +34,9 @@ function buildPrComment(report) {
         }
     }
     else {
-        lines.push(passed ? "## ✅ EvalAI Regression Gate — PASSED" : "## 🚨 EvalAI Regression Gate — FAILED");
+        lines.push(passed
+            ? "## ✅ EvalAI Regression Gate — PASSED"
+            : "## 🚨 EvalAI Regression Gate — FAILED");
     }
     lines.push("");
     // Score + Delta (skip when gate not applied)

package/dist/cli/gate.js CHANGED Viewed

@@ -55,7 +55,9 @@ function evaluateGate(args, quality) {
             reasonMessage: `cost $${costUsd.toFixed(4)} exceeds maxCostUsd $${args.maxCostUsd.toFixed(4)}`,
         };
     }
-    if (args.maxLatencyMs != null && avgLatencyMs != null && avgLatencyMs > args.maxLatencyMs) {
+    if (args.maxLatencyMs != null &&
+        avgLatencyMs != null &&
+        avgLatencyMs > args.maxLatencyMs) {
         return {
             exitCode: constants_1.EXIT.SCORE_BELOW,
             passed: false,
@@ -102,7 +104,9 @@ function evaluateGate(args, quality) {
         };
     }
     // warnDrop: soft warning band; maxDrop: hard fail
-    if (args.maxDrop !== undefined && regressionDelta !== null && regressionDelta < -args.maxDrop) {
+    if (args.maxDrop !== undefined &&
+        regressionDelta !== null &&
+        regressionDelta < -args.maxDrop) {
         return {
             exitCode: constants_1.EXIT.REGRESSION,
             passed: false,

package/dist/cli/impact-analysis.js CHANGED Viewed

@@ -48,9 +48,9 @@ exports.analyzeImpact = analyzeImpact;
 exports.printHumanResults = printHumanResults;
 exports.printJsonResults = printJsonResults;
 exports.runImpactAnalysisCLI = runImpactAnalysisCLI;
+const node_child_process_1 = require("node:child_process");
 const fs = __importStar(require("node:fs/promises"));
 const path = __importStar(require("node:path"));
-const node_child_process_1 = require("node:child_process");
 /**
  * Run impact analysis
  */
@@ -87,7 +87,7 @@ async function readManifest(projectRoot = process.cwd()) {
         const content = await fs.readFile(manifestPath, "utf-8");
         return JSON.parse(content);
     }
-    catch (error) {
+    catch (_error) {
         return null;
     }
 }
@@ -138,7 +138,7 @@ function analyzeImpact(changedFiles, manifest) {
         if (!specsByFile.has(spec.filePath)) {
             specsByFile.set(spec.filePath, []);
         }
-        specsByFile.get(spec.filePath).push(spec);
+        specsByFile.get(spec.filePath)?.push(spec);
         // By dependencies
         const deps = [
             ...spec.dependsOn.prompts,
@@ -150,7 +150,7 @@ function analyzeImpact(changedFiles, manifest) {
             if (!specsByDependency.has(dep)) {
                 specsByDependency.set(dep, []);
             }
-            specsByDependency.get(dep).push(spec);
+            specsByDependency.get(dep)?.push(spec);
         }
     }
     // Analyze each changed file
@@ -179,7 +179,8 @@ function analyzeImpact(changedFiles, manifest) {
             // Add all specs
             for (const spec of manifest.specs) {
                 impactedSpecIds.add(spec.id);
-                reasonBySpecId[spec.id] = `Unknown file changed: ${changedFile} (safe fallback)`;
+                reasonBySpecId[spec.id] =
+                    `Unknown file changed: ${changedFile} (safe fallback)`;
             }
             break; // No need to continue analyzing
         }

package/dist/cli/index.js CHANGED Viewed

@@ -160,9 +160,13 @@ else if (subcommand === "impact-analysis") {
     const changedFilesIndex = args.indexOf("--changed-files");
     const formatIndex = args.indexOf("--format");
     const baseBranch = baseIndex !== -1 ? args[baseIndex + 1] : "main";
-    const changedFiles = changedFilesIndex !== -1 ? args[changedFilesIndex + 1]?.split(",") : undefined;
+    const changedFiles = changedFilesIndex !== -1
+        ? args[changedFilesIndex + 1]?.split(",")
+        : undefined;
     const format = formatIndex !== -1 ? args[formatIndex + 1] : "human";
-    (0, impact_analysis_1.runImpactAnalysisCLI)({ baseBranch, changedFiles, format }).catch((err) => {
+    (0, impact_analysis_1.runImpactAnalysisCLI)({ baseBranch, changedFiles, format })
+        .then(() => process.exit(0))
+        .catch((err) => {
         console.error(`EvalAI ERROR: ${err instanceof Error ? err.message : String(err)}`);
         process.exit(2);
     });
@@ -186,7 +190,9 @@ else if (subcommand === "run") {
         baseBranch,
         format,
         writeResults,
-    }).catch((err) => {
+    })
+        .then(() => process.exit(0))
+        .catch((err) => {
         console.error(`EvalAI ERROR: ${err instanceof Error ? err.message : String(err)}`);
         process.exit(2);
     });
@@ -200,7 +206,9 @@ else if (subcommand === "diff") {
     const base = baseIndex !== -1 ? args[baseIndex + 1] : undefined;
     const head = headIndex !== -1 ? args[headIndex + 1] : undefined;
     const format = formatIndex !== -1 ? args[formatIndex + 1] : "human";
-    (0, diff_1.runDiffCLI)({ base, head, format }).catch((err) => {
+    (0, diff_1.runDiffCLI)({ base, head, format })
+        .then(() => process.exit(0))
+        .catch((err) => {
         console.error(`EvalAI ERROR: ${err instanceof Error ? err.message : String(err)}`);
         process.exit(2);
     });
@@ -214,9 +222,13 @@ else if (subcommand === "ci") {
     const writeResultsIndex = args.indexOf("--write-results");
     const base = baseIndex !== -1 ? args[baseIndex + 1] : undefined;
     const impactedOnly = impactedOnlyIndex !== -1;
-    const format = formatIndex !== -1 ? args[formatIndex + 1] : "human";
+    const format = formatIndex !== -1
+        ? args[formatIndex + 1]
+        : "human";
     const writeResults = writeResultsIndex !== -1;
-    (0, ci_1.runCICLI)({ base, impactedOnly, format, writeResults }).catch((err) => {
+    (0, ci_1.runCICLI)({ base, impactedOnly, format, writeResults })
+        .then(() => process.exit(0))
+        .catch((err) => {
         console.error(`EvalAI ERROR: ${err instanceof Error ? err.message : String(err)}`);
         process.exit(2);
     });

package/dist/cli/manifest.d.ts CHANGED Viewed

@@ -6,16 +6,14 @@
  *
  * This is the compiler output that everything else consumes.
  */
-import type { SpecAnalysis } from "./discover";
 import type { ExecutionModeConfig } from "../runtime/execution-mode";
+import { SDK_VERSION } from "../version";
+import type { SpecAnalysis } from "./discover";
+export { SDK_VERSION };
 /**
  * Manifest schema version
  */
 export declare const MANIFEST_SCHEMA_VERSION = 1;
-/**
- * SDK version from package.json
- */
-export declare const SDK_VERSION = "1.8.0";
 /**
  * Evaluation Manifest Schema
  */

package/dist/cli/manifest.js CHANGED Viewed

@@ -41,22 +41,20 @@ var __importStar = (this && this.__importStar) || (function () {
     };
 })();
 Object.defineProperty(exports, "__esModule", { value: true });
-exports.SDK_VERSION = exports.MANIFEST_SCHEMA_VERSION = void 0;
+exports.MANIFEST_SCHEMA_VERSION = exports.SDK_VERSION = void 0;
 exports.generateManifest = generateManifest;
 exports.writeManifest = writeManifest;
 exports.readManifest = readManifest;
 exports.readLock = readLock;
+const crypto = __importStar(require("node:crypto"));
 const fs = __importStar(require("node:fs/promises"));
 const path = __importStar(require("node:path"));
-const crypto = __importStar(require("node:crypto"));
+const version_1 = require("../version");
+Object.defineProperty(exports, "SDK_VERSION", { enumerable: true, get: function () { return version_1.SDK_VERSION; } });
 /**
  * Manifest schema version
  */
 exports.MANIFEST_SCHEMA_VERSION = 1;
-/**
- * SDK version from package.json
- */
-exports.SDK_VERSION = "1.8.0";
 /**
  * Generate evaluation manifest from discovery results
  */
@@ -73,7 +71,7 @@ async function generateManifest(specs, projectRoot, projectName, executionMode)
         if (!specsByFile.has(normalizedPath)) {
             specsByFile.set(normalizedPath, []);
         }
-        specsByFile.get(normalizedPath).push(spec);
+        specsByFile.get(normalizedPath)?.push(spec);
     }
     // Process each file
     for (const [filePath, fileSpecs] of specsByFile) {
@@ -100,7 +98,7 @@ async function generateManifest(specs, projectRoot, projectName, executionMode)
         },
         runtime: {
             mode: executionMode.mode,
-            sdkVersion: exports.SDK_VERSION,
+            sdkVersion: version_1.SDK_VERSION,
         },
         specFiles,
         specs: processedSpecs,
@@ -163,7 +161,8 @@ function extractDependencies(content) {
     const dependsOnMatch = content.match(/dependsOn\s*:\s*({[^}]+})/s);
     if (dependsOnMatch) {
         try {
-            const deps = eval(`(${dependsOnMatch[1]})`);
+            // Use JSON.parse instead of eval for safety
+            const deps = JSON.parse(dependsOnMatch[1]);
             return {
                 prompts: deps.prompts || [],
                 datasets: deps.datasets || [],
@@ -171,8 +170,14 @@ function extractDependencies(content) {
                 code: deps.code || [],
             };
         }
-        catch (error) {
-            // Fall back to simple extraction
+        catch (_error) {
+            // If parsing fails, return empty dependencies
+            return {
+                prompts: [],
+                datasets: [],
+                tools: [],
+                code: [],
+            };
         }
     }
     // Simple extraction as fallback
@@ -184,8 +189,10 @@ function extractDependencies(content) {
     };
     for (const [type, pattern] of Object.entries(patterns)) {
         let match;
-        while ((match = pattern.exec(content)) !== null) {
+        match = pattern.exec(content);
+        while (match !== null) {
             dependsOn[type].push(match[1]);
+            match = pattern.exec(content);
         }
     }
     return dependsOn;
@@ -256,7 +263,7 @@ async function readManifest(projectRoot) {
         const content = await fs.readFile(manifestPath, "utf-8");
         return JSON.parse(content);
     }
-    catch (error) {
+    catch (_error) {
         return null;
     }
 }
@@ -269,7 +276,7 @@ async function readLock(projectRoot) {
         const content = await fs.readFile(lockPath, "utf-8");
         return JSON.parse(content);
     }
-    catch (error) {
+    catch (_error) {
         return null;
     }
 }

package/dist/cli/migrate.js CHANGED Viewed

@@ -43,9 +43,9 @@ exports.migrateConfig = migrateConfig;
 exports.createMigrateCommand = createMigrateCommand;
 exports.validateConfigFile = validateConfigFile;
 exports.previewMigration = previewMigration;
-const commander_1 = require("commander");
 const fs = __importStar(require("node:fs/promises"));
 const path = __importStar(require("node:path"));
+const commander_1 = require("commander");
 const testsuite_to_dsl_1 = require("../runtime/adapters/testsuite-to-dsl");
 const testing_1 = require("../testing");
 /**
@@ -97,7 +97,7 @@ function extractTestSuitesFromConfig(config) {
 /**
  * Generate DSL file header
  */
-function generateFileHeader(config, options) {
+function generateFileHeader(_config, options) {
     const timestamp = new Date().toISOString();
     const inputPath = path.resolve(options.input);
     const outputPath = path.resolve(options.output);
@@ -127,7 +127,7 @@ function generateFileHeader(config, options) {
 /**
  * Generate helper functions for the entire file
  */
-function generateGlobalHelpers(config, options) {
+function generateGlobalHelpers(config, _options) {
     const helpers = [];
     // Add executor helper if config has executor
     if (config.executor) {
@@ -164,7 +164,7 @@ function generateGlobalHelpers(config, options) {
         ` * Legacy test evaluation function`,
         ` * TODO: Adapt based on your original test logic`,
         ` */`,
-        `async function evaluateLegacyTest(input: string, expected?: string): Promise<any> {`,
+        `async function evaluateLegacyTest(input: string, expected?: string): Promise<unknown> {`,
         `  const output = await legacyExecutor(input);`,
         `  const passed = evaluateAssertions(output, expected);`,
         `  `,

package/dist/cli/policy-packs.js CHANGED Viewed

@@ -22,7 +22,10 @@ exports.POLICY_PACKS = {
         1: {
             policyId: "SOC2",
             version: 1,
-            thresholds: { requiredSafetyRate: 0.95, maxFlags: ["SAFETY_RISK", "LOW_PASS_RATE"] },
+            thresholds: {
+                requiredSafetyRate: 0.95,
+                maxFlags: ["SAFETY_RISK", "LOW_PASS_RATE"],
+            },
             rationale: "SOC2 trust criteria for security and availability.",
             checks: ["safety_rate", "flag_restrictions"],
         },
@@ -40,7 +43,10 @@ exports.POLICY_PACKS = {
         1: {
             policyId: "PCI_DSS",
             version: 1,
-            thresholds: { requiredSafetyRate: 0.99, maxFlags: ["SAFETY_RISK", "LOW_PASS_RATE"] },
+            thresholds: {
+                requiredSafetyRate: 0.99,
+                maxFlags: ["SAFETY_RISK", "LOW_PASS_RATE"],
+            },
             rationale: "PCI DSS cardholder data security standards.",
             checks: ["safety_rate", "flag_restrictions"],
         },

package/dist/cli/print-config.js CHANGED Viewed

@@ -135,13 +135,20 @@ function buildResolvedConfig(cwd, flags) {
                 : "default";
     fields.push({
         key: "baseUrl",
-        value: flags.baseUrl || envBaseUrl || fileConfig?.baseUrl || "http://localhost:3000",
+        value: flags.baseUrl ||
+            envBaseUrl ||
+            fileConfig?.baseUrl ||
+            "http://localhost:3000",
         source: baseUrlSource,
     });
     // apiKey (always redacted)
     const envApiKey = process.env.EVALAI_API_KEY;
     const rawApiKey = flags.apiKey || envApiKey || "";
-    const apiKeySource = flags.apiKey ? "arg" : envApiKey ? "env" : "default";
+    const apiKeySource = flags.apiKey
+        ? "arg"
+        : envApiKey
+            ? "env"
+            : "default";
     fields.push({
         key: "apiKey",
         value: redact(rawApiKey) ?? "(not set)",
@@ -150,7 +157,11 @@ function buildResolvedConfig(cwd, flags) {
     });
     // profile
     const profileName = (flags.profile || fileConfig?.profile);
-    const profileSource = flags.profile ? "arg" : fileConfig?.profile ? "file" : "default";
+    const profileSource = flags.profile
+        ? "arg"
+        : fileConfig?.profile
+            ? "file"
+            : "default";
     fields.push({
         key: "profile",
         value: profileName ?? null,
@@ -184,7 +195,11 @@ function buildResolvedConfig(cwd, flags) {
         });
     }
     // baseline
-    const baselineSource = flags.baseline ? "arg" : fileConfig?.baseline ? "file" : "default";
+    const baselineSource = flags.baseline
+        ? "arg"
+        : fileConfig?.baseline
+            ? "file"
+            : "default";
     fields.push({
         key: "baseline",
         value: merged.baseline ?? "published",