@deepagents/evals 0.20.0 → 0.23.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -150,6 +150,22 @@ function truncateString(text, maxLength) {
150
150
  if (text.length <= maxLength) return text;
151
151
  return text.slice(0, maxLength) + "\u2026";
152
152
  }
153
+ function stringifyRationale(value) {
154
+ if (typeof value === "string") {
155
+ const trimmed = value.trim();
156
+ return trimmed.length > 0 ? trimmed : void 0;
157
+ }
158
+ if (Array.isArray(value)) {
159
+ const parts = value.map((item) => typeof item === "string" ? item.trim() : "").filter(Boolean);
160
+ if (parts.length > 0) return parts.join(" | ");
161
+ }
162
+ return void 0;
163
+ }
164
+ function scoreReasonWithMetadata(score) {
165
+ const reason = score.reason?.trim();
166
+ if (reason) return reason;
167
+ return stringifyRationale(score.metadata?.["rationale"]);
168
+ }
153
169
  function renderSummaryTable(data) {
154
170
  const { summary } = data;
155
171
  const passRate = summary.totalCases > 0 ? (summary.passCount / summary.totalCases * 100).toFixed(1) : "0.0";
@@ -211,7 +227,8 @@ function renderCaseDetail(c, threshold, options) {
211
227
  }
212
228
  for (const [name, s] of entries) {
213
229
  const scoreColor = s.score >= threshold ? chalk.green : chalk.red;
214
- const reasonStr = s.reason ? ` \u2014 ${s.reason}` : "";
230
+ const reason = scoreReasonWithMetadata(s);
231
+ const reasonStr = reason ? ` \u2014 ${reason}` : "";
215
232
  console.log(
216
233
  ` ${chalk.dim(name + ":")} ${scoreColor(s.score.toFixed(3))}${reasonStr}`
217
234
  );
@@ -1,7 +1,7 @@
1
1
  {
2
2
  "version": 3,
3
3
  "sources": ["../../src/reporters/console.ts", "../../src/reporters/format.ts", "../../src/reporters/shared.ts", "../../src/reporters/json.ts", "../../src/reporters/csv.ts", "../../src/reporters/markdown.ts", "../../src/reporters/html.ts"],
4
- "sourcesContent": ["import chalk from 'chalk';\n\nimport {\n formatDuration,\n formatErrorValue,\n formatTokens,\n stringifyUnknown,\n} from './format.ts';\nimport { getCaseStatus } from './shared.ts';\nimport type { CaseResult, Reporter, RunEndData, Verbosity } from './types.ts';\n\nexport interface ConsoleReporterOptions {\n verbosity?: Verbosity;\n}\n\nconst BAR_WIDTH = 20;\n\nfunction renderProgressBar(\n completed: number,\n total: number,\n elapsedMs: number,\n): string {\n const pct = total > 0 ? completed / total : 0;\n const filled = Math.round(pct * BAR_WIDTH);\n const bar = '\\u2593'.repeat(filled) + '\\u2591'.repeat(BAR_WIDTH - filled);\n const pctStr = `${(pct * 100).toFixed(0)}%`;\n return ` ${bar} ${pctStr} (${completed}/${total}) ${formatDuration(elapsedMs)}`;\n}\n\nfunction statusLabel(status: 'pass' | 'fail' | 'error'): string {\n if (status === 'pass') return chalk.green('PASS');\n if (status === 'error') return chalk.yellow('ERROR');\n return chalk.red('FAIL');\n}\n\nexport function consoleReporter(options?: ConsoleReporterOptions): Reporter {\n const verbosity = options?.verbosity ?? 'normal';\n\n let totalCases = 0;\n let completed = 0;\n let startTime = 0;\n\n return {\n onRunStart(data) {\n totalCases = data.totalCases;\n completed = 0;\n startTime = Date.now();\n\n if (verbosity !== 'quiet') {\n const label = data.name;\n console.log('');\n console.log(\n ` ${chalk.dim('\\u2500\\u2500')} ${chalk.bold(label)} ${chalk.dim('\\u2500'.repeat(Math.max(0, 56 - label.length)))}`,\n );\n console.log(` ${chalk.dim(`Running ${data.totalCases} cases...`)}`);\n console.log('');\n }\n },\n\n onCaseEnd() {\n completed++;\n if (verbosity !== 'quiet') {\n const elapsed = Date.now() - startTime;\n process.stdout.write(\n `\\r${renderProgressBar(completed, totalCases, elapsed)}`,\n );\n }\n },\n\n onRunEnd(data) {\n if (verbosity !== 'quiet') {\n process.stdout.write('\\r' + ' '.repeat(70) + '\\r');\n }\n\n renderSummaryTable(data);\n\n if (verbosity === 'quiet') return;\n\n const sorted = [...data.cases].sort((a, b) => a.index - b.index);\n\n if (verbosity === 'verbose') {\n for (const c of sorted) {\n renderCaseDetail(c, data.threshold, {\n includeIO: true,\n maxStringLength: 20_000,\n });\n }\n } else {\n renderFailuresByScorer(sorted, data.threshold);\n }\n },\n };\n}\n\nfunction indentBlock(text: string, spaces: number): string {\n const pad = ' '.repeat(spaces);\n return text\n .replace(/\\r\\n/g, '\\n')\n .split('\\n')\n .map((line) => pad + line)\n .join('\\n');\n}\n\nfunction truncateString(text: string, maxLength: number): string {\n if (text.length <= maxLength) return text;\n return text.slice(0, maxLength) + '\\u2026';\n}\n\nfunction renderSummaryTable(data: RunEndData): void {\n const { summary } = data;\n const passRate =\n summary.totalCases > 0\n ? ((summary.passCount / summary.totalCases) * 100).toFixed(1)\n : '0.0';\n\n console.log('');\n console.log(chalk.bold(' Summary'));\n console.log(chalk.dim(' ' + '\\u2500'.repeat(60)));\n console.log(` ${chalk.dim('Eval:')} ${data.name}`);\n console.log(` ${chalk.dim('Model:')} ${data.model}`);\n console.log(` ${chalk.dim('Threshold:')} ${data.threshold}`);\n console.log(` ${chalk.dim('Cases:')} ${summary.totalCases}`);\n console.log(\n ` ${chalk.dim('Pass/Fail:')} ${chalk.green(String(summary.passCount))} / ${chalk.red(String(summary.failCount))} ${chalk.dim(`(${passRate}%)`)}`,\n );\n console.log(\n ` ${chalk.dim('Duration:')} ${formatDuration(summary.totalLatencyMs)}`,\n );\n console.log(\n ` ${chalk.dim('Tokens:')} ${chalk.dim('In:')} ${formatTokens(summary.totalTokensIn)} ${chalk.dim('Out:')} ${formatTokens(summary.totalTokensOut)} ${chalk.dim('Total:')} ${formatTokens(summary.totalTokensIn + summary.totalTokensOut)}`,\n );\n\n const scoreEntries = Object.entries(summary.meanScores);\n if (scoreEntries.length > 0) {\n console.log('');\n console.log(chalk.bold(' Scores'));\n for (const [name, score] of scoreEntries) {\n const scoreColor = score >= data.threshold ? chalk.green : chalk.red;\n console.log(\n ` ${chalk.dim(name + ':')}${' '.repeat(Math.max(1, 12 - name.length))}${scoreColor(score.toFixed(3))}`,\n );\n }\n }\n\n console.log(chalk.dim(' ' + '\\u2500'.repeat(60)));\n console.log('');\n}\n\nfunction renderCaseDetail(\n c: CaseResult,\n threshold: number,\n options?: {\n includeIO?: boolean;\n maxStringLength?: number;\n },\n): void {\n const entries = Object.entries(c.scores);\n const status = getCaseStatus(c, threshold);\n const prefix = statusLabel(status);\n const includeIO = options?.includeIO ?? false;\n const maxStringLength = options?.maxStringLength ?? 4_000;\n\n const meta = `${chalk.dim(formatDuration(c.latencyMs))} ${chalk.dim(`${c.tokensIn}/${c.tokensOut} tokens`)}`;\n console.log(` ${prefix} ${chalk.dim(`Case #${c.index}`)} ${meta}`);\n\n const inputStr = stringifyUnknown(c.input, {\n space: 2,\n fallback: String(c.input),\n });\n console.log(` ${chalk.dim('Input:')}`);\n console.log(indentBlock(truncateString(inputStr, maxStringLength), 6));\n\n if (includeIO) {\n console.log(` ${chalk.dim('Output:')}`);\n console.log(indentBlock(truncateString(c.output, maxStringLength), 6));\n console.log(` ${chalk.dim('Expected:')}`);\n const expectedStrRaw = stringifyUnknown(c.expected, {\n space: 2,\n fallback: String(c.expected),\n });\n console.log(\n indentBlock(truncateString(expectedStrRaw, maxStringLength), 6),\n );\n }\n\n for (const [name, s] of entries) {\n const scoreColor = s.score >= threshold ? chalk.green : chalk.red;\n const reasonStr = s.reason ? ` \\u2014 ${s.reason}` : '';\n console.log(\n ` ${chalk.dim(name + ':')} ${scoreColor(s.score.toFixed(3))}${reasonStr}`,\n );\n }\n\n if (c.error) {\n console.log(` ${chalk.dim('Error:')}`);\n const errorStr = formatErrorValue(c.error);\n console.log(` ${chalk.red(errorStr)}`);\n }\n\n console.log('');\n}\n\nfunction renderFailuresByScorer(cases: CaseResult[], threshold: number): void {\n const scorerNames = new Set<string>();\n for (const c of cases) {\n for (const name of Object.keys(c.scores)) {\n scorerNames.add(name);\n }\n }\n\n let hasFailures = false;\n\n for (const scorer of scorerNames) {\n const failing = cases.filter((c) => {\n const s = c.scores[scorer];\n return (\n (s && s.score < threshold) || getCaseStatus(c, threshold) === 'error'\n );\n });\n\n if (failing.length === 0) continue;\n\n if (!hasFailures) {\n console.log(chalk.dim(' Failing by scorer:'));\n console.log('');\n hasFailures = true;\n }\n\n console.log(\n ` ${chalk.bold(scorer)} ${chalk.dim(`(${failing.length} failures)`)}`,\n );\n console.log(chalk.dim(' ' + '\\u2500'.repeat(40)));\n\n for (const c of failing) {\n renderCaseDetail(c, threshold, {\n includeIO: true,\n maxStringLength: 4_000,\n });\n }\n }\n}\n", "export function truncate(str: string, maxLen = 80): string {\n if (str.length <= maxLen) return str;\n return str.slice(0, maxLen) + '...';\n}\n\nexport function formatDuration(ms: number): string {\n if (ms < 1000) return `${ms}ms`;\n return `${(ms / 1000).toFixed(1)}s`;\n}\n\nexport function formatTokens(n: number): string {\n if (n >= 1_000_000) return `${(n / 1_000_000).toFixed(1)}M`;\n if (n >= 1_000) return `${(n / 1_000).toFixed(0)}k`;\n return String(n);\n}\n\nexport function generateFilename(\n name: string,\n runId: string,\n ext: string,\n): string {\n const slug = name.replace(/[^a-zA-Z0-9-_]/g, '-').toLowerCase();\n const prefix = runId.slice(0, 8);\n return `${slug}-${prefix}.${ext}`;\n}\n\nexport function stringifyUnknown(\n value: unknown,\n options?: {\n space?: number;\n fallback?: string;\n },\n): string {\n if (typeof value === 'string') return value;\n\n const space = options?.space ?? 0;\n const fallback = options?.fallback ?? 'null';\n try {\n return JSON.stringify(value, null, space) ?? fallback;\n } catch {\n return String(value);\n }\n}\n\nexport function formatInputValue(value: unknown): string {\n return stringifyUnknown(value, { space: 0, fallback: '' });\n}\n\nexport function formatErrorValue(value: unknown): string {\n if (value == null) return '';\n if (typeof value === 'string') return value;\n return stringifyUnknown(value, { space: 2, fallback: '' });\n}\n\nexport function escapeCsv(value: unknown): string {\n const str = stringifyUnknown(value, { space: 0, fallback: 'null' });\n if (str.includes(',') || str.includes('\"') || str.includes('\\n')) {\n return `\"${str.replace(/\"/g, '\"\"')}\"`;\n }\n return str;\n}\n", "import { mkdir, writeFile } from 'node:fs/promises';\nimport { join } from 'node:path';\n\nimport { generateFilename } from './format.ts';\nimport type { CaseResult, Reporter, RunEndData } from './types.ts';\n\nconst DEFAULT_OUTPUT_DIR = '.evals/reports';\n\nexport function resolveOutputDir(outputDir?: string): string {\n return outputDir ?? DEFAULT_OUTPUT_DIR;\n}\n\nexport function getReportPath(\n outputDir: string,\n name: string,\n runId: string,\n ext: string,\n): string {\n return join(outputDir, generateFilename(name, runId, ext));\n}\n\nexport async function writeRunReportFile(\n outputDir: string,\n name: string,\n runId: string,\n ext: string,\n content: string,\n): Promise<void> {\n await mkdir(outputDir, { recursive: true });\n await writeFile(getReportPath(outputDir, name, runId, ext), content, 'utf-8');\n}\n\nexport function getCaseStatus(\n result: CaseResult,\n threshold: number,\n): 'error' | 'pass' | 'fail' {\n if (result.error) return 'error';\n const passed = Object.values(result.scores).every(\n (s) => s.score >= threshold,\n );\n return passed ? 'pass' : 'fail';\n}\n\nexport function createRunEndFileReporter(options: {\n outputDir?: string;\n ext: string;\n render: (data: RunEndData) => string | Promise<string>;\n}): Reporter {\n const outputDir = resolveOutputDir(options.outputDir);\n\n return {\n async onRunEnd(data) {\n const content = await options.render(data);\n await writeRunReportFile(\n outputDir,\n data.name,\n data.runId,\n options.ext,\n content,\n );\n },\n };\n}\n", "import { appendFile, mkdir } from 'node:fs/promises';\n\nimport { stringifyUnknown } from './format.ts';\nimport {\n getReportPath,\n resolveOutputDir,\n writeRunReportFile,\n} from './shared.ts';\nimport type { Reporter } from './types.ts';\n\nexport interface JsonReporterOptions {\n outputDir?: string;\n pretty?: boolean;\n}\n\nexport function jsonReporter(options?: JsonReporterOptions): Reporter {\n const outputDir = resolveOutputDir(options?.outputDir);\n const pretty = options?.pretty ?? true;\n let streamFilename = '';\n\n return {\n async onRunStart(data) {\n await mkdir(outputDir, { recursive: true });\n streamFilename = getReportPath(outputDir, data.name, data.runId, 'jsonl');\n },\n async onCaseEnd(data) {\n const line = stringifyUnknown(data, { space: 0, fallback: 'null' });\n await appendFile(streamFilename, line + '\\n', 'utf-8');\n },\n async onRunEnd(data) {\n const content = stringifyUnknown(data, {\n space: pretty ? 2 : 0,\n fallback: 'null',\n });\n await writeRunReportFile(\n outputDir,\n data.name,\n data.runId,\n 'json',\n content,\n );\n },\n };\n}\n", "import { escapeCsv } from './format.ts';\nimport { createRunEndFileReporter, getCaseStatus } from './shared.ts';\nimport type { Reporter } from './types.ts';\n\nexport interface CsvReporterOptions {\n outputDir?: string;\n}\n\nexport function csvReporter(options?: CsvReporterOptions): Reporter {\n return createRunEndFileReporter({\n outputDir: options?.outputDir,\n ext: 'csv',\n render(data) {\n const scorerNames = Object.keys(data.summary.meanScores);\n\n const headerParts = [\n 'index',\n 'status',\n 'input',\n 'output',\n 'expected',\n 'error',\n 'latency_ms',\n 'tokens_in',\n 'tokens_out',\n ];\n for (const name of scorerNames) {\n headerParts.push(`${name}_score`, `${name}_reason`);\n }\n\n const rows = [headerParts.join(',')];\n\n for (const c of data.cases) {\n const status = getCaseStatus(c, data.threshold);\n const parts = [\n String(c.index),\n status,\n escapeCsv(c.input),\n escapeCsv(c.output),\n escapeCsv(c.expected),\n escapeCsv(c.error ?? ''),\n String(c.latencyMs),\n String(c.tokensIn),\n String(c.tokensOut),\n ];\n for (const name of scorerNames) {\n const s = c.scores[name];\n parts.push(String(s?.score ?? ''), escapeCsv(s?.reason ?? ''));\n }\n rows.push(parts.join(','));\n }\n\n return rows.join('\\n') + '\\n';\n },\n });\n}\n", "import {\n formatDuration,\n formatErrorValue,\n formatInputValue,\n formatTokens,\n} from './format.ts';\nimport { createRunEndFileReporter, getCaseStatus } from './shared.ts';\nimport type { Reporter } from './types.ts';\n\nexport interface MarkdownReporterOptions {\n outputDir?: string;\n}\n\nexport function markdownReporter(options?: MarkdownReporterOptions): Reporter {\n return createRunEndFileReporter({\n outputDir: options?.outputDir,\n ext: 'md',\n render(data) {\n const { summary } = data;\n const scorerNames = Object.keys(summary.meanScores);\n const lines: string[] = [];\n const passRate =\n summary.totalCases > 0\n ? ((summary.passCount / summary.totalCases) * 100).toFixed(1)\n : '0.0';\n\n lines.push(`# ${data.name}`);\n lines.push('');\n lines.push(`**Model:** ${data.model}`);\n lines.push(`**Threshold:** ${data.threshold}`);\n lines.push(\n `**Cases:** ${summary.totalCases} (${summary.passCount} pass, ${summary.failCount} fail, ${passRate}%)`,\n );\n lines.push(`**Duration:** ${formatDuration(summary.totalLatencyMs)}`);\n lines.push(\n `**Tokens:** In: ${formatTokens(summary.totalTokensIn)} | Out: ${formatTokens(summary.totalTokensOut)} | Total: ${formatTokens(summary.totalTokensIn + summary.totalTokensOut)}`,\n );\n lines.push('');\n\n lines.push('## Scores');\n lines.push('');\n lines.push('| Scorer | Mean |');\n lines.push('|--------|------|');\n for (const [name, score] of Object.entries(summary.meanScores)) {\n lines.push(`| ${name} | ${score.toFixed(3)} |`);\n }\n lines.push('');\n\n lines.push('## Cases');\n lines.push('');\n\n const caseHeader = [\n '#',\n 'Status',\n 'Input',\n ...scorerNames,\n 'Latency',\n 'Tokens',\n 'Error',\n ];\n lines.push(`| ${caseHeader.join(' | ')} |`);\n lines.push(`| ${caseHeader.map(() => '---').join(' | ')} |`);\n\n for (const c of data.cases) {\n const statusValue = getCaseStatus(c, data.threshold);\n const status =\n statusValue === 'error'\n ? '\uD83D\uDD34 Error'\n : statusValue === 'pass'\n ? '\u2705 Pass'\n : '\u274C Fail';\n const input = formatInputValue(c.input).slice(0, 60);\n const scores = scorerNames.map(\n (name) => c.scores[name]?.score.toFixed(3) ?? '-',\n );\n const error = c.error\n ? formatErrorValue(c.error)\n .replace(/\\r?\\n/g, '<br>')\n .replace(/\\|/g, '\\\\|')\n : '-';\n const row = [\n String(c.index),\n status,\n input,\n ...scores,\n formatDuration(c.latencyMs),\n `${c.tokensIn}/${c.tokensOut}`,\n error,\n ];\n lines.push(`| ${row.join(' | ')} |`);\n }\n lines.push('');\n\n return lines.join('\\n');\n },\n });\n}\n", "import {\n formatDuration,\n formatErrorValue,\n formatInputValue,\n formatTokens,\n stringifyUnknown,\n} from './format.ts';\nimport { createRunEndFileReporter, getCaseStatus } from './shared.ts';\nimport type { Reporter, RunEndData } from './types.ts';\n\nexport interface HtmlReporterOptions {\n outputDir?: string;\n}\n\nexport function htmlReporter(options?: HtmlReporterOptions): Reporter {\n return createRunEndFileReporter({\n outputDir: options?.outputDir,\n ext: 'html',\n render: renderHtml,\n });\n}\n\nfunction esc(str: string): string {\n return str\n .replace(/&/g, '&amp;')\n .replace(/</g, '&lt;')\n .replace(/>/g, '&gt;')\n .replace(/\"/g, '&quot;');\n}\n\nfunction renderHtml(data: RunEndData): string {\n const { summary } = data;\n const scorerNames = Object.keys(summary.meanScores);\n const passRate =\n summary.totalCases > 0\n ? ((summary.passCount / summary.totalCases) * 100).toFixed(1)\n : '0.0';\n\n const caseRows = data.cases\n .map((c) => {\n const status = getCaseStatus(c, data.threshold);\n const statusLabel =\n status === 'error' ? 'ERROR' : status === 'pass' ? 'PASS' : 'FAIL';\n const scoresCells = scorerNames\n .map((name) => {\n const s = c.scores[name];\n const score = s?.score ?? 0;\n const cls = score >= data.threshold ? 'pass' : 'fail';\n const reason = s?.reason ? ` title=\"${esc(s.reason)}\"` : '';\n return `<td class=\"${cls}\"${reason}>${score.toFixed(3)}</td>`;\n })\n .join('');\n\n const expectedStr = stringifyUnknown(c.expected, {\n space: 0,\n fallback: '',\n });\n\n return `<tr class=\"${status}\">\n <td>${c.index}</td>\n <td class=\"${status}\">${statusLabel}</td>\n <td class=\"text\">${esc(formatInputValue(c.input).slice(0, 120))}</td>\n <td class=\"text\">${esc(c.output.slice(0, 120))}</td>\n <td class=\"text\">${esc(expectedStr.slice(0, 120))}</td>\n ${scoresCells}\n <td>${formatDuration(c.latencyMs)}</td>\n <td>${c.tokensIn}/${c.tokensOut}</td>\n <td class=\"error-text\">${c.error ? esc(formatErrorValue(c.error)) : ''}</td>\n </tr>`;\n })\n .join('\\n');\n\n const scorerHeaders = scorerNames.map((n) => `<th>${esc(n)}</th>`).join('');\n const meanScoreRows = Object.entries(summary.meanScores)\n .map(\n ([name, score]) =>\n `<tr><td>${esc(name)}</td><td>${score.toFixed(3)}</td></tr>`,\n )\n .join('');\n\n return `<!DOCTYPE html>\n<html lang=\"en\">\n<head>\n<meta charset=\"utf-8\">\n<title>${esc(data.name)} \u2014 Eval Report</title>\n<style>\n * { box-sizing: border-box; margin: 0; padding: 0; }\n body { font-family: system-ui, -apple-system, sans-serif; background: #f8f9fa; color: #1a1a1a; padding: 2rem; }\n h1 { font-size: 1.5rem; margin-bottom: 0.5rem; }\n .meta { color: #666; margin-bottom: 1.5rem; font-size: 0.9rem; }\n .meta span { margin-right: 1.5rem; }\n .summary-table, .cases-table { width: 100%; border-collapse: collapse; margin-bottom: 2rem; }\n .summary-table th, .summary-table td,\n .cases-table th, .cases-table td { padding: 0.5rem 0.75rem; border: 1px solid #ddd; text-align: left; font-size: 0.85rem; }\n .summary-table th, .cases-table th { background: #f1f3f5; font-weight: 600; }\n .cases-table .text { max-width: 300px; overflow: hidden; text-overflow: ellipsis; white-space: nowrap; }\n .cases-table .error-text { max-width: 480px; white-space: pre-wrap; word-break: break-word; }\n .pass { color: #2b8a3e; }\n .fail { color: #c92a2a; }\n .error { color: #e67700; }\n tr.pass:hover, tr.fail:hover, tr.error:hover { background: #f1f3f5; }\n td.pass { background: #ebfbee; }\n td.fail { background: #fff5f5; }\n h2 { font-size: 1.2rem; margin: 1.5rem 0 0.75rem; }\n</style>\n</head>\n<body>\n <h1>${esc(data.name)}</h1>\n <div class=\"meta\">\n <span><strong>Model:</strong> ${esc(data.model)}</span>\n <span><strong>Threshold:</strong> ${data.threshold}</span>\n <span><strong>Cases:</strong> ${summary.totalCases}</span>\n <span><strong>Pass:</strong> ${summary.passCount}</span>\n <span><strong>Fail:</strong> ${summary.failCount} (${passRate}%)</span>\n <span><strong>Duration:</strong> ${formatDuration(summary.totalLatencyMs)}</span>\n <span><strong>Tokens In:</strong> ${formatTokens(summary.totalTokensIn)}</span>\n <span><strong>Tokens Out:</strong> ${formatTokens(summary.totalTokensOut)}</span>\n <span><strong>Total Tokens:</strong> ${formatTokens(summary.totalTokensIn + summary.totalTokensOut)}</span>\n </div>\n\n <h2>Mean Scores</h2>\n <table class=\"summary-table\">\n <thead><tr><th>Scorer</th><th>Mean</th></tr></thead>\n <tbody>${meanScoreRows}</tbody>\n </table>\n\n <h2>Cases</h2>\n <table class=\"cases-table\">\n <thead>\n <tr>\n <th>#</th>\n <th>Status</th>\n <th>Input</th>\n <th>Output</th>\n <th>Expected</th>\n ${scorerHeaders}\n <th>Latency</th>\n <th>Tokens</th>\n <th>Error</th>\n </tr>\n </thead>\n <tbody>\n ${caseRows}\n </tbody>\n </table>\n</body>\n</html>`;\n}\n"],
5
- "mappings": ";AAAA,OAAO,WAAW;;;ACKX,SAAS,eAAe,IAAoB;AACjD,MAAI,KAAK,IAAM,QAAO,GAAG,EAAE;AAC3B,SAAO,IAAI,KAAK,KAAM,QAAQ,CAAC,CAAC;AAClC;AAEO,SAAS,aAAa,GAAmB;AAC9C,MAAI,KAAK,IAAW,QAAO,IAAI,IAAI,KAAW,QAAQ,CAAC,CAAC;AACxD,MAAI,KAAK,IAAO,QAAO,IAAI,IAAI,KAAO,QAAQ,CAAC,CAAC;AAChD,SAAO,OAAO,CAAC;AACjB;AAEO,SAAS,iBACd,MACA,OACA,KACQ;AACR,QAAM,OAAO,KAAK,QAAQ,mBAAmB,GAAG,EAAE,YAAY;AAC9D,QAAM,SAAS,MAAM,MAAM,GAAG,CAAC;AAC/B,SAAO,GAAG,IAAI,IAAI,MAAM,IAAI,GAAG;AACjC;AAEO,SAAS,iBACd,OACA,SAIQ;AACR,MAAI,OAAO,UAAU,SAAU,QAAO;AAEtC,QAAM,QAAQ,SAAS,SAAS;AAChC,QAAM,WAAW,SAAS,YAAY;AACtC,MAAI;AACF,WAAO,KAAK,UAAU,OAAO,MAAM,KAAK,KAAK;AAAA,EAC/C,QAAQ;AACN,WAAO,OAAO,KAAK;AAAA,EACrB;AACF;AAEO,SAAS,iBAAiB,OAAwB;AACvD,SAAO,iBAAiB,OAAO,EAAE,OAAO,GAAG,UAAU,GAAG,CAAC;AAC3D;AAEO,SAAS,iBAAiB,OAAwB;AACvD,MAAI,SAAS,KAAM,QAAO;AAC1B,MAAI,OAAO,UAAU,SAAU,QAAO;AACtC,SAAO,iBAAiB,OAAO,EAAE,OAAO,GAAG,UAAU,GAAG,CAAC;AAC3D;AAEO,SAAS,UAAU,OAAwB;AAChD,QAAM,MAAM,iBAAiB,OAAO,EAAE,OAAO,GAAG,UAAU,OAAO,CAAC;AAClE,MAAI,IAAI,SAAS,GAAG,KAAK,IAAI,SAAS,GAAG,KAAK,IAAI,SAAS,IAAI,GAAG;AAChE,WAAO,IAAI,IAAI,QAAQ,MAAM,IAAI,CAAC;AAAA,EACpC;AACA,SAAO;AACT;;;AC5DA,SAAS,OAAO,iBAAiB;AACjC,SAAS,YAAY;AAKrB,IAAM,qBAAqB;AAEpB,SAAS,iBAAiB,WAA4B;AAC3D,SAAO,aAAa;AACtB;AAEO,SAAS,cACd,WACA,MACA,OACA,KACQ;AACR,SAAO,KAAK,WAAW,iBAAiB,MAAM,OAAO,GAAG,CAAC;AAC3D;AAEA,eAAsB,mBACpB,WACA,MACA,OACA,KACA,SACe;AACf,QAAM,MAAM,WAAW,EAAE,WAAW,KAAK,CAAC;AAC1C,QAAM,UAAU,cAAc,WAAW,MAAM,OAAO,GAAG,GAAG,SAAS,OAAO;AAC9E;AAEO,SAAS,cACd,QACA,WAC2B;AAC3B,MAAI,OAAO,MAAO,QAAO;AACzB,QAAM,SAAS,OAAO,OAAO,OAAO,MAAM,EAAE;AAAA,IAC1C,CAAC,MAAM,EAAE,SAAS;AAAA,EACpB;AACA,SAAO,SAAS,SAAS;AAC3B;AAEO,SAAS,yBAAyB,SAI5B;AACX,QAAM,YAAY,iBAAiB,QAAQ,SAAS;AAEpD,SAAO;AAAA,IACL,MAAM,SAAS,MAAM;AACnB,YAAM,UAAU,MAAM,QAAQ,OAAO,IAAI;AACzC,YAAM;AAAA,QACJ;AAAA,QACA,KAAK;AAAA,QACL,KAAK;AAAA,QACL,QAAQ;AAAA,QACR;AAAA,MACF;AAAA,IACF;AAAA,EACF;AACF;;;AF/CA,IAAM,YAAY;AAElB,SAAS,kBACP,WACA,OACA,WACQ;AACR,QAAM,MAAM,QAAQ,IAAI,YAAY,QAAQ;AAC5C,QAAM,SAAS,KAAK,MAAM,MAAM,SAAS;AACzC,QAAM,MAAM,SAAS,OAAO,MAAM,IAAI,SAAS,OAAO,YAAY,MAAM;AACxE,QAAM,SAAS,IAAI,MAAM,KAAK,QAAQ,CAAC,CAAC;AACxC,SAAO,KAAK,GAAG,IAAI,MAAM,KAAK,SAAS,IAAI,KAAK,KAAK,eAAe,SAAS,CAAC;AAChF;AAEA,SAAS,YAAY,QAA2C;AAC9D,MAAI,WAAW,OAAQ,QAAO,MAAM,MAAM,MAAM;AAChD,MAAI,WAAW,QAAS,QAAO,MAAM,OAAO,OAAO;AACnD,SAAO,MAAM,IAAI,MAAM;AACzB;AAEO,SAAS,gBAAgB,SAA4C;AAC1E,QAAM,YAAY,SAAS,aAAa;AAExC,MAAI,aAAa;AACjB,MAAI,YAAY;AAChB,MAAI,YAAY;AAEhB,SAAO;AAAA,IACL,WAAW,MAAM;AACf,mBAAa,KAAK;AAClB,kBAAY;AACZ,kBAAY,KAAK,IAAI;AAErB,UAAI,cAAc,SAAS;AACzB,cAAM,QAAQ,KAAK;AACnB,gBAAQ,IAAI,EAAE;AACd,gBAAQ;AAAA,UACN,KAAK,MAAM,IAAI,cAAc,CAAC,IAAI,MAAM,KAAK,KAAK,CAAC,IAAI,MAAM,IAAI,SAAS,OAAO,KAAK,IAAI,GAAG,KAAK,MAAM,MAAM,CAAC,CAAC,CAAC;AAAA,QACnH;AACA,gBAAQ,IAAI,KAAK,MAAM,IAAI,WAAW,KAAK,UAAU,WAAW,CAAC,EAAE;AACnE,gBAAQ,IAAI,EAAE;AAAA,MAChB;AAAA,IACF;AAAA,IAEA,YAAY;AACV;AACA,UAAI,cAAc,SAAS;AACzB,cAAM,UAAU,KAAK,IAAI,IAAI;AAC7B,gBAAQ,OAAO;AAAA,UACb,KAAK,kBAAkB,WAAW,YAAY,OAAO,CAAC;AAAA,QACxD;AAAA,MACF;AAAA,IACF;AAAA,IAEA,SAAS,MAAM;AACb,UAAI,cAAc,SAAS;AACzB,gBAAQ,OAAO,MAAM,OAAO,IAAI,OAAO,EAAE,IAAI,IAAI;AAAA,MACnD;AAEA,yBAAmB,IAAI;AAEvB,UAAI,cAAc,QAAS;AAE3B,YAAM,SAAS,CAAC,GAAG,KAAK,KAAK,EAAE,KAAK,CAAC,GAAG,MAAM,EAAE,QAAQ,EAAE,KAAK;AAE/D,UAAI,cAAc,WAAW;AAC3B,mBAAW,KAAK,QAAQ;AACtB,2BAAiB,GAAG,KAAK,WAAW;AAAA,YAClC,WAAW;AAAA,YACX,iBAAiB;AAAA,UACnB,CAAC;AAAA,QACH;AAAA,MACF,OAAO;AACL,+BAAuB,QAAQ,KAAK,SAAS;AAAA,MAC/C;AAAA,IACF;AAAA,EACF;AACF;AAEA,SAAS,YAAY,MAAc,QAAwB;AACzD,QAAM,MAAM,IAAI,OAAO,MAAM;AAC7B,SAAO,KACJ,QAAQ,SAAS,IAAI,EACrB,MAAM,IAAI,EACV,IAAI,CAAC,SAAS,MAAM,IAAI,EACxB,KAAK,IAAI;AACd;AAEA,SAAS,eAAe,MAAc,WAA2B;AAC/D,MAAI,KAAK,UAAU,UAAW,QAAO;AACrC,SAAO,KAAK,MAAM,GAAG,SAAS,IAAI;AACpC;AAEA,SAAS,mBAAmB,MAAwB;AAClD,QAAM,EAAE,QAAQ,IAAI;AACpB,QAAM,WACJ,QAAQ,aAAa,KACf,QAAQ,YAAY,QAAQ,aAAc,KAAK,QAAQ,CAAC,IAC1D;AAEN,UAAQ,IAAI,EAAE;AACd,UAAQ,IAAI,MAAM,KAAK,WAAW,CAAC;AACnC,UAAQ,IAAI,MAAM,IAAI,OAAO,SAAS,OAAO,EAAE,CAAC,CAAC;AACjD,UAAQ,IAAI,KAAK,MAAM,IAAI,OAAO,CAAC,SAAS,KAAK,IAAI,EAAE;AACvD,UAAQ,IAAI,KAAK,MAAM,IAAI,QAAQ,CAAC,QAAQ,KAAK,KAAK,EAAE;AACxD,UAAQ,IAAI,KAAK,MAAM,IAAI,YAAY,CAAC,IAAI,KAAK,SAAS,EAAE;AAC5D,UAAQ,IAAI,KAAK,MAAM,IAAI,QAAQ,CAAC,QAAQ,QAAQ,UAAU,EAAE;AAChE,UAAQ;AAAA,IACN,KAAK,MAAM,IAAI,YAAY,CAAC,IAAI,MAAM,MAAM,OAAO,QAAQ,SAAS,CAAC,CAAC,MAAM,MAAM,IAAI,OAAO,QAAQ,SAAS,CAAC,CAAC,IAAI,MAAM,IAAI,IAAI,QAAQ,IAAI,CAAC;AAAA,EACjJ;AACA,UAAQ;AAAA,IACN,KAAK,MAAM,IAAI,WAAW,CAAC,KAAK,eAAe,QAAQ,cAAc,CAAC;AAAA,EACxE;AACA,UAAQ;AAAA,IACN,KAAK,MAAM,IAAI,SAAS,CAAC,OAAO,MAAM,IAAI,KAAK,CAAC,IAAI,aAAa,QAAQ,aAAa,CAAC,KAAK,MAAM,IAAI,MAAM,CAAC,IAAI,aAAa,QAAQ,cAAc,CAAC,KAAK,MAAM,IAAI,QAAQ,CAAC,IAAI,aAAa,QAAQ,gBAAgB,QAAQ,cAAc,CAAC;AAAA,EAC/O;AAEA,QAAM,eAAe,OAAO,QAAQ,QAAQ,UAAU;AACtD,MAAI,aAAa,SAAS,GAAG;AAC3B,YAAQ,IAAI,EAAE;AACd,YAAQ,IAAI,MAAM,KAAK,UAAU,CAAC;AAClC,eAAW,CAAC,MAAM,KAAK,KAAK,cAAc;AACxC,YAAM,aAAa,SAAS,KAAK,YAAY,MAAM,QAAQ,MAAM;AACjE,cAAQ;AAAA,QACN,OAAO,MAAM,IAAI,OAAO,GAAG,CAAC,GAAG,IAAI,OAAO,KAAK,IAAI,GAAG,KAAK,KAAK,MAAM,CAAC,CAAC,GAAG,WAAW,MAAM,QAAQ,CAAC,CAAC,CAAC;AAAA,MACzG;AAAA,IACF;AAAA,EACF;AAEA,UAAQ,IAAI,MAAM,IAAI,OAAO,SAAS,OAAO,EAAE,CAAC,CAAC;AACjD,UAAQ,IAAI,EAAE;AAChB;AAEA,SAAS,iBACP,GACA,WACA,SAIM;AACN,QAAM,UAAU,OAAO,QAAQ,EAAE,MAAM;AACvC,QAAM,SAAS,cAAc,GAAG,SAAS;AACzC,QAAM,SAAS,YAAY,MAAM;AACjC,QAAM,YAAY,SAAS,aAAa;AACxC,QAAM,kBAAkB,SAAS,mBAAmB;AAEpD,QAAM,OAAO,GAAG,MAAM,IAAI,eAAe,EAAE,SAAS,CAAC,CAAC,KAAK,MAAM,IAAI,GAAG,EAAE,QAAQ,IAAI,EAAE,SAAS,SAAS,CAAC;AAC3G,UAAQ,IAAI,KAAK,MAAM,IAAI,MAAM,IAAI,SAAS,EAAE,KAAK,EAAE,CAAC,KAAK,IAAI,EAAE;AAEnE,QAAM,WAAW,iBAAiB,EAAE,OAAO;AAAA,IACzC,OAAO;AAAA,IACP,UAAU,OAAO,EAAE,KAAK;AAAA,EAC1B,CAAC;AACD,UAAQ,IAAI,OAAO,MAAM,IAAI,QAAQ,CAAC,EAAE;AACxC,UAAQ,IAAI,YAAY,eAAe,UAAU,eAAe,GAAG,CAAC,CAAC;AAErE,MAAI,WAAW;AACb,YAAQ,IAAI,OAAO,MAAM,IAAI,SAAS,CAAC,EAAE;AACzC,YAAQ,IAAI,YAAY,eAAe,EAAE,QAAQ,eAAe,GAAG,CAAC,CAAC;AACrE,YAAQ,IAAI,OAAO,MAAM,IAAI,WAAW,CAAC,EAAE;AAC3C,UAAM,iBAAiB,iBAAiB,EAAE,UAAU;AAAA,MAClD,OAAO;AAAA,MACP,UAAU,OAAO,EAAE,QAAQ;AAAA,IAC7B,CAAC;AACD,YAAQ;AAAA,MACN,YAAY,eAAe,gBAAgB,eAAe,GAAG,CAAC;AAAA,IAChE;AAAA,EACF;AAEA,aAAW,CAAC,MAAM,CAAC,KAAK,SAAS;AAC/B,UAAM,aAAa,EAAE,SAAS,YAAY,MAAM,QAAQ,MAAM;AAC9D,UAAM,YAAY,EAAE,SAAS,WAAW,EAAE,MAAM,KAAK;AACrD,YAAQ;AAAA,MACN,OAAO,MAAM,IAAI,OAAO,GAAG,CAAC,IAAI,WAAW,EAAE,MAAM,QAAQ,CAAC,CAAC,CAAC,GAAG,SAAS;AAAA,IAC5E;AAAA,EACF;AAEA,MAAI,EAAE,OAAO;AACX,YAAQ,IAAI,OAAO,MAAM,IAAI,QAAQ,CAAC,EAAE;AACxC,UAAM,WAAW,iBAAiB,EAAE,KAAK;AACzC,YAAQ,IAAI,SAAS,MAAM,IAAI,QAAQ,CAAC,EAAE;AAAA,EAC5C;AAEA,UAAQ,IAAI,EAAE;AAChB;AAEA,SAAS,uBAAuB,OAAqB,WAAyB;AAC5E,QAAM,cAAc,oBAAI,IAAY;AACpC,aAAW,KAAK,OAAO;AACrB,eAAW,QAAQ,OAAO,KAAK,EAAE,MAAM,GAAG;AACxC,kBAAY,IAAI,IAAI;AAAA,IACtB;AAAA,EACF;AAEA,MAAI,cAAc;AAElB,aAAW,UAAU,aAAa;AAChC,UAAM,UAAU,MAAM,OAAO,CAAC,MAAM;AAClC,YAAM,IAAI,EAAE,OAAO,MAAM;AACzB,aACG,KAAK,EAAE,QAAQ,aAAc,cAAc,GAAG,SAAS,MAAM;AAAA,IAElE,CAAC;AAED,QAAI,QAAQ,WAAW,EAAG;AAE1B,QAAI,CAAC,aAAa;AAChB,cAAQ,IAAI,MAAM,IAAI,sBAAsB,CAAC;AAC7C,cAAQ,IAAI,EAAE;AACd,oBAAc;AAAA,IAChB;AAEA,YAAQ;AAAA,MACN,KAAK,MAAM,KAAK,MAAM,CAAC,IAAI,MAAM,IAAI,IAAI,QAAQ,MAAM,YAAY,CAAC;AAAA,IACtE;AACA,YAAQ,IAAI,MAAM,IAAI,OAAO,SAAS,OAAO,EAAE,CAAC,CAAC;AAEjD,eAAW,KAAK,SAAS;AACvB,uBAAiB,GAAG,WAAW;AAAA,QAC7B,WAAW;AAAA,QACX,iBAAiB;AAAA,MACnB,CAAC;AAAA,IACH;AAAA,EACF;AACF;;;AGhPA,SAAS,YAAY,SAAAA,cAAa;AAe3B,SAAS,aAAa,SAAyC;AACpE,QAAM,YAAY,iBAAiB,SAAS,SAAS;AACrD,QAAM,SAAS,SAAS,UAAU;AAClC,MAAI,iBAAiB;AAErB,SAAO;AAAA,IACL,MAAM,WAAW,MAAM;AACrB,YAAMC,OAAM,WAAW,EAAE,WAAW,KAAK,CAAC;AAC1C,uBAAiB,cAAc,WAAW,KAAK,MAAM,KAAK,OAAO,OAAO;AAAA,IAC1E;AAAA,IACA,MAAM,UAAU,MAAM;AACpB,YAAM,OAAO,iBAAiB,MAAM,EAAE,OAAO,GAAG,UAAU,OAAO,CAAC;AAClE,YAAM,WAAW,gBAAgB,OAAO,MAAM,OAAO;AAAA,IACvD;AAAA,IACA,MAAM,SAAS,MAAM;AACnB,YAAM,UAAU,iBAAiB,MAAM;AAAA,QACrC,OAAO,SAAS,IAAI;AAAA,QACpB,UAAU;AAAA,MACZ,CAAC;AACD,YAAM;AAAA,QACJ;AAAA,QACA,KAAK;AAAA,QACL,KAAK;AAAA,QACL;AAAA,QACA;AAAA,MACF;AAAA,IACF;AAAA,EACF;AACF;;;ACnCO,SAAS,YAAY,SAAwC;AAClE,SAAO,yBAAyB;AAAA,IAC9B,WAAW,SAAS;AAAA,IACpB,KAAK;AAAA,IACL,OAAO,MAAM;AACX,YAAM,cAAc,OAAO,KAAK,KAAK,QAAQ,UAAU;AAEvD,YAAM,cAAc;AAAA,QAClB;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,MACF;AACA,iBAAW,QAAQ,aAAa;AAC9B,oBAAY,KAAK,GAAG,IAAI,UAAU,GAAG,IAAI,SAAS;AAAA,MACpD;AAEA,YAAM,OAAO,CAAC,YAAY,KAAK,GAAG,CAAC;AAEnC,iBAAW,KAAK,KAAK,OAAO;AAC1B,cAAM,SAAS,cAAc,GAAG,KAAK,SAAS;AAC9C,cAAM,QAAQ;AAAA,UACZ,OAAO,EAAE,KAAK;AAAA,UACd;AAAA,UACA,UAAU,EAAE,KAAK;AAAA,UACjB,UAAU,EAAE,MAAM;AAAA,UAClB,UAAU,EAAE,QAAQ;AAAA,UACpB,UAAU,EAAE,SAAS,EAAE;AAAA,UACvB,OAAO,EAAE,SAAS;AAAA,UAClB,OAAO,EAAE,QAAQ;AAAA,UACjB,OAAO,EAAE,SAAS;AAAA,QACpB;AACA,mBAAW,QAAQ,aAAa;AAC9B,gBAAM,IAAI,EAAE,OAAO,IAAI;AACvB,gBAAM,KAAK,OAAO,GAAG,SAAS,EAAE,GAAG,UAAU,GAAG,UAAU,EAAE,CAAC;AAAA,QAC/D;AACA,aAAK,KAAK,MAAM,KAAK,GAAG,CAAC;AAAA,MAC3B;AAEA,aAAO,KAAK,KAAK,IAAI,IAAI;AAAA,IAC3B;AAAA,EACF,CAAC;AACH;;;AC1CO,SAAS,iBAAiB,SAA6C;AAC5E,SAAO,yBAAyB;AAAA,IAC9B,WAAW,SAAS;AAAA,IACpB,KAAK;AAAA,IACL,OAAO,MAAM;AACX,YAAM,EAAE,QAAQ,IAAI;AACpB,YAAM,cAAc,OAAO,KAAK,QAAQ,UAAU;AAClD,YAAM,QAAkB,CAAC;AACzB,YAAM,WACJ,QAAQ,aAAa,KACf,QAAQ,YAAY,QAAQ,aAAc,KAAK,QAAQ,CAAC,IAC1D;AAEN,YAAM,KAAK,KAAK,KAAK,IAAI,EAAE;AAC3B,YAAM,KAAK,EAAE;AACb,YAAM,KAAK,cAAc,KAAK,KAAK,EAAE;AACrC,YAAM,KAAK,kBAAkB,KAAK,SAAS,EAAE;AAC7C,YAAM;AAAA,QACJ,cAAc,QAAQ,UAAU,KAAK,QAAQ,SAAS,UAAU,QAAQ,SAAS,UAAU,QAAQ;AAAA,MACrG;AACA,YAAM,KAAK,iBAAiB,eAAe,QAAQ,cAAc,CAAC,EAAE;AACpE,YAAM;AAAA,QACJ,mBAAmB,aAAa,QAAQ,aAAa,CAAC,WAAW,aAAa,QAAQ,cAAc,CAAC,aAAa,aAAa,QAAQ,gBAAgB,QAAQ,cAAc,CAAC;AAAA,MAChL;AACA,YAAM,KAAK,EAAE;AAEb,YAAM,KAAK,WAAW;AACtB,YAAM,KAAK,EAAE;AACb,YAAM,KAAK,mBAAmB;AAC9B,YAAM,KAAK,mBAAmB;AAC9B,iBAAW,CAAC,MAAM,KAAK,KAAK,OAAO,QAAQ,QAAQ,UAAU,GAAG;AAC9D,cAAM,KAAK,KAAK,IAAI,MAAM,MAAM,QAAQ,CAAC,CAAC,IAAI;AAAA,MAChD;AACA,YAAM,KAAK,EAAE;AAEb,YAAM,KAAK,UAAU;AACrB,YAAM,KAAK,EAAE;AAEb,YAAM,aAAa;AAAA,QACjB;AAAA,QACA;AAAA,QACA;AAAA,QACA,GAAG;AAAA,QACH;AAAA,QACA;AAAA,QACA;AAAA,MACF;AACA,YAAM,KAAK,KAAK,WAAW,KAAK,KAAK,CAAC,IAAI;AAC1C,YAAM,KAAK,KAAK,WAAW,IAAI,MAAM,KAAK,EAAE,KAAK,KAAK,CAAC,IAAI;AAE3D,iBAAW,KAAK,KAAK,OAAO;AAC1B,cAAM,cAAc,cAAc,GAAG,KAAK,SAAS;AACnD,cAAM,SACJ,gBAAgB,UACZ,oBACA,gBAAgB,SACd,gBACA;AACR,cAAM,QAAQ,iBAAiB,EAAE,KAAK,EAAE,MAAM,GAAG,EAAE;AACnD,cAAM,SAAS,YAAY;AAAA,UACzB,CAAC,SAAS,EAAE,OAAO,IAAI,GAAG,MAAM,QAAQ,CAAC,KAAK;AAAA,QAChD;AACA,cAAM,QAAQ,EAAE,QACZ,iBAAiB,EAAE,KAAK,EACrB,QAAQ,UAAU,MAAM,EACxB,QAAQ,OAAO,KAAK,IACvB;AACJ,cAAM,MAAM;AAAA,UACV,OAAO,EAAE,KAAK;AAAA,UACd;AAAA,UACA;AAAA,UACA,GAAG;AAAA,UACH,eAAe,EAAE,SAAS;AAAA,UAC1B,GAAG,EAAE,QAAQ,IAAI,EAAE,SAAS;AAAA,UAC5B;AAAA,QACF;AACA,cAAM,KAAK,KAAK,IAAI,KAAK,KAAK,CAAC,IAAI;AAAA,MACrC;AACA,YAAM,KAAK,EAAE;AAEb,aAAO,MAAM,KAAK,IAAI;AAAA,IACxB;AAAA,EACF,CAAC;AACH;;;AClFO,SAAS,aAAa,SAAyC;AACpE,SAAO,yBAAyB;AAAA,IAC9B,WAAW,SAAS;AAAA,IACpB,KAAK;AAAA,IACL,QAAQ;AAAA,EACV,CAAC;AACH;AAEA,SAAS,IAAI,KAAqB;AAChC,SAAO,IACJ,QAAQ,MAAM,OAAO,EACrB,QAAQ,MAAM,MAAM,EACpB,QAAQ,MAAM,MAAM,EACpB,QAAQ,MAAM,QAAQ;AAC3B;AAEA,SAAS,WAAW,MAA0B;AAC5C,QAAM,EAAE,QAAQ,IAAI;AACpB,QAAM,cAAc,OAAO,KAAK,QAAQ,UAAU;AAClD,QAAM,WACJ,QAAQ,aAAa,KACf,QAAQ,YAAY,QAAQ,aAAc,KAAK,QAAQ,CAAC,IAC1D;AAEN,QAAM,WAAW,KAAK,MACnB,IAAI,CAAC,MAAM;AACV,UAAM,SAAS,cAAc,GAAG,KAAK,SAAS;AAC9C,UAAMC,eACJ,WAAW,UAAU,UAAU,WAAW,SAAS,SAAS;AAC9D,UAAM,cAAc,YACjB,IAAI,CAAC,SAAS;AACb,YAAM,IAAI,EAAE,OAAO,IAAI;AACvB,YAAM,QAAQ,GAAG,SAAS;AAC1B,YAAM,MAAM,SAAS,KAAK,YAAY,SAAS;AAC/C,YAAM,SAAS,GAAG,SAAS,WAAW,IAAI,EAAE,MAAM,CAAC,MAAM;AACzD,aAAO,cAAc,GAAG,IAAI,MAAM,IAAI,MAAM,QAAQ,CAAC,CAAC;AAAA,IACxD,CAAC,EACA,KAAK,EAAE;AAEV,UAAM,cAAc,iBAAiB,EAAE,UAAU;AAAA,MAC/C,OAAO;AAAA,MACP,UAAU;AAAA,IACZ,CAAC;AAED,WAAO,cAAc,MAAM;AAAA,cACnB,EAAE,KAAK;AAAA,qBACA,MAAM,KAAKA,YAAW;AAAA,2BAChB,IAAI,iBAAiB,EAAE,KAAK,EAAE,MAAM,GAAG,GAAG,CAAC,CAAC;AAAA,2BAC5C,IAAI,EAAE,OAAO,MAAM,GAAG,GAAG,CAAC,CAAC;AAAA,2BAC3B,IAAI,YAAY,MAAM,GAAG,GAAG,CAAC,CAAC;AAAA,UAC/C,WAAW;AAAA,cACP,eAAe,EAAE,SAAS,CAAC;AAAA,cAC3B,EAAE,QAAQ,IAAI,EAAE,SAAS;AAAA,iCACN,EAAE,QAAQ,IAAI,iBAAiB,EAAE,KAAK,CAAC,IAAI,EAAE;AAAA;AAAA,EAE1E,CAAC,EACA,KAAK,IAAI;AAEZ,QAAM,gBAAgB,YAAY,IAAI,CAAC,MAAM,OAAO,IAAI,CAAC,CAAC,OAAO,EAAE,KAAK,EAAE;AAC1E,QAAM,gBAAgB,OAAO,QAAQ,QAAQ,UAAU,EACpD;AAAA,IACC,CAAC,CAAC,MAAM,KAAK,MACX,WAAW,IAAI,IAAI,CAAC,YAAY,MAAM,QAAQ,CAAC,CAAC;AAAA,EACpD,EACC,KAAK,EAAE;AAEV,SAAO;AAAA;AAAA;AAAA;AAAA,SAIA,IAAI,KAAK,IAAI,CAAC;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,QAuBf,IAAI,KAAK,IAAI,CAAC;AAAA;AAAA,oCAEc,IAAI,KAAK,KAAK,CAAC;AAAA,wCACX,KAAK,SAAS;AAAA,oCAClB,QAAQ,UAAU;AAAA,mCACnB,QAAQ,SAAS;AAAA,mCACjB,QAAQ,SAAS,KAAK,QAAQ;AAAA,uCAC1B,eAAe,QAAQ,cAAc,CAAC;AAAA,wCACrC,aAAa,QAAQ,aAAa,CAAC;AAAA,yCAClC,aAAa,QAAQ,cAAc,CAAC;AAAA,2CAClC,aAAa,QAAQ,gBAAgB,QAAQ,cAAc,CAAC;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,aAM1F,aAAa;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,UAYhB,aAAa;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,QAOf,QAAQ;AAAA;AAAA;AAAA;AAAA;AAKhB;",
4
+ "sourcesContent": ["import chalk from 'chalk';\n\nimport {\n formatDuration,\n formatErrorValue,\n formatTokens,\n stringifyUnknown,\n} from './format.ts';\nimport { getCaseStatus } from './shared.ts';\nimport type { CaseResult, Reporter, RunEndData, Verbosity } from './types.ts';\n\nexport interface ConsoleReporterOptions {\n verbosity?: Verbosity;\n}\n\nconst BAR_WIDTH = 20;\n\nfunction renderProgressBar(\n completed: number,\n total: number,\n elapsedMs: number,\n): string {\n const pct = total > 0 ? completed / total : 0;\n const filled = Math.round(pct * BAR_WIDTH);\n const bar = '\\u2593'.repeat(filled) + '\\u2591'.repeat(BAR_WIDTH - filled);\n const pctStr = `${(pct * 100).toFixed(0)}%`;\n return ` ${bar} ${pctStr} (${completed}/${total}) ${formatDuration(elapsedMs)}`;\n}\n\nfunction statusLabel(status: 'pass' | 'fail' | 'error'): string {\n if (status === 'pass') return chalk.green('PASS');\n if (status === 'error') return chalk.yellow('ERROR');\n return chalk.red('FAIL');\n}\n\nexport function consoleReporter(options?: ConsoleReporterOptions): Reporter {\n const verbosity = options?.verbosity ?? 'normal';\n\n let totalCases = 0;\n let completed = 0;\n let startTime = 0;\n\n return {\n onRunStart(data) {\n totalCases = data.totalCases;\n completed = 0;\n startTime = Date.now();\n\n if (verbosity !== 'quiet') {\n const label = data.name;\n console.log('');\n console.log(\n ` ${chalk.dim('\\u2500\\u2500')} ${chalk.bold(label)} ${chalk.dim('\\u2500'.repeat(Math.max(0, 56 - label.length)))}`,\n );\n console.log(` ${chalk.dim(`Running ${data.totalCases} cases...`)}`);\n console.log('');\n }\n },\n\n onCaseEnd() {\n completed++;\n if (verbosity !== 'quiet') {\n const elapsed = Date.now() - startTime;\n process.stdout.write(\n `\\r${renderProgressBar(completed, totalCases, elapsed)}`,\n );\n }\n },\n\n onRunEnd(data) {\n if (verbosity !== 'quiet') {\n process.stdout.write('\\r' + ' '.repeat(70) + '\\r');\n }\n\n renderSummaryTable(data);\n\n if (verbosity === 'quiet') return;\n\n const sorted = [...data.cases].sort((a, b) => a.index - b.index);\n\n if (verbosity === 'verbose') {\n for (const c of sorted) {\n renderCaseDetail(c, data.threshold, {\n includeIO: true,\n maxStringLength: 20_000,\n });\n }\n } else {\n renderFailuresByScorer(sorted, data.threshold);\n }\n },\n };\n}\n\nfunction indentBlock(text: string, spaces: number): string {\n const pad = ' '.repeat(spaces);\n return text\n .replace(/\\r\\n/g, '\\n')\n .split('\\n')\n .map((line) => pad + line)\n .join('\\n');\n}\n\nfunction truncateString(text: string, maxLength: number): string {\n if (text.length <= maxLength) return text;\n return text.slice(0, maxLength) + '\\u2026';\n}\n\nfunction stringifyRationale(value: unknown): string | undefined {\n if (typeof value === 'string') {\n const trimmed = value.trim();\n return trimmed.length > 0 ? trimmed : undefined;\n }\n\n if (Array.isArray(value)) {\n const parts = value\n .map((item) => (typeof item === 'string' ? item.trim() : ''))\n .filter(Boolean);\n if (parts.length > 0) return parts.join(' | ');\n }\n\n return undefined;\n}\n\nfunction scoreReasonWithMetadata(score: {\n reason?: string;\n metadata?: Record<string, unknown>;\n}): string | undefined {\n const reason = score.reason?.trim();\n if (reason) return reason;\n return stringifyRationale(score.metadata?.['rationale']);\n}\n\nfunction renderSummaryTable(data: RunEndData): void {\n const { summary } = data;\n const passRate =\n summary.totalCases > 0\n ? ((summary.passCount / summary.totalCases) * 100).toFixed(1)\n : '0.0';\n\n console.log('');\n console.log(chalk.bold(' Summary'));\n console.log(chalk.dim(' ' + '\\u2500'.repeat(60)));\n console.log(` ${chalk.dim('Eval:')} ${data.name}`);\n console.log(` ${chalk.dim('Model:')} ${data.model}`);\n console.log(` ${chalk.dim('Threshold:')} ${data.threshold}`);\n console.log(` ${chalk.dim('Cases:')} ${summary.totalCases}`);\n console.log(\n ` ${chalk.dim('Pass/Fail:')} ${chalk.green(String(summary.passCount))} / ${chalk.red(String(summary.failCount))} ${chalk.dim(`(${passRate}%)`)}`,\n );\n console.log(\n ` ${chalk.dim('Duration:')} ${formatDuration(summary.totalLatencyMs)}`,\n );\n console.log(\n ` ${chalk.dim('Tokens:')} ${chalk.dim('In:')} ${formatTokens(summary.totalTokensIn)} ${chalk.dim('Out:')} ${formatTokens(summary.totalTokensOut)} ${chalk.dim('Total:')} ${formatTokens(summary.totalTokensIn + summary.totalTokensOut)}`,\n );\n\n const scoreEntries = Object.entries(summary.meanScores);\n if (scoreEntries.length > 0) {\n console.log('');\n console.log(chalk.bold(' Scores'));\n for (const [name, score] of scoreEntries) {\n const scoreColor = score >= data.threshold ? chalk.green : chalk.red;\n console.log(\n ` ${chalk.dim(name + ':')}${' '.repeat(Math.max(1, 12 - name.length))}${scoreColor(score.toFixed(3))}`,\n );\n }\n }\n\n console.log(chalk.dim(' ' + '\\u2500'.repeat(60)));\n console.log('');\n}\n\nfunction renderCaseDetail(\n c: CaseResult,\n threshold: number,\n options?: {\n includeIO?: boolean;\n maxStringLength?: number;\n },\n): void {\n const entries = Object.entries(c.scores);\n const status = getCaseStatus(c, threshold);\n const prefix = statusLabel(status);\n const includeIO = options?.includeIO ?? false;\n const maxStringLength = options?.maxStringLength ?? 4_000;\n\n const meta = `${chalk.dim(formatDuration(c.latencyMs))} ${chalk.dim(`${c.tokensIn}/${c.tokensOut} tokens`)}`;\n console.log(` ${prefix} ${chalk.dim(`Case #${c.index}`)} ${meta}`);\n\n const inputStr = stringifyUnknown(c.input, {\n space: 2,\n fallback: String(c.input),\n });\n console.log(` ${chalk.dim('Input:')}`);\n console.log(indentBlock(truncateString(inputStr, maxStringLength), 6));\n\n if (includeIO) {\n console.log(` ${chalk.dim('Output:')}`);\n console.log(indentBlock(truncateString(c.output, maxStringLength), 6));\n console.log(` ${chalk.dim('Expected:')}`);\n const expectedStrRaw = stringifyUnknown(c.expected, {\n space: 2,\n fallback: String(c.expected),\n });\n console.log(\n indentBlock(truncateString(expectedStrRaw, maxStringLength), 6),\n );\n }\n\n for (const [name, s] of entries) {\n const scoreColor = s.score >= threshold ? chalk.green : chalk.red;\n const reason = scoreReasonWithMetadata(s);\n const reasonStr = reason ? ` \\u2014 ${reason}` : '';\n console.log(\n ` ${chalk.dim(name + ':')} ${scoreColor(s.score.toFixed(3))}${reasonStr}`,\n );\n }\n\n if (c.error) {\n console.log(` ${chalk.dim('Error:')}`);\n const errorStr = formatErrorValue(c.error);\n console.log(` ${chalk.red(errorStr)}`);\n }\n\n console.log('');\n}\n\nfunction renderFailuresByScorer(cases: CaseResult[], threshold: number): void {\n const scorerNames = new Set<string>();\n for (const c of cases) {\n for (const name of Object.keys(c.scores)) {\n scorerNames.add(name);\n }\n }\n\n let hasFailures = false;\n\n for (const scorer of scorerNames) {\n const failing = cases.filter((c) => {\n const s = c.scores[scorer];\n return (\n (s && s.score < threshold) || getCaseStatus(c, threshold) === 'error'\n );\n });\n\n if (failing.length === 0) continue;\n\n if (!hasFailures) {\n console.log(chalk.dim(' Failing by scorer:'));\n console.log('');\n hasFailures = true;\n }\n\n console.log(\n ` ${chalk.bold(scorer)} ${chalk.dim(`(${failing.length} failures)`)}`,\n );\n console.log(chalk.dim(' ' + '\\u2500'.repeat(40)));\n\n for (const c of failing) {\n renderCaseDetail(c, threshold, {\n includeIO: true,\n maxStringLength: 4_000,\n });\n }\n }\n}\n", "export function truncate(str: string, maxLen = 80): string {\n if (str.length <= maxLen) return str;\n return str.slice(0, maxLen) + '...';\n}\n\nexport function formatDuration(ms: number): string {\n if (ms < 1000) return `${ms}ms`;\n return `${(ms / 1000).toFixed(1)}s`;\n}\n\nexport function formatTokens(n: number): string {\n if (n >= 1_000_000) return `${(n / 1_000_000).toFixed(1)}M`;\n if (n >= 1_000) return `${(n / 1_000).toFixed(0)}k`;\n return String(n);\n}\n\nexport function generateFilename(\n name: string,\n runId: string,\n ext: string,\n): string {\n const slug = name.replace(/[^a-zA-Z0-9-_]/g, '-').toLowerCase();\n const prefix = runId.slice(0, 8);\n return `${slug}-${prefix}.${ext}`;\n}\n\nexport function stringifyUnknown(\n value: unknown,\n options?: {\n space?: number;\n fallback?: string;\n },\n): string {\n if (typeof value === 'string') return value;\n\n const space = options?.space ?? 0;\n const fallback = options?.fallback ?? 'null';\n try {\n return JSON.stringify(value, null, space) ?? fallback;\n } catch {\n return String(value);\n }\n}\n\nexport function formatInputValue(value: unknown): string {\n return stringifyUnknown(value, { space: 0, fallback: '' });\n}\n\nexport function formatErrorValue(value: unknown): string {\n if (value == null) return '';\n if (typeof value === 'string') return value;\n return stringifyUnknown(value, { space: 2, fallback: '' });\n}\n\nexport function escapeCsv(value: unknown): string {\n const str = stringifyUnknown(value, { space: 0, fallback: 'null' });\n if (str.includes(',') || str.includes('\"') || str.includes('\\n')) {\n return `\"${str.replace(/\"/g, '\"\"')}\"`;\n }\n return str;\n}\n", "import { mkdir, writeFile } from 'node:fs/promises';\nimport { join } from 'node:path';\n\nimport { generateFilename } from './format.ts';\nimport type { CaseResult, Reporter, RunEndData } from './types.ts';\n\nconst DEFAULT_OUTPUT_DIR = '.evals/reports';\n\nexport function resolveOutputDir(outputDir?: string): string {\n return outputDir ?? DEFAULT_OUTPUT_DIR;\n}\n\nexport function getReportPath(\n outputDir: string,\n name: string,\n runId: string,\n ext: string,\n): string {\n return join(outputDir, generateFilename(name, runId, ext));\n}\n\nexport async function writeRunReportFile(\n outputDir: string,\n name: string,\n runId: string,\n ext: string,\n content: string,\n): Promise<void> {\n await mkdir(outputDir, { recursive: true });\n await writeFile(getReportPath(outputDir, name, runId, ext), content, 'utf-8');\n}\n\nexport function getCaseStatus(\n result: CaseResult,\n threshold: number,\n): 'error' | 'pass' | 'fail' {\n if (result.error) return 'error';\n const passed = Object.values(result.scores).every(\n (s) => s.score >= threshold,\n );\n return passed ? 'pass' : 'fail';\n}\n\nexport function createRunEndFileReporter(options: {\n outputDir?: string;\n ext: string;\n render: (data: RunEndData) => string | Promise<string>;\n}): Reporter {\n const outputDir = resolveOutputDir(options.outputDir);\n\n return {\n async onRunEnd(data) {\n const content = await options.render(data);\n await writeRunReportFile(\n outputDir,\n data.name,\n data.runId,\n options.ext,\n content,\n );\n },\n };\n}\n", "import { appendFile, mkdir } from 'node:fs/promises';\n\nimport { stringifyUnknown } from './format.ts';\nimport {\n getReportPath,\n resolveOutputDir,\n writeRunReportFile,\n} from './shared.ts';\nimport type { Reporter } from './types.ts';\n\nexport interface JsonReporterOptions {\n outputDir?: string;\n pretty?: boolean;\n}\n\nexport function jsonReporter(options?: JsonReporterOptions): Reporter {\n const outputDir = resolveOutputDir(options?.outputDir);\n const pretty = options?.pretty ?? true;\n let streamFilename = '';\n\n return {\n async onRunStart(data) {\n await mkdir(outputDir, { recursive: true });\n streamFilename = getReportPath(outputDir, data.name, data.runId, 'jsonl');\n },\n async onCaseEnd(data) {\n const line = stringifyUnknown(data, { space: 0, fallback: 'null' });\n await appendFile(streamFilename, line + '\\n', 'utf-8');\n },\n async onRunEnd(data) {\n const content = stringifyUnknown(data, {\n space: pretty ? 2 : 0,\n fallback: 'null',\n });\n await writeRunReportFile(\n outputDir,\n data.name,\n data.runId,\n 'json',\n content,\n );\n },\n };\n}\n", "import { escapeCsv } from './format.ts';\nimport { createRunEndFileReporter, getCaseStatus } from './shared.ts';\nimport type { Reporter } from './types.ts';\n\nexport interface CsvReporterOptions {\n outputDir?: string;\n}\n\nexport function csvReporter(options?: CsvReporterOptions): Reporter {\n return createRunEndFileReporter({\n outputDir: options?.outputDir,\n ext: 'csv',\n render(data) {\n const scorerNames = Object.keys(data.summary.meanScores);\n\n const headerParts = [\n 'index',\n 'status',\n 'input',\n 'output',\n 'expected',\n 'error',\n 'latency_ms',\n 'tokens_in',\n 'tokens_out',\n ];\n for (const name of scorerNames) {\n headerParts.push(`${name}_score`, `${name}_reason`);\n }\n\n const rows = [headerParts.join(',')];\n\n for (const c of data.cases) {\n const status = getCaseStatus(c, data.threshold);\n const parts = [\n String(c.index),\n status,\n escapeCsv(c.input),\n escapeCsv(c.output),\n escapeCsv(c.expected),\n escapeCsv(c.error ?? ''),\n String(c.latencyMs),\n String(c.tokensIn),\n String(c.tokensOut),\n ];\n for (const name of scorerNames) {\n const s = c.scores[name];\n parts.push(String(s?.score ?? ''), escapeCsv(s?.reason ?? ''));\n }\n rows.push(parts.join(','));\n }\n\n return rows.join('\\n') + '\\n';\n },\n });\n}\n", "import {\n formatDuration,\n formatErrorValue,\n formatInputValue,\n formatTokens,\n} from './format.ts';\nimport { createRunEndFileReporter, getCaseStatus } from './shared.ts';\nimport type { Reporter } from './types.ts';\n\nexport interface MarkdownReporterOptions {\n outputDir?: string;\n}\n\nexport function markdownReporter(options?: MarkdownReporterOptions): Reporter {\n return createRunEndFileReporter({\n outputDir: options?.outputDir,\n ext: 'md',\n render(data) {\n const { summary } = data;\n const scorerNames = Object.keys(summary.meanScores);\n const lines: string[] = [];\n const passRate =\n summary.totalCases > 0\n ? ((summary.passCount / summary.totalCases) * 100).toFixed(1)\n : '0.0';\n\n lines.push(`# ${data.name}`);\n lines.push('');\n lines.push(`**Model:** ${data.model}`);\n lines.push(`**Threshold:** ${data.threshold}`);\n lines.push(\n `**Cases:** ${summary.totalCases} (${summary.passCount} pass, ${summary.failCount} fail, ${passRate}%)`,\n );\n lines.push(`**Duration:** ${formatDuration(summary.totalLatencyMs)}`);\n lines.push(\n `**Tokens:** In: ${formatTokens(summary.totalTokensIn)} | Out: ${formatTokens(summary.totalTokensOut)} | Total: ${formatTokens(summary.totalTokensIn + summary.totalTokensOut)}`,\n );\n lines.push('');\n\n lines.push('## Scores');\n lines.push('');\n lines.push('| Scorer | Mean |');\n lines.push('|--------|------|');\n for (const [name, score] of Object.entries(summary.meanScores)) {\n lines.push(`| ${name} | ${score.toFixed(3)} |`);\n }\n lines.push('');\n\n lines.push('## Cases');\n lines.push('');\n\n const caseHeader = [\n '#',\n 'Status',\n 'Input',\n ...scorerNames,\n 'Latency',\n 'Tokens',\n 'Error',\n ];\n lines.push(`| ${caseHeader.join(' | ')} |`);\n lines.push(`| ${caseHeader.map(() => '---').join(' | ')} |`);\n\n for (const c of data.cases) {\n const statusValue = getCaseStatus(c, data.threshold);\n const status =\n statusValue === 'error'\n ? '\uD83D\uDD34 Error'\n : statusValue === 'pass'\n ? '\u2705 Pass'\n : '\u274C Fail';\n const input = formatInputValue(c.input).slice(0, 60);\n const scores = scorerNames.map(\n (name) => c.scores[name]?.score.toFixed(3) ?? '-',\n );\n const error = c.error\n ? formatErrorValue(c.error)\n .replace(/\\r?\\n/g, '<br>')\n .replace(/\\|/g, '\\\\|')\n : '-';\n const row = [\n String(c.index),\n status,\n input,\n ...scores,\n formatDuration(c.latencyMs),\n `${c.tokensIn}/${c.tokensOut}`,\n error,\n ];\n lines.push(`| ${row.join(' | ')} |`);\n }\n lines.push('');\n\n return lines.join('\\n');\n },\n });\n}\n", "import {\n formatDuration,\n formatErrorValue,\n formatInputValue,\n formatTokens,\n stringifyUnknown,\n} from './format.ts';\nimport { createRunEndFileReporter, getCaseStatus } from './shared.ts';\nimport type { Reporter, RunEndData } from './types.ts';\n\nexport interface HtmlReporterOptions {\n outputDir?: string;\n}\n\nexport function htmlReporter(options?: HtmlReporterOptions): Reporter {\n return createRunEndFileReporter({\n outputDir: options?.outputDir,\n ext: 'html',\n render: renderHtml,\n });\n}\n\nfunction esc(str: string): string {\n return str\n .replace(/&/g, '&amp;')\n .replace(/</g, '&lt;')\n .replace(/>/g, '&gt;')\n .replace(/\"/g, '&quot;');\n}\n\nfunction renderHtml(data: RunEndData): string {\n const { summary } = data;\n const scorerNames = Object.keys(summary.meanScores);\n const passRate =\n summary.totalCases > 0\n ? ((summary.passCount / summary.totalCases) * 100).toFixed(1)\n : '0.0';\n\n const caseRows = data.cases\n .map((c) => {\n const status = getCaseStatus(c, data.threshold);\n const statusLabel =\n status === 'error' ? 'ERROR' : status === 'pass' ? 'PASS' : 'FAIL';\n const scoresCells = scorerNames\n .map((name) => {\n const s = c.scores[name];\n const score = s?.score ?? 0;\n const cls = score >= data.threshold ? 'pass' : 'fail';\n const reason = s?.reason ? ` title=\"${esc(s.reason)}\"` : '';\n return `<td class=\"${cls}\"${reason}>${score.toFixed(3)}</td>`;\n })\n .join('');\n\n const expectedStr = stringifyUnknown(c.expected, {\n space: 0,\n fallback: '',\n });\n\n return `<tr class=\"${status}\">\n <td>${c.index}</td>\n <td class=\"${status}\">${statusLabel}</td>\n <td class=\"text\">${esc(formatInputValue(c.input).slice(0, 120))}</td>\n <td class=\"text\">${esc(c.output.slice(0, 120))}</td>\n <td class=\"text\">${esc(expectedStr.slice(0, 120))}</td>\n ${scoresCells}\n <td>${formatDuration(c.latencyMs)}</td>\n <td>${c.tokensIn}/${c.tokensOut}</td>\n <td class=\"error-text\">${c.error ? esc(formatErrorValue(c.error)) : ''}</td>\n </tr>`;\n })\n .join('\\n');\n\n const scorerHeaders = scorerNames.map((n) => `<th>${esc(n)}</th>`).join('');\n const meanScoreRows = Object.entries(summary.meanScores)\n .map(\n ([name, score]) =>\n `<tr><td>${esc(name)}</td><td>${score.toFixed(3)}</td></tr>`,\n )\n .join('');\n\n return `<!DOCTYPE html>\n<html lang=\"en\">\n<head>\n<meta charset=\"utf-8\">\n<title>${esc(data.name)} \u2014 Eval Report</title>\n<style>\n * { box-sizing: border-box; margin: 0; padding: 0; }\n body { font-family: system-ui, -apple-system, sans-serif; background: #f8f9fa; color: #1a1a1a; padding: 2rem; }\n h1 { font-size: 1.5rem; margin-bottom: 0.5rem; }\n .meta { color: #666; margin-bottom: 1.5rem; font-size: 0.9rem; }\n .meta span { margin-right: 1.5rem; }\n .summary-table, .cases-table { width: 100%; border-collapse: collapse; margin-bottom: 2rem; }\n .summary-table th, .summary-table td,\n .cases-table th, .cases-table td { padding: 0.5rem 0.75rem; border: 1px solid #ddd; text-align: left; font-size: 0.85rem; }\n .summary-table th, .cases-table th { background: #f1f3f5; font-weight: 600; }\n .cases-table .text { max-width: 300px; overflow: hidden; text-overflow: ellipsis; white-space: nowrap; }\n .cases-table .error-text { max-width: 480px; white-space: pre-wrap; word-break: break-word; }\n .pass { color: #2b8a3e; }\n .fail { color: #c92a2a; }\n .error { color: #e67700; }\n tr.pass:hover, tr.fail:hover, tr.error:hover { background: #f1f3f5; }\n td.pass { background: #ebfbee; }\n td.fail { background: #fff5f5; }\n h2 { font-size: 1.2rem; margin: 1.5rem 0 0.75rem; }\n</style>\n</head>\n<body>\n <h1>${esc(data.name)}</h1>\n <div class=\"meta\">\n <span><strong>Model:</strong> ${esc(data.model)}</span>\n <span><strong>Threshold:</strong> ${data.threshold}</span>\n <span><strong>Cases:</strong> ${summary.totalCases}</span>\n <span><strong>Pass:</strong> ${summary.passCount}</span>\n <span><strong>Fail:</strong> ${summary.failCount} (${passRate}%)</span>\n <span><strong>Duration:</strong> ${formatDuration(summary.totalLatencyMs)}</span>\n <span><strong>Tokens In:</strong> ${formatTokens(summary.totalTokensIn)}</span>\n <span><strong>Tokens Out:</strong> ${formatTokens(summary.totalTokensOut)}</span>\n <span><strong>Total Tokens:</strong> ${formatTokens(summary.totalTokensIn + summary.totalTokensOut)}</span>\n </div>\n\n <h2>Mean Scores</h2>\n <table class=\"summary-table\">\n <thead><tr><th>Scorer</th><th>Mean</th></tr></thead>\n <tbody>${meanScoreRows}</tbody>\n </table>\n\n <h2>Cases</h2>\n <table class=\"cases-table\">\n <thead>\n <tr>\n <th>#</th>\n <th>Status</th>\n <th>Input</th>\n <th>Output</th>\n <th>Expected</th>\n ${scorerHeaders}\n <th>Latency</th>\n <th>Tokens</th>\n <th>Error</th>\n </tr>\n </thead>\n <tbody>\n ${caseRows}\n </tbody>\n </table>\n</body>\n</html>`;\n}\n"],
5
+ "mappings": ";AAAA,OAAO,WAAW;;;ACKX,SAAS,eAAe,IAAoB;AACjD,MAAI,KAAK,IAAM,QAAO,GAAG,EAAE;AAC3B,SAAO,IAAI,KAAK,KAAM,QAAQ,CAAC,CAAC;AAClC;AAEO,SAAS,aAAa,GAAmB;AAC9C,MAAI,KAAK,IAAW,QAAO,IAAI,IAAI,KAAW,QAAQ,CAAC,CAAC;AACxD,MAAI,KAAK,IAAO,QAAO,IAAI,IAAI,KAAO,QAAQ,CAAC,CAAC;AAChD,SAAO,OAAO,CAAC;AACjB;AAEO,SAAS,iBACd,MACA,OACA,KACQ;AACR,QAAM,OAAO,KAAK,QAAQ,mBAAmB,GAAG,EAAE,YAAY;AAC9D,QAAM,SAAS,MAAM,MAAM,GAAG,CAAC;AAC/B,SAAO,GAAG,IAAI,IAAI,MAAM,IAAI,GAAG;AACjC;AAEO,SAAS,iBACd,OACA,SAIQ;AACR,MAAI,OAAO,UAAU,SAAU,QAAO;AAEtC,QAAM,QAAQ,SAAS,SAAS;AAChC,QAAM,WAAW,SAAS,YAAY;AACtC,MAAI;AACF,WAAO,KAAK,UAAU,OAAO,MAAM,KAAK,KAAK;AAAA,EAC/C,QAAQ;AACN,WAAO,OAAO,KAAK;AAAA,EACrB;AACF;AAEO,SAAS,iBAAiB,OAAwB;AACvD,SAAO,iBAAiB,OAAO,EAAE,OAAO,GAAG,UAAU,GAAG,CAAC;AAC3D;AAEO,SAAS,iBAAiB,OAAwB;AACvD,MAAI,SAAS,KAAM,QAAO;AAC1B,MAAI,OAAO,UAAU,SAAU,QAAO;AACtC,SAAO,iBAAiB,OAAO,EAAE,OAAO,GAAG,UAAU,GAAG,CAAC;AAC3D;AAEO,SAAS,UAAU,OAAwB;AAChD,QAAM,MAAM,iBAAiB,OAAO,EAAE,OAAO,GAAG,UAAU,OAAO,CAAC;AAClE,MAAI,IAAI,SAAS,GAAG,KAAK,IAAI,SAAS,GAAG,KAAK,IAAI,SAAS,IAAI,GAAG;AAChE,WAAO,IAAI,IAAI,QAAQ,MAAM,IAAI,CAAC;AAAA,EACpC;AACA,SAAO;AACT;;;AC5DA,SAAS,OAAO,iBAAiB;AACjC,SAAS,YAAY;AAKrB,IAAM,qBAAqB;AAEpB,SAAS,iBAAiB,WAA4B;AAC3D,SAAO,aAAa;AACtB;AAEO,SAAS,cACd,WACA,MACA,OACA,KACQ;AACR,SAAO,KAAK,WAAW,iBAAiB,MAAM,OAAO,GAAG,CAAC;AAC3D;AAEA,eAAsB,mBACpB,WACA,MACA,OACA,KACA,SACe;AACf,QAAM,MAAM,WAAW,EAAE,WAAW,KAAK,CAAC;AAC1C,QAAM,UAAU,cAAc,WAAW,MAAM,OAAO,GAAG,GAAG,SAAS,OAAO;AAC9E;AAEO,SAAS,cACd,QACA,WAC2B;AAC3B,MAAI,OAAO,MAAO,QAAO;AACzB,QAAM,SAAS,OAAO,OAAO,OAAO,MAAM,EAAE;AAAA,IAC1C,CAAC,MAAM,EAAE,SAAS;AAAA,EACpB;AACA,SAAO,SAAS,SAAS;AAC3B;AAEO,SAAS,yBAAyB,SAI5B;AACX,QAAM,YAAY,iBAAiB,QAAQ,SAAS;AAEpD,SAAO;AAAA,IACL,MAAM,SAAS,MAAM;AACnB,YAAM,UAAU,MAAM,QAAQ,OAAO,IAAI;AACzC,YAAM;AAAA,QACJ;AAAA,QACA,KAAK;AAAA,QACL,KAAK;AAAA,QACL,QAAQ;AAAA,QACR;AAAA,MACF;AAAA,IACF;AAAA,EACF;AACF;;;AF/CA,IAAM,YAAY;AAElB,SAAS,kBACP,WACA,OACA,WACQ;AACR,QAAM,MAAM,QAAQ,IAAI,YAAY,QAAQ;AAC5C,QAAM,SAAS,KAAK,MAAM,MAAM,SAAS;AACzC,QAAM,MAAM,SAAS,OAAO,MAAM,IAAI,SAAS,OAAO,YAAY,MAAM;AACxE,QAAM,SAAS,IAAI,MAAM,KAAK,QAAQ,CAAC,CAAC;AACxC,SAAO,KAAK,GAAG,IAAI,MAAM,KAAK,SAAS,IAAI,KAAK,KAAK,eAAe,SAAS,CAAC;AAChF;AAEA,SAAS,YAAY,QAA2C;AAC9D,MAAI,WAAW,OAAQ,QAAO,MAAM,MAAM,MAAM;AAChD,MAAI,WAAW,QAAS,QAAO,MAAM,OAAO,OAAO;AACnD,SAAO,MAAM,IAAI,MAAM;AACzB;AAEO,SAAS,gBAAgB,SAA4C;AAC1E,QAAM,YAAY,SAAS,aAAa;AAExC,MAAI,aAAa;AACjB,MAAI,YAAY;AAChB,MAAI,YAAY;AAEhB,SAAO;AAAA,IACL,WAAW,MAAM;AACf,mBAAa,KAAK;AAClB,kBAAY;AACZ,kBAAY,KAAK,IAAI;AAErB,UAAI,cAAc,SAAS;AACzB,cAAM,QAAQ,KAAK;AACnB,gBAAQ,IAAI,EAAE;AACd,gBAAQ;AAAA,UACN,KAAK,MAAM,IAAI,cAAc,CAAC,IAAI,MAAM,KAAK,KAAK,CAAC,IAAI,MAAM,IAAI,SAAS,OAAO,KAAK,IAAI,GAAG,KAAK,MAAM,MAAM,CAAC,CAAC,CAAC;AAAA,QACnH;AACA,gBAAQ,IAAI,KAAK,MAAM,IAAI,WAAW,KAAK,UAAU,WAAW,CAAC,EAAE;AACnE,gBAAQ,IAAI,EAAE;AAAA,MAChB;AAAA,IACF;AAAA,IAEA,YAAY;AACV;AACA,UAAI,cAAc,SAAS;AACzB,cAAM,UAAU,KAAK,IAAI,IAAI;AAC7B,gBAAQ,OAAO;AAAA,UACb,KAAK,kBAAkB,WAAW,YAAY,OAAO,CAAC;AAAA,QACxD;AAAA,MACF;AAAA,IACF;AAAA,IAEA,SAAS,MAAM;AACb,UAAI,cAAc,SAAS;AACzB,gBAAQ,OAAO,MAAM,OAAO,IAAI,OAAO,EAAE,IAAI,IAAI;AAAA,MACnD;AAEA,yBAAmB,IAAI;AAEvB,UAAI,cAAc,QAAS;AAE3B,YAAM,SAAS,CAAC,GAAG,KAAK,KAAK,EAAE,KAAK,CAAC,GAAG,MAAM,EAAE,QAAQ,EAAE,KAAK;AAE/D,UAAI,cAAc,WAAW;AAC3B,mBAAW,KAAK,QAAQ;AACtB,2BAAiB,GAAG,KAAK,WAAW;AAAA,YAClC,WAAW;AAAA,YACX,iBAAiB;AAAA,UACnB,CAAC;AAAA,QACH;AAAA,MACF,OAAO;AACL,+BAAuB,QAAQ,KAAK,SAAS;AAAA,MAC/C;AAAA,IACF;AAAA,EACF;AACF;AAEA,SAAS,YAAY,MAAc,QAAwB;AACzD,QAAM,MAAM,IAAI,OAAO,MAAM;AAC7B,SAAO,KACJ,QAAQ,SAAS,IAAI,EACrB,MAAM,IAAI,EACV,IAAI,CAAC,SAAS,MAAM,IAAI,EACxB,KAAK,IAAI;AACd;AAEA,SAAS,eAAe,MAAc,WAA2B;AAC/D,MAAI,KAAK,UAAU,UAAW,QAAO;AACrC,SAAO,KAAK,MAAM,GAAG,SAAS,IAAI;AACpC;AAEA,SAAS,mBAAmB,OAAoC;AAC9D,MAAI,OAAO,UAAU,UAAU;AAC7B,UAAM,UAAU,MAAM,KAAK;AAC3B,WAAO,QAAQ,SAAS,IAAI,UAAU;AAAA,EACxC;AAEA,MAAI,MAAM,QAAQ,KAAK,GAAG;AACxB,UAAM,QAAQ,MACX,IAAI,CAAC,SAAU,OAAO,SAAS,WAAW,KAAK,KAAK,IAAI,EAAG,EAC3D,OAAO,OAAO;AACjB,QAAI,MAAM,SAAS,EAAG,QAAO,MAAM,KAAK,KAAK;AAAA,EAC/C;AAEA,SAAO;AACT;AAEA,SAAS,wBAAwB,OAGV;AACrB,QAAM,SAAS,MAAM,QAAQ,KAAK;AAClC,MAAI,OAAQ,QAAO;AACnB,SAAO,mBAAmB,MAAM,WAAW,WAAW,CAAC;AACzD;AAEA,SAAS,mBAAmB,MAAwB;AAClD,QAAM,EAAE,QAAQ,IAAI;AACpB,QAAM,WACJ,QAAQ,aAAa,KACf,QAAQ,YAAY,QAAQ,aAAc,KAAK,QAAQ,CAAC,IAC1D;AAEN,UAAQ,IAAI,EAAE;AACd,UAAQ,IAAI,MAAM,KAAK,WAAW,CAAC;AACnC,UAAQ,IAAI,MAAM,IAAI,OAAO,SAAS,OAAO,EAAE,CAAC,CAAC;AACjD,UAAQ,IAAI,KAAK,MAAM,IAAI,OAAO,CAAC,SAAS,KAAK,IAAI,EAAE;AACvD,UAAQ,IAAI,KAAK,MAAM,IAAI,QAAQ,CAAC,QAAQ,KAAK,KAAK,EAAE;AACxD,UAAQ,IAAI,KAAK,MAAM,IAAI,YAAY,CAAC,IAAI,KAAK,SAAS,EAAE;AAC5D,UAAQ,IAAI,KAAK,MAAM,IAAI,QAAQ,CAAC,QAAQ,QAAQ,UAAU,EAAE;AAChE,UAAQ;AAAA,IACN,KAAK,MAAM,IAAI,YAAY,CAAC,IAAI,MAAM,MAAM,OAAO,QAAQ,SAAS,CAAC,CAAC,MAAM,MAAM,IAAI,OAAO,QAAQ,SAAS,CAAC,CAAC,IAAI,MAAM,IAAI,IAAI,QAAQ,IAAI,CAAC;AAAA,EACjJ;AACA,UAAQ;AAAA,IACN,KAAK,MAAM,IAAI,WAAW,CAAC,KAAK,eAAe,QAAQ,cAAc,CAAC;AAAA,EACxE;AACA,UAAQ;AAAA,IACN,KAAK,MAAM,IAAI,SAAS,CAAC,OAAO,MAAM,IAAI,KAAK,CAAC,IAAI,aAAa,QAAQ,aAAa,CAAC,KAAK,MAAM,IAAI,MAAM,CAAC,IAAI,aAAa,QAAQ,cAAc,CAAC,KAAK,MAAM,IAAI,QAAQ,CAAC,IAAI,aAAa,QAAQ,gBAAgB,QAAQ,cAAc,CAAC;AAAA,EAC/O;AAEA,QAAM,eAAe,OAAO,QAAQ,QAAQ,UAAU;AACtD,MAAI,aAAa,SAAS,GAAG;AAC3B,YAAQ,IAAI,EAAE;AACd,YAAQ,IAAI,MAAM,KAAK,UAAU,CAAC;AAClC,eAAW,CAAC,MAAM,KAAK,KAAK,cAAc;AACxC,YAAM,aAAa,SAAS,KAAK,YAAY,MAAM,QAAQ,MAAM;AACjE,cAAQ;AAAA,QACN,OAAO,MAAM,IAAI,OAAO,GAAG,CAAC,GAAG,IAAI,OAAO,KAAK,IAAI,GAAG,KAAK,KAAK,MAAM,CAAC,CAAC,GAAG,WAAW,MAAM,QAAQ,CAAC,CAAC,CAAC;AAAA,MACzG;AAAA,IACF;AAAA,EACF;AAEA,UAAQ,IAAI,MAAM,IAAI,OAAO,SAAS,OAAO,EAAE,CAAC,CAAC;AACjD,UAAQ,IAAI,EAAE;AAChB;AAEA,SAAS,iBACP,GACA,WACA,SAIM;AACN,QAAM,UAAU,OAAO,QAAQ,EAAE,MAAM;AACvC,QAAM,SAAS,cAAc,GAAG,SAAS;AACzC,QAAM,SAAS,YAAY,MAAM;AACjC,QAAM,YAAY,SAAS,aAAa;AACxC,QAAM,kBAAkB,SAAS,mBAAmB;AAEpD,QAAM,OAAO,GAAG,MAAM,IAAI,eAAe,EAAE,SAAS,CAAC,CAAC,KAAK,MAAM,IAAI,GAAG,EAAE,QAAQ,IAAI,EAAE,SAAS,SAAS,CAAC;AAC3G,UAAQ,IAAI,KAAK,MAAM,IAAI,MAAM,IAAI,SAAS,EAAE,KAAK,EAAE,CAAC,KAAK,IAAI,EAAE;AAEnE,QAAM,WAAW,iBAAiB,EAAE,OAAO;AAAA,IACzC,OAAO;AAAA,IACP,UAAU,OAAO,EAAE,KAAK;AAAA,EAC1B,CAAC;AACD,UAAQ,IAAI,OAAO,MAAM,IAAI,QAAQ,CAAC,EAAE;AACxC,UAAQ,IAAI,YAAY,eAAe,UAAU,eAAe,GAAG,CAAC,CAAC;AAErE,MAAI,WAAW;AACb,YAAQ,IAAI,OAAO,MAAM,IAAI,SAAS,CAAC,EAAE;AACzC,YAAQ,IAAI,YAAY,eAAe,EAAE,QAAQ,eAAe,GAAG,CAAC,CAAC;AACrE,YAAQ,IAAI,OAAO,MAAM,IAAI,WAAW,CAAC,EAAE;AAC3C,UAAM,iBAAiB,iBAAiB,EAAE,UAAU;AAAA,MAClD,OAAO;AAAA,MACP,UAAU,OAAO,EAAE,QAAQ;AAAA,IAC7B,CAAC;AACD,YAAQ;AAAA,MACN,YAAY,eAAe,gBAAgB,eAAe,GAAG,CAAC;AAAA,IAChE;AAAA,EACF;AAEA,aAAW,CAAC,MAAM,CAAC,KAAK,SAAS;AAC/B,UAAM,aAAa,EAAE,SAAS,YAAY,MAAM,QAAQ,MAAM;AAC9D,UAAM,SAAS,wBAAwB,CAAC;AACxC,UAAM,YAAY,SAAS,WAAW,MAAM,KAAK;AACjD,YAAQ;AAAA,MACN,OAAO,MAAM,IAAI,OAAO,GAAG,CAAC,IAAI,WAAW,EAAE,MAAM,QAAQ,CAAC,CAAC,CAAC,GAAG,SAAS;AAAA,IAC5E;AAAA,EACF;AAEA,MAAI,EAAE,OAAO;AACX,YAAQ,IAAI,OAAO,MAAM,IAAI,QAAQ,CAAC,EAAE;AACxC,UAAM,WAAW,iBAAiB,EAAE,KAAK;AACzC,YAAQ,IAAI,SAAS,MAAM,IAAI,QAAQ,CAAC,EAAE;AAAA,EAC5C;AAEA,UAAQ,IAAI,EAAE;AAChB;AAEA,SAAS,uBAAuB,OAAqB,WAAyB;AAC5E,QAAM,cAAc,oBAAI,IAAY;AACpC,aAAW,KAAK,OAAO;AACrB,eAAW,QAAQ,OAAO,KAAK,EAAE,MAAM,GAAG;AACxC,kBAAY,IAAI,IAAI;AAAA,IACtB;AAAA,EACF;AAEA,MAAI,cAAc;AAElB,aAAW,UAAU,aAAa;AAChC,UAAM,UAAU,MAAM,OAAO,CAAC,MAAM;AAClC,YAAM,IAAI,EAAE,OAAO,MAAM;AACzB,aACG,KAAK,EAAE,QAAQ,aAAc,cAAc,GAAG,SAAS,MAAM;AAAA,IAElE,CAAC;AAED,QAAI,QAAQ,WAAW,EAAG;AAE1B,QAAI,CAAC,aAAa;AAChB,cAAQ,IAAI,MAAM,IAAI,sBAAsB,CAAC;AAC7C,cAAQ,IAAI,EAAE;AACd,oBAAc;AAAA,IAChB;AAEA,YAAQ;AAAA,MACN,KAAK,MAAM,KAAK,MAAM,CAAC,IAAI,MAAM,IAAI,IAAI,QAAQ,MAAM,YAAY,CAAC;AAAA,IACtE;AACA,YAAQ,IAAI,MAAM,IAAI,OAAO,SAAS,OAAO,EAAE,CAAC,CAAC;AAEjD,eAAW,KAAK,SAAS;AACvB,uBAAiB,GAAG,WAAW;AAAA,QAC7B,WAAW;AAAA,QACX,iBAAiB;AAAA,MACnB,CAAC;AAAA,IACH;AAAA,EACF;AACF;;;AG1QA,SAAS,YAAY,SAAAA,cAAa;AAe3B,SAAS,aAAa,SAAyC;AACpE,QAAM,YAAY,iBAAiB,SAAS,SAAS;AACrD,QAAM,SAAS,SAAS,UAAU;AAClC,MAAI,iBAAiB;AAErB,SAAO;AAAA,IACL,MAAM,WAAW,MAAM;AACrB,YAAMC,OAAM,WAAW,EAAE,WAAW,KAAK,CAAC;AAC1C,uBAAiB,cAAc,WAAW,KAAK,MAAM,KAAK,OAAO,OAAO;AAAA,IAC1E;AAAA,IACA,MAAM,UAAU,MAAM;AACpB,YAAM,OAAO,iBAAiB,MAAM,EAAE,OAAO,GAAG,UAAU,OAAO,CAAC;AAClE,YAAM,WAAW,gBAAgB,OAAO,MAAM,OAAO;AAAA,IACvD;AAAA,IACA,MAAM,SAAS,MAAM;AACnB,YAAM,UAAU,iBAAiB,MAAM;AAAA,QACrC,OAAO,SAAS,IAAI;AAAA,QACpB,UAAU;AAAA,MACZ,CAAC;AACD,YAAM;AAAA,QACJ;AAAA,QACA,KAAK;AAAA,QACL,KAAK;AAAA,QACL;AAAA,QACA;AAAA,MACF;AAAA,IACF;AAAA,EACF;AACF;;;ACnCO,SAAS,YAAY,SAAwC;AAClE,SAAO,yBAAyB;AAAA,IAC9B,WAAW,SAAS;AAAA,IACpB,KAAK;AAAA,IACL,OAAO,MAAM;AACX,YAAM,cAAc,OAAO,KAAK,KAAK,QAAQ,UAAU;AAEvD,YAAM,cAAc;AAAA,QAClB;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,MACF;AACA,iBAAW,QAAQ,aAAa;AAC9B,oBAAY,KAAK,GAAG,IAAI,UAAU,GAAG,IAAI,SAAS;AAAA,MACpD;AAEA,YAAM,OAAO,CAAC,YAAY,KAAK,GAAG,CAAC;AAEnC,iBAAW,KAAK,KAAK,OAAO;AAC1B,cAAM,SAAS,cAAc,GAAG,KAAK,SAAS;AAC9C,cAAM,QAAQ;AAAA,UACZ,OAAO,EAAE,KAAK;AAAA,UACd;AAAA,UACA,UAAU,EAAE,KAAK;AAAA,UACjB,UAAU,EAAE,MAAM;AAAA,UAClB,UAAU,EAAE,QAAQ;AAAA,UACpB,UAAU,EAAE,SAAS,EAAE;AAAA,UACvB,OAAO,EAAE,SAAS;AAAA,UAClB,OAAO,EAAE,QAAQ;AAAA,UACjB,OAAO,EAAE,SAAS;AAAA,QACpB;AACA,mBAAW,QAAQ,aAAa;AAC9B,gBAAM,IAAI,EAAE,OAAO,IAAI;AACvB,gBAAM,KAAK,OAAO,GAAG,SAAS,EAAE,GAAG,UAAU,GAAG,UAAU,EAAE,CAAC;AAAA,QAC/D;AACA,aAAK,KAAK,MAAM,KAAK,GAAG,CAAC;AAAA,MAC3B;AAEA,aAAO,KAAK,KAAK,IAAI,IAAI;AAAA,IAC3B;AAAA,EACF,CAAC;AACH;;;AC1CO,SAAS,iBAAiB,SAA6C;AAC5E,SAAO,yBAAyB;AAAA,IAC9B,WAAW,SAAS;AAAA,IACpB,KAAK;AAAA,IACL,OAAO,MAAM;AACX,YAAM,EAAE,QAAQ,IAAI;AACpB,YAAM,cAAc,OAAO,KAAK,QAAQ,UAAU;AAClD,YAAM,QAAkB,CAAC;AACzB,YAAM,WACJ,QAAQ,aAAa,KACf,QAAQ,YAAY,QAAQ,aAAc,KAAK,QAAQ,CAAC,IAC1D;AAEN,YAAM,KAAK,KAAK,KAAK,IAAI,EAAE;AAC3B,YAAM,KAAK,EAAE;AACb,YAAM,KAAK,cAAc,KAAK,KAAK,EAAE;AACrC,YAAM,KAAK,kBAAkB,KAAK,SAAS,EAAE;AAC7C,YAAM;AAAA,QACJ,cAAc,QAAQ,UAAU,KAAK,QAAQ,SAAS,UAAU,QAAQ,SAAS,UAAU,QAAQ;AAAA,MACrG;AACA,YAAM,KAAK,iBAAiB,eAAe,QAAQ,cAAc,CAAC,EAAE;AACpE,YAAM;AAAA,QACJ,mBAAmB,aAAa,QAAQ,aAAa,CAAC,WAAW,aAAa,QAAQ,cAAc,CAAC,aAAa,aAAa,QAAQ,gBAAgB,QAAQ,cAAc,CAAC;AAAA,MAChL;AACA,YAAM,KAAK,EAAE;AAEb,YAAM,KAAK,WAAW;AACtB,YAAM,KAAK,EAAE;AACb,YAAM,KAAK,mBAAmB;AAC9B,YAAM,KAAK,mBAAmB;AAC9B,iBAAW,CAAC,MAAM,KAAK,KAAK,OAAO,QAAQ,QAAQ,UAAU,GAAG;AAC9D,cAAM,KAAK,KAAK,IAAI,MAAM,MAAM,QAAQ,CAAC,CAAC,IAAI;AAAA,MAChD;AACA,YAAM,KAAK,EAAE;AAEb,YAAM,KAAK,UAAU;AACrB,YAAM,KAAK,EAAE;AAEb,YAAM,aAAa;AAAA,QACjB;AAAA,QACA;AAAA,QACA;AAAA,QACA,GAAG;AAAA,QACH;AAAA,QACA;AAAA,QACA;AAAA,MACF;AACA,YAAM,KAAK,KAAK,WAAW,KAAK,KAAK,CAAC,IAAI;AAC1C,YAAM,KAAK,KAAK,WAAW,IAAI,MAAM,KAAK,EAAE,KAAK,KAAK,CAAC,IAAI;AAE3D,iBAAW,KAAK,KAAK,OAAO;AAC1B,cAAM,cAAc,cAAc,GAAG,KAAK,SAAS;AACnD,cAAM,SACJ,gBAAgB,UACZ,oBACA,gBAAgB,SACd,gBACA;AACR,cAAM,QAAQ,iBAAiB,EAAE,KAAK,EAAE,MAAM,GAAG,EAAE;AACnD,cAAM,SAAS,YAAY;AAAA,UACzB,CAAC,SAAS,EAAE,OAAO,IAAI,GAAG,MAAM,QAAQ,CAAC,KAAK;AAAA,QAChD;AACA,cAAM,QAAQ,EAAE,QACZ,iBAAiB,EAAE,KAAK,EACrB,QAAQ,UAAU,MAAM,EACxB,QAAQ,OAAO,KAAK,IACvB;AACJ,cAAM,MAAM;AAAA,UACV,OAAO,EAAE,KAAK;AAAA,UACd;AAAA,UACA;AAAA,UACA,GAAG;AAAA,UACH,eAAe,EAAE,SAAS;AAAA,UAC1B,GAAG,EAAE,QAAQ,IAAI,EAAE,SAAS;AAAA,UAC5B;AAAA,QACF;AACA,cAAM,KAAK,KAAK,IAAI,KAAK,KAAK,CAAC,IAAI;AAAA,MACrC;AACA,YAAM,KAAK,EAAE;AAEb,aAAO,MAAM,KAAK,IAAI;AAAA,IACxB;AAAA,EACF,CAAC;AACH;;;AClFO,SAAS,aAAa,SAAyC;AACpE,SAAO,yBAAyB;AAAA,IAC9B,WAAW,SAAS;AAAA,IACpB,KAAK;AAAA,IACL,QAAQ;AAAA,EACV,CAAC;AACH;AAEA,SAAS,IAAI,KAAqB;AAChC,SAAO,IACJ,QAAQ,MAAM,OAAO,EACrB,QAAQ,MAAM,MAAM,EACpB,QAAQ,MAAM,MAAM,EACpB,QAAQ,MAAM,QAAQ;AAC3B;AAEA,SAAS,WAAW,MAA0B;AAC5C,QAAM,EAAE,QAAQ,IAAI;AACpB,QAAM,cAAc,OAAO,KAAK,QAAQ,UAAU;AAClD,QAAM,WACJ,QAAQ,aAAa,KACf,QAAQ,YAAY,QAAQ,aAAc,KAAK,QAAQ,CAAC,IAC1D;AAEN,QAAM,WAAW,KAAK,MACnB,IAAI,CAAC,MAAM;AACV,UAAM,SAAS,cAAc,GAAG,KAAK,SAAS;AAC9C,UAAMC,eACJ,WAAW,UAAU,UAAU,WAAW,SAAS,SAAS;AAC9D,UAAM,cAAc,YACjB,IAAI,CAAC,SAAS;AACb,YAAM,IAAI,EAAE,OAAO,IAAI;AACvB,YAAM,QAAQ,GAAG,SAAS;AAC1B,YAAM,MAAM,SAAS,KAAK,YAAY,SAAS;AAC/C,YAAM,SAAS,GAAG,SAAS,WAAW,IAAI,EAAE,MAAM,CAAC,MAAM;AACzD,aAAO,cAAc,GAAG,IAAI,MAAM,IAAI,MAAM,QAAQ,CAAC,CAAC;AAAA,IACxD,CAAC,EACA,KAAK,EAAE;AAEV,UAAM,cAAc,iBAAiB,EAAE,UAAU;AAAA,MAC/C,OAAO;AAAA,MACP,UAAU;AAAA,IACZ,CAAC;AAED,WAAO,cAAc,MAAM;AAAA,cACnB,EAAE,KAAK;AAAA,qBACA,MAAM,KAAKA,YAAW;AAAA,2BAChB,IAAI,iBAAiB,EAAE,KAAK,EAAE,MAAM,GAAG,GAAG,CAAC,CAAC;AAAA,2BAC5C,IAAI,EAAE,OAAO,MAAM,GAAG,GAAG,CAAC,CAAC;AAAA,2BAC3B,IAAI,YAAY,MAAM,GAAG,GAAG,CAAC,CAAC;AAAA,UAC/C,WAAW;AAAA,cACP,eAAe,EAAE,SAAS,CAAC;AAAA,cAC3B,EAAE,QAAQ,IAAI,EAAE,SAAS;AAAA,iCACN,EAAE,QAAQ,IAAI,iBAAiB,EAAE,KAAK,CAAC,IAAI,EAAE;AAAA;AAAA,EAE1E,CAAC,EACA,KAAK,IAAI;AAEZ,QAAM,gBAAgB,YAAY,IAAI,CAAC,MAAM,OAAO,IAAI,CAAC,CAAC,OAAO,EAAE,KAAK,EAAE;AAC1E,QAAM,gBAAgB,OAAO,QAAQ,QAAQ,UAAU,EACpD;AAAA,IACC,CAAC,CAAC,MAAM,KAAK,MACX,WAAW,IAAI,IAAI,CAAC,YAAY,MAAM,QAAQ,CAAC,CAAC;AAAA,EACpD,EACC,KAAK,EAAE;AAEV,SAAO;AAAA;AAAA;AAAA;AAAA,SAIA,IAAI,KAAK,IAAI,CAAC;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,QAuBf,IAAI,KAAK,IAAI,CAAC;AAAA;AAAA,oCAEc,IAAI,KAAK,KAAK,CAAC;AAAA,wCACX,KAAK,SAAS;AAAA,oCAClB,QAAQ,UAAU;AAAA,mCACnB,QAAQ,SAAS;AAAA,mCACjB,QAAQ,SAAS,KAAK,QAAQ;AAAA,uCAC1B,eAAe,QAAQ,cAAc,CAAC;AAAA,wCACrC,aAAa,QAAQ,aAAa,CAAC;AAAA,yCAClC,aAAa,QAAQ,cAAc,CAAC;AAAA,2CAClC,aAAa,QAAQ,gBAAgB,QAAQ,cAAc,CAAC;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,aAM1F,aAAa;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,UAYhB,aAAa;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,QAOf,QAAQ;AAAA;AAAA;AAAA;AAAA;AAKhB;",
6
6
  "names": ["mkdir", "mkdir", "statusLabel"]
7
7
  }
@@ -1,4 +1,3 @@
1
- import type { LanguageModelV3 } from '@ai-sdk/provider';
2
1
  export interface ScorerArgs {
3
2
  input: unknown;
4
3
  output: string;
@@ -7,6 +6,7 @@ export interface ScorerArgs {
7
6
  export interface ScorerResult {
8
7
  score: number;
9
8
  reason?: string;
9
+ metadata?: Record<string, unknown>;
10
10
  }
11
11
  export type Scorer = (args: ScorerArgs) => Promise<ScorerResult>;
12
12
  export declare const exactMatch: Scorer;
@@ -14,12 +14,8 @@ export declare const includes: Scorer;
14
14
  export declare function regex(pattern: RegExp): Scorer;
15
15
  export declare const levenshtein: Scorer;
16
16
  export declare const jsonMatch: Scorer;
17
- export declare function llmJudge(config: {
18
- model: LanguageModelV3;
19
- criteria: string;
20
- }): Scorer;
21
17
  export declare function factuality(config: {
22
- model: LanguageModelV3;
18
+ model: string;
23
19
  }): Scorer;
24
20
  export declare function all(...scorers: Scorer[]): Scorer;
25
21
  export declare function any(...scorers: Scorer[]): Scorer;
@@ -1 +1 @@
1
- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/scorers/index.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,eAAe,EAAE,MAAM,kBAAkB,CAAC;AAIxD,MAAM,WAAW,UAAU;IACzB,KAAK,EAAE,OAAO,CAAC;IACf,MAAM,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,OAAO,CAAC;CACpB;AAED,MAAM,WAAW,YAAY;IAC3B,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAED,MAAM,MAAM,MAAM,GAAG,CAAC,IAAI,EAAE,UAAU,KAAK,OAAO,CAAC,YAAY,CAAC,CAAC;AAEjE,eAAO,MAAM,UAAU,EAAE,MAOxB,CAAC;AAEF,eAAO,MAAM,QAAQ,EAAE,MAOtB,CAAC;AAEF,wBAAgB,KAAK,CAAC,OAAO,EAAE,MAAM,GAAG,MAAM,CAI7C;AAuBD,eAAO,MAAM,WAAW,EAAE,MAWzB,CAAC;AA6BF,eAAO,MAAM,SAAS,EAAE,MAUvB,CAAC;AAOF,wBAAgB,QAAQ,CAAC,MAAM,EAAE;IAC/B,KAAK,EAAE,eAAe,CAAC;IACvB,QAAQ,EAAE,MAAM,CAAC;CAClB,GAAG,MAAM,CAgBT;AAED,wBAAgB,UAAU,CAAC,MAAM,EAAE;IAAE,KAAK,EAAE,eAAe,CAAA;CAAE,GAAG,MAAM,CAgBrE;AAED,wBAAgB,GAAG,CAAC,GAAG,OAAO,EAAE,MAAM,EAAE,GAAG,MAAM,CAahD;AAED,wBAAgB,GAAG,CAAC,GAAG,OAAO,EAAE,MAAM,EAAE,GAAG,MAAM,CAShD;AAED,wBAAgB,QAAQ,CACtB,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE;IAAE,MAAM,EAAE,MAAM,CAAC;IAAC,MAAM,EAAE,MAAM,CAAA;CAAE,CAAC,GACzD,MAAM,CAqBR"}
1
+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/scorers/index.ts"],"names":[],"mappings":"AAKA,MAAM,WAAW,UAAU;IACzB,KAAK,EAAE,OAAO,CAAC;IACf,MAAM,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,OAAO,CAAC;CACpB;AAED,MAAM,WAAW,YAAY;IAC3B,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;CACpC;AAED,MAAM,MAAM,MAAM,GAAG,CAAC,IAAI,EAAE,UAAU,KAAK,OAAO,CAAC,YAAY,CAAC,CAAC;AAEjE,eAAO,MAAM,UAAU,EAAE,MAOxB,CAAC;AAEF,eAAO,MAAM,QAAQ,EAAE,MAOtB,CAAC;AAEF,wBAAgB,KAAK,CAAC,OAAO,EAAE,MAAM,GAAG,MAAM,CAI7C;AAwBD,eAAO,MAAM,WAAW,EAAE,MASzB,CAAC;AA6BF,eAAO,MAAM,SAAS,EAAE,MAUvB,CAAC;AAEF,wBAAgB,UAAU,CAAC,MAAM,EAAE;IAAE,KAAK,EAAE,MAAM,CAAA;CAAE,GAAG,MAAM,CAc5D;AAED,wBAAgB,GAAG,CAAC,GAAG,OAAO,EAAE,MAAM,EAAE,GAAG,MAAM,CAahD;AAED,wBAAgB,GAAG,CAAC,GAAG,OAAO,EAAE,MAAM,EAAE,GAAG,MAAM,CAShD;AAED,wBAAgB,QAAQ,CACtB,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE;IAAE,MAAM,EAAE,MAAM,CAAC;IAAC,MAAM,EAAE,MAAM,CAAA;CAAE,CAAC,GACzD,MAAM,CAqBR"}
@@ -1,6 +1,8 @@
1
1
  // packages/evals/src/scorers/index.ts
2
- import { generateObject } from "ai";
3
- import { z } from "zod";
2
+ import {
3
+ Factuality as AutoevalsFactuality,
4
+ Levenshtein as AutoevalsLevenshtein
5
+ } from "autoevals";
4
6
  var exactMatch = async ({ output, expected }) => {
5
7
  const exp = expected == null ? "" : String(expected);
6
8
  if (output === exp) return { score: 1 };
@@ -22,32 +24,32 @@ function regex(pattern) {
22
24
  return { score: pattern.test(output) ? 1 : 0 };
23
25
  };
24
26
  }
25
- function levenshteinDistance(a, b) {
26
- if (a.length === 0) return b.length;
27
- if (b.length === 0) return a.length;
28
- if (a.length > b.length) [a, b] = [b, a];
29
- let prev = Array.from({ length: a.length + 1 }, (_, i) => i);
30
- let curr = new Array(a.length + 1);
31
- for (let j = 1; j <= b.length; j++) {
32
- curr[0] = j;
33
- for (let i = 1; i <= a.length; i++) {
34
- const cost = a[i - 1] === b[j - 1] ? 0 : 1;
35
- curr[i] = Math.min(prev[i] + 1, curr[i - 1] + 1, prev[i - 1] + cost);
27
+ function normalizeScore(score) {
28
+ if (typeof score !== "number" || !Number.isFinite(score)) return 0;
29
+ return Math.max(0, Math.min(1, score));
30
+ }
31
+ function reasonFromMetadata(metadata) {
32
+ if (!metadata) return void 0;
33
+ const candidates = [
34
+ metadata.reason,
35
+ metadata.rationale,
36
+ metadata.explanation
37
+ ];
38
+ for (const candidate of candidates) {
39
+ if (typeof candidate === "string" && candidate.trim().length > 0) {
40
+ return candidate;
36
41
  }
37
- [prev, curr] = [curr, prev];
38
42
  }
39
- return prev[a.length];
43
+ return void 0;
40
44
  }
41
45
  var levenshtein = async ({ output, expected }) => {
42
46
  const exp = expected == null ? "" : String(expected);
43
- if (output.length === 0 && exp.length === 0) return { score: 1 };
44
- const maxLen = Math.max(output.length, exp.length);
45
- const distance = levenshteinDistance(output, exp);
46
- const score = Math.max(0, 1 - distance / maxLen);
47
- if (score === 1) return { score };
47
+ const result = await AutoevalsLevenshtein({ output, expected: exp });
48
+ const score = normalizeScore(result.score);
48
49
  return {
49
50
  score,
50
- reason: `Levenshtein distance is ${distance} across max length ${maxLen}.`
51
+ reason: reasonFromMetadata(result.metadata),
52
+ metadata: result.metadata
51
53
  };
52
54
  };
53
55
  function deepEqual(a, b) {
@@ -81,42 +83,19 @@ var jsonMatch = async ({ output, expected }) => {
81
83
  return { score: 0, reason: "Failed to parse JSON" };
82
84
  }
83
85
  };
84
- var llmScorerSchema = z.object({
85
- score: z.number().min(0).max(1),
86
- reason: z.string()
87
- });
88
- function llmJudge(config) {
89
- return async ({ input, output, expected }) => {
90
- const { object } = await generateObject({
91
- model: config.model,
92
- schema: llmScorerSchema,
93
- prompt: `You are an expert evaluator. Grade the output based on the following criteria:
94
- ${config.criteria}
95
-
96
- Input: ${JSON.stringify(input)}
97
- Output: ${output}
98
- ${expected != null ? `Expected: ${JSON.stringify(expected)}` : ""}
99
-
100
- Return a score from 0.0 to 1.0 and a brief reason.`
101
- });
102
- return { score: object.score, reason: object.reason };
103
- };
104
- }
105
86
  function factuality(config) {
106
87
  return async ({ input, output, expected }) => {
107
- const { object } = await generateObject({
88
+ const result = await AutoevalsFactuality({
108
89
  model: config.model,
109
- schema: llmScorerSchema,
110
- prompt: `You are a factuality evaluator. Determine whether the output is factually consistent with the expected reference.
111
-
112
- Input: ${JSON.stringify(input)}
113
- Output: ${output}
114
- Expected reference: ${JSON.stringify(expected)}
115
-
116
- Score 1.0 if the output is factually consistent with the reference, 0.0 if it contradicts it. Use intermediate scores for partial consistency.
117
- Return a score from 0.0 to 1.0 and a brief reason.`
90
+ input: typeof input === "string" ? input : JSON.stringify(input),
91
+ output,
92
+ expected: expected == null ? void 0 : String(expected)
118
93
  });
119
- return { score: object.score, reason: object.reason };
94
+ return {
95
+ score: normalizeScore(result.score),
96
+ reason: reasonFromMetadata(result.metadata),
97
+ metadata: result.metadata
98
+ };
120
99
  };
121
100
  }
122
101
  function all(...scorers) {
@@ -168,7 +147,6 @@ export {
168
147
  includes,
169
148
  jsonMatch,
170
149
  levenshtein,
171
- llmJudge,
172
150
  regex,
173
151
  weighted
174
152
  };
@@ -1,7 +1,7 @@
1
1
  {
2
2
  "version": 3,
3
3
  "sources": ["../../src/scorers/index.ts"],
4
- "sourcesContent": ["import type { LanguageModelV3 } from '@ai-sdk/provider';\nimport { generateObject } from 'ai';\nimport { z } from 'zod';\n\nexport interface ScorerArgs {\n input: unknown;\n output: string;\n expected?: unknown;\n}\n\nexport interface ScorerResult {\n score: number;\n reason?: string;\n}\n\nexport type Scorer = (args: ScorerArgs) => Promise<ScorerResult>;\n\nexport const exactMatch: Scorer = async ({ output, expected }) => {\n const exp = expected == null ? '' : String(expected);\n if (output === exp) return { score: 1.0 };\n return {\n score: 0.0,\n reason: `Output does not exactly match expected. Expected \"${exp}\" but got \"${output}\".`,\n };\n};\n\nexport const includes: Scorer = async ({ output, expected }) => {\n const exp = expected == null ? '' : String(expected);\n if (output.includes(exp)) return { score: 1.0 };\n return {\n score: 0.0,\n reason: `Output does not include expected substring \"${exp}\".`,\n };\n};\n\nexport function regex(pattern: RegExp): Scorer {\n return async ({ output }) => {\n return { score: pattern.test(output) ? 1.0 : 0.0 };\n };\n}\n\nfunction levenshteinDistance(a: string, b: string): number {\n if (a.length === 0) return b.length;\n if (b.length === 0) return a.length;\n\n if (a.length > b.length) [a, b] = [b, a];\n\n let prev = Array.from({ length: a.length + 1 }, (_, i) => i);\n let curr = new Array<number>(a.length + 1);\n\n for (let j = 1; j <= b.length; j++) {\n curr[0] = j;\n for (let i = 1; i <= a.length; i++) {\n const cost = a[i - 1] === b[j - 1] ? 0 : 1;\n curr[i] = Math.min(prev[i]! + 1, curr[i - 1]! + 1, prev[i - 1]! + cost);\n }\n [prev, curr] = [curr, prev];\n }\n\n return prev[a.length]!;\n}\n\nexport const levenshtein: Scorer = async ({ output, expected }) => {\n const exp = expected == null ? '' : String(expected);\n if (output.length === 0 && exp.length === 0) return { score: 1.0 };\n const maxLen = Math.max(output.length, exp.length);\n const distance = levenshteinDistance(output, exp);\n const score = Math.max(0, 1 - distance / maxLen);\n if (score === 1.0) return { score };\n return {\n score,\n reason: `Levenshtein distance is ${distance} across max length ${maxLen}.`,\n };\n};\n\nfunction deepEqual(a: unknown, b: unknown): boolean {\n if (a === b) return true;\n if (a == null || b == null) return false;\n if (typeof a !== typeof b) return false;\n\n if (Array.isArray(a)) {\n if (!Array.isArray(b) || a.length !== b.length) return false;\n return a.every((val, i) => deepEqual(val, b[i]));\n }\n\n if (typeof a === 'object') {\n const keysA = Object.keys(a as Record<string, unknown>).sort();\n const keysB = Object.keys(b as Record<string, unknown>).sort();\n if (keysA.length !== keysB.length) return false;\n return keysA.every(\n (key, i) =>\n keysB[i] === key &&\n deepEqual(\n (a as Record<string, unknown>)[key],\n (b as Record<string, unknown>)[key],\n ),\n );\n }\n\n return false;\n}\n\nexport const jsonMatch: Scorer = async ({ output, expected }) => {\n try {\n const parsedOutput = JSON.parse(output);\n const parsedExpected =\n typeof expected === 'string' ? JSON.parse(expected) : expected;\n if (deepEqual(parsedOutput, parsedExpected)) return { score: 1.0 };\n return { score: 0.0, reason: 'JSON payload differs from expected JSON.' };\n } catch {\n return { score: 0.0, reason: 'Failed to parse JSON' };\n }\n};\n\nconst llmScorerSchema = z.object({\n score: z.number().min(0).max(1),\n reason: z.string(),\n});\n\nexport function llmJudge(config: {\n model: LanguageModelV3;\n criteria: string;\n}): Scorer {\n return async ({ input, output, expected }) => {\n const { object } = await generateObject({\n model: config.model,\n schema: llmScorerSchema,\n prompt: `You are an expert evaluator. Grade the output based on the following criteria:\n${config.criteria}\n\nInput: ${JSON.stringify(input)}\nOutput: ${output}\n${expected != null ? `Expected: ${JSON.stringify(expected)}` : ''}\n\nReturn a score from 0.0 to 1.0 and a brief reason.`,\n });\n return { score: object.score, reason: object.reason };\n };\n}\n\nexport function factuality(config: { model: LanguageModelV3 }): Scorer {\n return async ({ input, output, expected }) => {\n const { object } = await generateObject({\n model: config.model,\n schema: llmScorerSchema,\n prompt: `You are a factuality evaluator. Determine whether the output is factually consistent with the expected reference.\n\nInput: ${JSON.stringify(input)}\nOutput: ${output}\nExpected reference: ${JSON.stringify(expected)}\n\nScore 1.0 if the output is factually consistent with the reference, 0.0 if it contradicts it. Use intermediate scores for partial consistency.\nReturn a score from 0.0 to 1.0 and a brief reason.`,\n });\n return { score: object.score, reason: object.reason };\n };\n}\n\nexport function all(...scorers: Scorer[]): Scorer {\n return async (args) => {\n if (scorers.length === 0) return { score: 1.0 };\n const results = await Promise.all(scorers.map((s) => s(args)));\n const minResult = results.reduce((min, r) =>\n r.score < min.score ? r : min,\n );\n const reasons = results\n .filter((r) => r.reason)\n .map((r) => r.reason)\n .join('; ');\n return { score: minResult.score, reason: reasons || undefined };\n };\n}\n\nexport function any(...scorers: Scorer[]): Scorer {\n return async (args) => {\n if (scorers.length === 0) return { score: 0.0 };\n const results = await Promise.all(scorers.map((s) => s(args)));\n const maxResult = results.reduce((max, r) =>\n r.score > max.score ? r : max,\n );\n return { score: maxResult.score, reason: maxResult.reason };\n };\n}\n\nexport function weighted(\n config: Record<string, { scorer: Scorer; weight: number }>,\n): Scorer {\n return async (args) => {\n const entries = Object.entries(config);\n const results = await Promise.all(\n entries.map(async ([name, { scorer, weight }]) => ({\n name,\n result: await scorer(args),\n weight,\n })),\n );\n const totalWeight = results.reduce((sum, r) => sum + r.weight, 0);\n const weightedScore = results.reduce(\n (sum, r) => sum + r.result.score * r.weight,\n 0,\n );\n const score = totalWeight > 0 ? weightedScore / totalWeight : 0;\n const reasons = results\n .map((r) => `${r.name}: ${r.result.score.toFixed(2)} (w=${r.weight})`)\n .join(', ');\n return { score, reason: reasons || undefined };\n };\n}\n"],
5
- "mappings": ";AACA,SAAS,sBAAsB;AAC/B,SAAS,SAAS;AAeX,IAAM,aAAqB,OAAO,EAAE,QAAQ,SAAS,MAAM;AAChE,QAAM,MAAM,YAAY,OAAO,KAAK,OAAO,QAAQ;AACnD,MAAI,WAAW,IAAK,QAAO,EAAE,OAAO,EAAI;AACxC,SAAO;AAAA,IACL,OAAO;AAAA,IACP,QAAQ,qDAAqD,GAAG,cAAc,MAAM;AAAA,EACtF;AACF;AAEO,IAAM,WAAmB,OAAO,EAAE,QAAQ,SAAS,MAAM;AAC9D,QAAM,MAAM,YAAY,OAAO,KAAK,OAAO,QAAQ;AACnD,MAAI,OAAO,SAAS,GAAG,EAAG,QAAO,EAAE,OAAO,EAAI;AAC9C,SAAO;AAAA,IACL,OAAO;AAAA,IACP,QAAQ,+CAA+C,GAAG;AAAA,EAC5D;AACF;AAEO,SAAS,MAAM,SAAyB;AAC7C,SAAO,OAAO,EAAE,OAAO,MAAM;AAC3B,WAAO,EAAE,OAAO,QAAQ,KAAK,MAAM,IAAI,IAAM,EAAI;AAAA,EACnD;AACF;AAEA,SAAS,oBAAoB,GAAW,GAAmB;AACzD,MAAI,EAAE,WAAW,EAAG,QAAO,EAAE;AAC7B,MAAI,EAAE,WAAW,EAAG,QAAO,EAAE;AAE7B,MAAI,EAAE,SAAS,EAAE,OAAQ,EAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC;AAEvC,MAAI,OAAO,MAAM,KAAK,EAAE,QAAQ,EAAE,SAAS,EAAE,GAAG,CAAC,GAAG,MAAM,CAAC;AAC3D,MAAI,OAAO,IAAI,MAAc,EAAE,SAAS,CAAC;AAEzC,WAAS,IAAI,GAAG,KAAK,EAAE,QAAQ,KAAK;AAClC,SAAK,CAAC,IAAI;AACV,aAAS,IAAI,GAAG,KAAK,EAAE,QAAQ,KAAK;AAClC,YAAM,OAAO,EAAE,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,IAAI,IAAI;AACzC,WAAK,CAAC,IAAI,KAAK,IAAI,KAAK,CAAC,IAAK,GAAG,KAAK,IAAI,CAAC,IAAK,GAAG,KAAK,IAAI,CAAC,IAAK,IAAI;AAAA,IACxE;AACA,KAAC,MAAM,IAAI,IAAI,CAAC,MAAM,IAAI;AAAA,EAC5B;AAEA,SAAO,KAAK,EAAE,MAAM;AACtB;AAEO,IAAM,cAAsB,OAAO,EAAE,QAAQ,SAAS,MAAM;AACjE,QAAM,MAAM,YAAY,OAAO,KAAK,OAAO,QAAQ;AACnD,MAAI,OAAO,WAAW,KAAK,IAAI,WAAW,EAAG,QAAO,EAAE,OAAO,EAAI;AACjE,QAAM,SAAS,KAAK,IAAI,OAAO,QAAQ,IAAI,MAAM;AACjD,QAAM,WAAW,oBAAoB,QAAQ,GAAG;AAChD,QAAM,QAAQ,KAAK,IAAI,GAAG,IAAI,WAAW,MAAM;AAC/C,MAAI,UAAU,EAAK,QAAO,EAAE,MAAM;AAClC,SAAO;AAAA,IACL;AAAA,IACA,QAAQ,2BAA2B,QAAQ,sBAAsB,MAAM;AAAA,EACzE;AACF;AAEA,SAAS,UAAU,GAAY,GAAqB;AAClD,MAAI,MAAM,EAAG,QAAO;AACpB,MAAI,KAAK,QAAQ,KAAK,KAAM,QAAO;AACnC,MAAI,OAAO,MAAM,OAAO,EAAG,QAAO;AAElC,MAAI,MAAM,QAAQ,CAAC,GAAG;AACpB,QAAI,CAAC,MAAM,QAAQ,CAAC,KAAK,EAAE,WAAW,EAAE,OAAQ,QAAO;AACvD,WAAO,EAAE,MAAM,CAAC,KAAK,MAAM,UAAU,KAAK,EAAE,CAAC,CAAC,CAAC;AAAA,EACjD;AAEA,MAAI,OAAO,MAAM,UAAU;AACzB,UAAM,QAAQ,OAAO,KAAK,CAA4B,EAAE,KAAK;AAC7D,UAAM,QAAQ,OAAO,KAAK,CAA4B,EAAE,KAAK;AAC7D,QAAI,MAAM,WAAW,MAAM,OAAQ,QAAO;AAC1C,WAAO,MAAM;AAAA,MACX,CAAC,KAAK,MACJ,MAAM,CAAC,MAAM,OACb;AAAA,QACG,EAA8B,GAAG;AAAA,QACjC,EAA8B,GAAG;AAAA,MACpC;AAAA,IACJ;AAAA,EACF;AAEA,SAAO;AACT;AAEO,IAAM,YAAoB,OAAO,EAAE,QAAQ,SAAS,MAAM;AAC/D,MAAI;AACF,UAAM,eAAe,KAAK,MAAM,MAAM;AACtC,UAAM,iBACJ,OAAO,aAAa,WAAW,KAAK,MAAM,QAAQ,IAAI;AACxD,QAAI,UAAU,cAAc,cAAc,EAAG,QAAO,EAAE,OAAO,EAAI;AACjE,WAAO,EAAE,OAAO,GAAK,QAAQ,2CAA2C;AAAA,EAC1E,QAAQ;AACN,WAAO,EAAE,OAAO,GAAK,QAAQ,uBAAuB;AAAA,EACtD;AACF;AAEA,IAAM,kBAAkB,EAAE,OAAO;AAAA,EAC/B,OAAO,EAAE,OAAO,EAAE,IAAI,CAAC,EAAE,IAAI,CAAC;AAAA,EAC9B,QAAQ,EAAE,OAAO;AACnB,CAAC;AAEM,SAAS,SAAS,QAGd;AACT,SAAO,OAAO,EAAE,OAAO,QAAQ,SAAS,MAAM;AAC5C,UAAM,EAAE,OAAO,IAAI,MAAM,eAAe;AAAA,MACtC,OAAO,OAAO;AAAA,MACd,QAAQ;AAAA,MACR,QAAQ;AAAA,EACZ,OAAO,QAAQ;AAAA;AAAA,SAER,KAAK,UAAU,KAAK,CAAC;AAAA,UACpB,MAAM;AAAA,EACd,YAAY,OAAO,aAAa,KAAK,UAAU,QAAQ,CAAC,KAAK,EAAE;AAAA;AAAA;AAAA,IAG7D,CAAC;AACD,WAAO,EAAE,OAAO,OAAO,OAAO,QAAQ,OAAO,OAAO;AAAA,EACtD;AACF;AAEO,SAAS,WAAW,QAA4C;AACrE,SAAO,OAAO,EAAE,OAAO,QAAQ,SAAS,MAAM;AAC5C,UAAM,EAAE,OAAO,IAAI,MAAM,eAAe;AAAA,MACtC,OAAO,OAAO;AAAA,MACd,QAAQ;AAAA,MACR,QAAQ;AAAA;AAAA,SAEL,KAAK,UAAU,KAAK,CAAC;AAAA,UACpB,MAAM;AAAA,sBACM,KAAK,UAAU,QAAQ,CAAC;AAAA;AAAA;AAAA;AAAA,IAI1C,CAAC;AACD,WAAO,EAAE,OAAO,OAAO,OAAO,QAAQ,OAAO,OAAO;AAAA,EACtD;AACF;AAEO,SAAS,OAAO,SAA2B;AAChD,SAAO,OAAO,SAAS;AACrB,QAAI,QAAQ,WAAW,EAAG,QAAO,EAAE,OAAO,EAAI;AAC9C,UAAM,UAAU,MAAM,QAAQ,IAAI,QAAQ,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,CAAC;AAC7D,UAAM,YAAY,QAAQ;AAAA,MAAO,CAAC,KAAK,MACrC,EAAE,QAAQ,IAAI,QAAQ,IAAI;AAAA,IAC5B;AACA,UAAM,UAAU,QACb,OAAO,CAAC,MAAM,EAAE,MAAM,EACtB,IAAI,CAAC,MAAM,EAAE,MAAM,EACnB,KAAK,IAAI;AACZ,WAAO,EAAE,OAAO,UAAU,OAAO,QAAQ,WAAW,OAAU;AAAA,EAChE;AACF;AAEO,SAAS,OAAO,SAA2B;AAChD,SAAO,OAAO,SAAS;AACrB,QAAI,QAAQ,WAAW,EAAG,QAAO,EAAE,OAAO,EAAI;AAC9C,UAAM,UAAU,MAAM,QAAQ,IAAI,QAAQ,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,CAAC;AAC7D,UAAM,YAAY,QAAQ;AAAA,MAAO,CAAC,KAAK,MACrC,EAAE,QAAQ,IAAI,QAAQ,IAAI;AAAA,IAC5B;AACA,WAAO,EAAE,OAAO,UAAU,OAAO,QAAQ,UAAU,OAAO;AAAA,EAC5D;AACF;AAEO,SAAS,SACd,QACQ;AACR,SAAO,OAAO,SAAS;AACrB,UAAM,UAAU,OAAO,QAAQ,MAAM;AACrC,UAAM,UAAU,MAAM,QAAQ;AAAA,MAC5B,QAAQ,IAAI,OAAO,CAAC,MAAM,EAAE,QAAQ,OAAO,CAAC,OAAO;AAAA,QACjD;AAAA,QACA,QAAQ,MAAM,OAAO,IAAI;AAAA,QACzB;AAAA,MACF,EAAE;AAAA,IACJ;AACA,UAAM,cAAc,QAAQ,OAAO,CAAC,KAAK,MAAM,MAAM,EAAE,QAAQ,CAAC;AAChE,UAAM,gBAAgB,QAAQ;AAAA,MAC5B,CAAC,KAAK,MAAM,MAAM,EAAE,OAAO,QAAQ,EAAE;AAAA,MACrC;AAAA,IACF;AACA,UAAM,QAAQ,cAAc,IAAI,gBAAgB,cAAc;AAC9D,UAAM,UAAU,QACb,IAAI,CAAC,MAAM,GAAG,EAAE,IAAI,KAAK,EAAE,OAAO,MAAM,QAAQ,CAAC,CAAC,OAAO,EAAE,MAAM,GAAG,EACpE,KAAK,IAAI;AACZ,WAAO,EAAE,OAAO,QAAQ,WAAW,OAAU;AAAA,EAC/C;AACF;",
4
+ "sourcesContent": ["import {\n Factuality as AutoevalsFactuality,\n Levenshtein as AutoevalsLevenshtein,\n} from 'autoevals';\n\nexport interface ScorerArgs {\n input: unknown;\n output: string;\n expected?: unknown;\n}\n\nexport interface ScorerResult {\n score: number;\n reason?: string;\n metadata?: Record<string, unknown>;\n}\n\nexport type Scorer = (args: ScorerArgs) => Promise<ScorerResult>;\n\nexport const exactMatch: Scorer = async ({ output, expected }) => {\n const exp = expected == null ? '' : String(expected);\n if (output === exp) return { score: 1.0 };\n return {\n score: 0.0,\n reason: `Output does not exactly match expected. Expected \"${exp}\" but got \"${output}\".`,\n };\n};\n\nexport const includes: Scorer = async ({ output, expected }) => {\n const exp = expected == null ? '' : String(expected);\n if (output.includes(exp)) return { score: 1.0 };\n return {\n score: 0.0,\n reason: `Output does not include expected substring \"${exp}\".`,\n };\n};\n\nexport function regex(pattern: RegExp): Scorer {\n return async ({ output }) => {\n return { score: pattern.test(output) ? 1.0 : 0.0 };\n };\n}\n\nfunction normalizeScore(score: number | null | undefined): number {\n if (typeof score !== 'number' || !Number.isFinite(score)) return 0;\n return Math.max(0, Math.min(1, score));\n}\n\nfunction reasonFromMetadata(\n metadata?: Record<string, unknown>,\n): string | undefined {\n if (!metadata) return undefined;\n const candidates = [\n metadata.reason,\n metadata.rationale,\n metadata.explanation,\n ];\n for (const candidate of candidates) {\n if (typeof candidate === 'string' && candidate.trim().length > 0) {\n return candidate;\n }\n }\n return undefined;\n}\n\nexport const levenshtein: Scorer = async ({ output, expected }) => {\n const exp = expected == null ? '' : String(expected);\n const result = await AutoevalsLevenshtein({ output, expected: exp });\n const score = normalizeScore(result.score);\n return {\n score,\n reason: reasonFromMetadata(result.metadata),\n metadata: result.metadata,\n };\n};\n\nfunction deepEqual(a: unknown, b: unknown): boolean {\n if (a === b) return true;\n if (a == null || b == null) return false;\n if (typeof a !== typeof b) return false;\n\n if (Array.isArray(a)) {\n if (!Array.isArray(b) || a.length !== b.length) return false;\n return a.every((val, i) => deepEqual(val, b[i]));\n }\n\n if (typeof a === 'object') {\n const keysA = Object.keys(a as Record<string, unknown>).sort();\n const keysB = Object.keys(b as Record<string, unknown>).sort();\n if (keysA.length !== keysB.length) return false;\n return keysA.every(\n (key, i) =>\n keysB[i] === key &&\n deepEqual(\n (a as Record<string, unknown>)[key],\n (b as Record<string, unknown>)[key],\n ),\n );\n }\n\n return false;\n}\n\nexport const jsonMatch: Scorer = async ({ output, expected }) => {\n try {\n const parsedOutput = JSON.parse(output);\n const parsedExpected =\n typeof expected === 'string' ? JSON.parse(expected) : expected;\n if (deepEqual(parsedOutput, parsedExpected)) return { score: 1.0 };\n return { score: 0.0, reason: 'JSON payload differs from expected JSON.' };\n } catch {\n return { score: 0.0, reason: 'Failed to parse JSON' };\n }\n};\n\nexport function factuality(config: { model: string }): Scorer {\n return async ({ input, output, expected }) => {\n const result = await AutoevalsFactuality({\n model: config.model,\n input: typeof input === 'string' ? input : JSON.stringify(input),\n output,\n expected: expected == null ? undefined : String(expected),\n });\n return {\n score: normalizeScore(result.score),\n reason: reasonFromMetadata(result.metadata),\n metadata: result.metadata,\n };\n };\n}\n\nexport function all(...scorers: Scorer[]): Scorer {\n return async (args) => {\n if (scorers.length === 0) return { score: 1.0 };\n const results = await Promise.all(scorers.map((s) => s(args)));\n const minResult = results.reduce((min, r) =>\n r.score < min.score ? r : min,\n );\n const reasons = results\n .filter((r) => r.reason)\n .map((r) => r.reason)\n .join('; ');\n return { score: minResult.score, reason: reasons || undefined };\n };\n}\n\nexport function any(...scorers: Scorer[]): Scorer {\n return async (args) => {\n if (scorers.length === 0) return { score: 0.0 };\n const results = await Promise.all(scorers.map((s) => s(args)));\n const maxResult = results.reduce((max, r) =>\n r.score > max.score ? r : max,\n );\n return { score: maxResult.score, reason: maxResult.reason };\n };\n}\n\nexport function weighted(\n config: Record<string, { scorer: Scorer; weight: number }>,\n): Scorer {\n return async (args) => {\n const entries = Object.entries(config);\n const results = await Promise.all(\n entries.map(async ([name, { scorer, weight }]) => ({\n name,\n result: await scorer(args),\n weight,\n })),\n );\n const totalWeight = results.reduce((sum, r) => sum + r.weight, 0);\n const weightedScore = results.reduce(\n (sum, r) => sum + r.result.score * r.weight,\n 0,\n );\n const score = totalWeight > 0 ? weightedScore / totalWeight : 0;\n const reasons = results\n .map((r) => `${r.name}: ${r.result.score.toFixed(2)} (w=${r.weight})`)\n .join(', ');\n return { score, reason: reasons || undefined };\n };\n}\n"],
5
+ "mappings": ";AAAA;AAAA,EACE,cAAc;AAAA,EACd,eAAe;AAAA,OACV;AAgBA,IAAM,aAAqB,OAAO,EAAE,QAAQ,SAAS,MAAM;AAChE,QAAM,MAAM,YAAY,OAAO,KAAK,OAAO,QAAQ;AACnD,MAAI,WAAW,IAAK,QAAO,EAAE,OAAO,EAAI;AACxC,SAAO;AAAA,IACL,OAAO;AAAA,IACP,QAAQ,qDAAqD,GAAG,cAAc,MAAM;AAAA,EACtF;AACF;AAEO,IAAM,WAAmB,OAAO,EAAE,QAAQ,SAAS,MAAM;AAC9D,QAAM,MAAM,YAAY,OAAO,KAAK,OAAO,QAAQ;AACnD,MAAI,OAAO,SAAS,GAAG,EAAG,QAAO,EAAE,OAAO,EAAI;AAC9C,SAAO;AAAA,IACL,OAAO;AAAA,IACP,QAAQ,+CAA+C,GAAG;AAAA,EAC5D;AACF;AAEO,SAAS,MAAM,SAAyB;AAC7C,SAAO,OAAO,EAAE,OAAO,MAAM;AAC3B,WAAO,EAAE,OAAO,QAAQ,KAAK,MAAM,IAAI,IAAM,EAAI;AAAA,EACnD;AACF;AAEA,SAAS,eAAe,OAA0C;AAChE,MAAI,OAAO,UAAU,YAAY,CAAC,OAAO,SAAS,KAAK,EAAG,QAAO;AACjE,SAAO,KAAK,IAAI,GAAG,KAAK,IAAI,GAAG,KAAK,CAAC;AACvC;AAEA,SAAS,mBACP,UACoB;AACpB,MAAI,CAAC,SAAU,QAAO;AACtB,QAAM,aAAa;AAAA,IACjB,SAAS;AAAA,IACT,SAAS;AAAA,IACT,SAAS;AAAA,EACX;AACA,aAAW,aAAa,YAAY;AAClC,QAAI,OAAO,cAAc,YAAY,UAAU,KAAK,EAAE,SAAS,GAAG;AAChE,aAAO;AAAA,IACT;AAAA,EACF;AACA,SAAO;AACT;AAEO,IAAM,cAAsB,OAAO,EAAE,QAAQ,SAAS,MAAM;AACjE,QAAM,MAAM,YAAY,OAAO,KAAK,OAAO,QAAQ;AACnD,QAAM,SAAS,MAAM,qBAAqB,EAAE,QAAQ,UAAU,IAAI,CAAC;AACnE,QAAM,QAAQ,eAAe,OAAO,KAAK;AACzC,SAAO;AAAA,IACL;AAAA,IACA,QAAQ,mBAAmB,OAAO,QAAQ;AAAA,IAC1C,UAAU,OAAO;AAAA,EACnB;AACF;AAEA,SAAS,UAAU,GAAY,GAAqB;AAClD,MAAI,MAAM,EAAG,QAAO;AACpB,MAAI,KAAK,QAAQ,KAAK,KAAM,QAAO;AACnC,MAAI,OAAO,MAAM,OAAO,EAAG,QAAO;AAElC,MAAI,MAAM,QAAQ,CAAC,GAAG;AACpB,QAAI,CAAC,MAAM,QAAQ,CAAC,KAAK,EAAE,WAAW,EAAE,OAAQ,QAAO;AACvD,WAAO,EAAE,MAAM,CAAC,KAAK,MAAM,UAAU,KAAK,EAAE,CAAC,CAAC,CAAC;AAAA,EACjD;AAEA,MAAI,OAAO,MAAM,UAAU;AACzB,UAAM,QAAQ,OAAO,KAAK,CAA4B,EAAE,KAAK;AAC7D,UAAM,QAAQ,OAAO,KAAK,CAA4B,EAAE,KAAK;AAC7D,QAAI,MAAM,WAAW,MAAM,OAAQ,QAAO;AAC1C,WAAO,MAAM;AAAA,MACX,CAAC,KAAK,MACJ,MAAM,CAAC,MAAM,OACb;AAAA,QACG,EAA8B,GAAG;AAAA,QACjC,EAA8B,GAAG;AAAA,MACpC;AAAA,IACJ;AAAA,EACF;AAEA,SAAO;AACT;AAEO,IAAM,YAAoB,OAAO,EAAE,QAAQ,SAAS,MAAM;AAC/D,MAAI;AACF,UAAM,eAAe,KAAK,MAAM,MAAM;AACtC,UAAM,iBACJ,OAAO,aAAa,WAAW,KAAK,MAAM,QAAQ,IAAI;AACxD,QAAI,UAAU,cAAc,cAAc,EAAG,QAAO,EAAE,OAAO,EAAI;AACjE,WAAO,EAAE,OAAO,GAAK,QAAQ,2CAA2C;AAAA,EAC1E,QAAQ;AACN,WAAO,EAAE,OAAO,GAAK,QAAQ,uBAAuB;AAAA,EACtD;AACF;AAEO,SAAS,WAAW,QAAmC;AAC5D,SAAO,OAAO,EAAE,OAAO,QAAQ,SAAS,MAAM;AAC5C,UAAM,SAAS,MAAM,oBAAoB;AAAA,MACvC,OAAO,OAAO;AAAA,MACd,OAAO,OAAO,UAAU,WAAW,QAAQ,KAAK,UAAU,KAAK;AAAA,MAC/D;AAAA,MACA,UAAU,YAAY,OAAO,SAAY,OAAO,QAAQ;AAAA,IAC1D,CAAC;AACD,WAAO;AAAA,MACL,OAAO,eAAe,OAAO,KAAK;AAAA,MAClC,QAAQ,mBAAmB,OAAO,QAAQ;AAAA,MAC1C,UAAU,OAAO;AAAA,IACnB;AAAA,EACF;AACF;AAEO,SAAS,OAAO,SAA2B;AAChD,SAAO,OAAO,SAAS;AACrB,QAAI,QAAQ,WAAW,EAAG,QAAO,EAAE,OAAO,EAAI;AAC9C,UAAM,UAAU,MAAM,QAAQ,IAAI,QAAQ,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,CAAC;AAC7D,UAAM,YAAY,QAAQ;AAAA,MAAO,CAAC,KAAK,MACrC,EAAE,QAAQ,IAAI,QAAQ,IAAI;AAAA,IAC5B;AACA,UAAM,UAAU,QACb,OAAO,CAAC,MAAM,EAAE,MAAM,EACtB,IAAI,CAAC,MAAM,EAAE,MAAM,EACnB,KAAK,IAAI;AACZ,WAAO,EAAE,OAAO,UAAU,OAAO,QAAQ,WAAW,OAAU;AAAA,EAChE;AACF;AAEO,SAAS,OAAO,SAA2B;AAChD,SAAO,OAAO,SAAS;AACrB,QAAI,QAAQ,WAAW,EAAG,QAAO,EAAE,OAAO,EAAI;AAC9C,UAAM,UAAU,MAAM,QAAQ,IAAI,QAAQ,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,CAAC;AAC7D,UAAM,YAAY,QAAQ;AAAA,MAAO,CAAC,KAAK,MACrC,EAAE,QAAQ,IAAI,QAAQ,IAAI;AAAA,IAC5B;AACA,WAAO,EAAE,OAAO,UAAU,OAAO,QAAQ,UAAU,OAAO;AAAA,EAC5D;AACF;AAEO,SAAS,SACd,QACQ;AACR,SAAO,OAAO,SAAS;AACrB,UAAM,UAAU,OAAO,QAAQ,MAAM;AACrC,UAAM,UAAU,MAAM,QAAQ;AAAA,MAC5B,QAAQ,IAAI,OAAO,CAAC,MAAM,EAAE,QAAQ,OAAO,CAAC,OAAO;AAAA,QACjD;AAAA,QACA,QAAQ,MAAM,OAAO,IAAI;AAAA,QACzB;AAAA,MACF,EAAE;AAAA,IACJ;AACA,UAAM,cAAc,QAAQ,OAAO,CAAC,KAAK,MAAM,MAAM,EAAE,QAAQ,CAAC;AAChE,UAAM,gBAAgB,QAAQ;AAAA,MAC5B,CAAC,KAAK,MAAM,MAAM,EAAE,OAAO,QAAQ,EAAE;AAAA,MACrC;AAAA,IACF;AACA,UAAM,QAAQ,cAAc,IAAI,gBAAgB,cAAc;AAC9D,UAAM,UAAU,QACb,IAAI,CAAC,MAAM,GAAG,EAAE,IAAI,KAAK,EAAE,OAAO,MAAM,QAAQ,CAAC,CAAC,OAAO,EAAE,MAAM,GAAG,EACpE,KAAK,IAAI;AACZ,WAAO,EAAE,OAAO,QAAQ,WAAW,OAAU;AAAA,EAC/C;AACF;",
6
6
  "names": []
7
7
  }
@@ -80,6 +80,9 @@ export declare class RunStore {
80
80
  #private;
81
81
  constructor(pathOrDb?: string | DatabaseSync);
82
82
  createSuite(name: string): SuiteRow;
83
+ getSuite(id: string): SuiteRow | undefined;
84
+ renameSuite(id: string, name: string): void;
85
+ renameRun(id: string, name: string): void;
83
86
  createRun(run: {
84
87
  suite_id: string;
85
88
  name: string;
@@ -1 +1 @@
1
- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/store/index.ts"],"names":[],"mappings":"AAEA,OAAO,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAI3C,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;IACb,UAAU,EAAE,MAAM,CAAC;CACpB;AAED,MAAM,WAAW,MAAM;IACrB,EAAE,EAAE,MAAM,CAAC;IACX,QAAQ,EAAE,MAAM,CAAC;IACjB,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IACvC,UAAU,EAAE,MAAM,CAAC;IACnB,WAAW,EAAE,MAAM,GAAG,IAAI,CAAC;IAC3B,MAAM,EAAE,SAAS,GAAG,WAAW,GAAG,QAAQ,CAAC;IAC3C,OAAO,EAAE,UAAU,GAAG,IAAI,CAAC;CAC5B;AAED,MAAM,WAAW,OAAO;IACtB,EAAE,EAAE,MAAM,CAAC;IACX,MAAM,EAAE,MAAM,CAAC;IACf,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,OAAO,CAAC;IACf,MAAM,EAAE,MAAM,GAAG,IAAI,CAAC;IACtB,QAAQ,EAAE,OAAO,GAAG,IAAI,CAAC;IACzB,UAAU,EAAE,MAAM,CAAC;IACnB,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC;IACnB,KAAK,EAAE,MAAM,GAAG,IAAI,CAAC;CACtB;AAED,MAAM,WAAW,cAAe,SAAQ,OAAO;IAC7C,MAAM,EAAE,KAAK,CAAC;QAAE,WAAW,EAAE,MAAM,CAAC;QAAC,KAAK,EAAE,MAAM,CAAC;QAAC,MAAM,EAAE,MAAM,GAAG,IAAI,CAAA;KAAE,CAAC,CAAC;CAC9E;AAED,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,OAAO,EAAE,MAAM,CAAC;IAChB,WAAW,EAAE,MAAM,CAAC;IACpB,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,EAAE,MAAM,GAAG,IAAI,CAAC;CACvB;AAED,MAAM,WAAW,UAAU;IACzB,UAAU,EAAE,MAAM,CAAC;IACnB,SAAS,EAAE,MAAM,CAAC;IAClB,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IACnC,cAAc,EAAE,MAAM,CAAC;IACvB,aAAa,EAAE,MAAM,CAAC;IACtB,cAAc,EAAE,MAAM,CAAC;CACxB;AAED,MAAM,WAAW,SAAS;IACxB,EAAE,EAAE,MAAM,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;IACb,OAAO,EAAE,MAAM,CAAC;IAChB,OAAO,EAAE,MAAM,CAAC;IAChB,UAAU,EAAE,MAAM,CAAC;CACpB;AAED,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,MAAM,EAAE,MAAM,CAAC;IACf,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,OAAO,CAAC;IACf,MAAM,EAAE,MAAM,GAAG,IAAI,CAAC;IACtB,QAAQ,CAAC,EAAE,OAAO,CAAC;IACnB,UAAU,EAAE,MAAM,CAAC;IACnB,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC;IACnB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAED,MAAM,WAAW,SAAS;IACxB,EAAE,EAAE,MAAM,CAAC;IACX,OAAO,EAAE,MAAM,CAAC;IAChB,WAAW,EAAE,MAAM,CAAC;IACpB,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAED,qBAAa,QAAQ;;gBAyBP,QAAQ,CAAC,EAAE,MAAM,GAAG,YAAY;IAmH5C,WAAW,CAAC,IAAI,EAAE,MAAM,GAAG,QAAQ;IASnC,SAAS,CAAC,GAAG,EAAE;QACb,QAAQ,EAAE,MAAM,CAAC;QACjB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,EAAE,MAAM,CAAC;QACd,MAAM,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAClC,GAAG,MAAM;IAgBV,SAAS,CACP,KAAK,EAAE,MAAM,EACb,MAAM,EAAE,WAAW,GAAG,QAAQ,EAC9B,OAAO,CAAC,EAAE,UAAU,GACnB,IAAI;IAMP,SAAS,CAAC,KAAK,EAAE,QAAQ,EAAE,GAAG,IAAI;IAsBlC,UAAU,CAAC,MAAM,EAAE,SAAS,EAAE,GAAG,IAAI;IAWrC,MAAM,CAAC,KAAK,EAAE,MAAM,GAAG,MAAM,GAAG,SAAS;IA4BzC,QAAQ,CAAC,OAAO,CAAC,EAAE,MAAM,GAAG,MAAM,EAAE;IA8BpC,QAAQ,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO,EAAE;IA6BlC,eAAe,CAAC,KAAK,EAAE,MAAM,EAAE,SAAS,SAAM,GAAG,cAAc,EAAE;IAmDjE,aAAa,CAAC,KAAK,EAAE,MAAM,EAAE,SAAS,SAAM,GAAG,UAAU;IAuDzD,eAAe,CAAC,IAAI,EAAE,MAAM,GAAG,QAAQ,GAAG,SAAS;IAOnD,qBAAqB,CAAC,OAAO,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,MAAM,GAAG,MAAM,GAAG,SAAS;IAmC1E,UAAU,IAAI,QAAQ,EAAE;IAWxB,YAAY,CAAC,IAAI,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,SAAS;IAetD,WAAW,IAAI,SAAS,EAAE;IAmB1B,SAAS,CAAC,EAAE,EAAE,MAAM,GAAG,SAAS,GAAG,SAAS;IAoB5C,YAAY,CAAC,EAAE,EAAE,MAAM,GAAG,IAAI;CAG/B"}
1
+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/store/index.ts"],"names":[],"mappings":"AAEA,OAAO,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAI3C,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;IACb,UAAU,EAAE,MAAM,CAAC;CACpB;AAED,MAAM,WAAW,MAAM;IACrB,EAAE,EAAE,MAAM,CAAC;IACX,QAAQ,EAAE,MAAM,CAAC;IACjB,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IACvC,UAAU,EAAE,MAAM,CAAC;IACnB,WAAW,EAAE,MAAM,GAAG,IAAI,CAAC;IAC3B,MAAM,EAAE,SAAS,GAAG,WAAW,GAAG,QAAQ,CAAC;IAC3C,OAAO,EAAE,UAAU,GAAG,IAAI,CAAC;CAC5B;AAED,MAAM,WAAW,OAAO;IACtB,EAAE,EAAE,MAAM,CAAC;IACX,MAAM,EAAE,MAAM,CAAC;IACf,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,OAAO,CAAC;IACf,MAAM,EAAE,MAAM,GAAG,IAAI,CAAC;IACtB,QAAQ,EAAE,OAAO,GAAG,IAAI,CAAC;IACzB,UAAU,EAAE,MAAM,CAAC;IACnB,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC;IACnB,KAAK,EAAE,MAAM,GAAG,IAAI,CAAC;CACtB;AAED,MAAM,WAAW,cAAe,SAAQ,OAAO;IAC7C,MAAM,EAAE,KAAK,CAAC;QAAE,WAAW,EAAE,MAAM,CAAC;QAAC,KAAK,EAAE,MAAM,CAAC;QAAC,MAAM,EAAE,MAAM,GAAG,IAAI,CAAA;KAAE,CAAC,CAAC;CAC9E;AAED,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,OAAO,EAAE,MAAM,CAAC;IAChB,WAAW,EAAE,MAAM,CAAC;IACpB,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,EAAE,MAAM,GAAG,IAAI,CAAC;CACvB;AAED,MAAM,WAAW,UAAU;IACzB,UAAU,EAAE,MAAM,CAAC;IACnB,SAAS,EAAE,MAAM,CAAC;IAClB,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IACnC,cAAc,EAAE,MAAM,CAAC;IACvB,aAAa,EAAE,MAAM,CAAC;IACtB,cAAc,EAAE,MAAM,CAAC;CACxB;AAED,MAAM,WAAW,SAAS;IACxB,EAAE,EAAE,MAAM,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;IACb,OAAO,EAAE,MAAM,CAAC;IAChB,OAAO,EAAE,MAAM,CAAC;IAChB,UAAU,EAAE,MAAM,CAAC;CACpB;AAED,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,MAAM,EAAE,MAAM,CAAC;IACf,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,OAAO,CAAC;IACf,MAAM,EAAE,MAAM,GAAG,IAAI,CAAC;IACtB,QAAQ,CAAC,EAAE,OAAO,CAAC;IACnB,UAAU,EAAE,MAAM,CAAC;IACnB,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC;IACnB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAED,MAAM,WAAW,SAAS;IACxB,EAAE,EAAE,MAAM,CAAC;IACX,OAAO,EAAE,MAAM,CAAC;IAChB,WAAW,EAAE,MAAM,CAAC;IACpB,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAED,qBAAa,QAAQ;;gBAyBP,QAAQ,CAAC,EAAE,MAAM,GAAG,YAAY;IAmH5C,WAAW,CAAC,IAAI,EAAE,MAAM,GAAG,QAAQ;IASnC,QAAQ,CAAC,EAAE,EAAE,MAAM,GAAG,QAAQ,GAAG,SAAS;IAO1C,WAAW,CAAC,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,IAAI;IAI3C,SAAS,CAAC,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,IAAI;IAIzC,SAAS,CAAC,GAAG,EAAE;QACb,QAAQ,EAAE,MAAM,CAAC;QACjB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,EAAE,MAAM,CAAC;QACd,MAAM,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAClC,GAAG,MAAM;IAgBV,SAAS,CACP,KAAK,EAAE,MAAM,EACb,MAAM,EAAE,WAAW,GAAG,QAAQ,EAC9B,OAAO,CAAC,EAAE,UAAU,GACnB,IAAI;IAMP,SAAS,CAAC,KAAK,EAAE,QAAQ,EAAE,GAAG,IAAI;IAsBlC,UAAU,CAAC,MAAM,EAAE,SAAS,EAAE,GAAG,IAAI;IAWrC,MAAM,CAAC,KAAK,EAAE,MAAM,GAAG,MAAM,GAAG,SAAS;IA4BzC,QAAQ,CAAC,OAAO,CAAC,EAAE,MAAM,GAAG,MAAM,EAAE;IA8BpC,QAAQ,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO,EAAE;IA6BlC,eAAe,CAAC,KAAK,EAAE,MAAM,EAAE,SAAS,SAAM,GAAG,cAAc,EAAE;IAmDjE,aAAa,CAAC,KAAK,EAAE,MAAM,EAAE,SAAS,SAAM,GAAG,UAAU;IAuDzD,eAAe,CAAC,IAAI,EAAE,MAAM,GAAG,QAAQ,GAAG,SAAS;IAOnD,qBAAqB,CAAC,OAAO,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,MAAM,GAAG,MAAM,GAAG,SAAS;IAmC1E,UAAU,IAAI,QAAQ,EAAE;IAWxB,YAAY,CAAC,IAAI,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,SAAS;IAetD,WAAW,IAAI,SAAS,EAAE;IAmB1B,SAAS,CAAC,EAAE,EAAE,MAAM,GAAG,SAAS,GAAG,SAAS;IAoB5C,YAAY,CAAC,EAAE,EAAE,MAAM,GAAG,IAAI;CAG/B"}
@@ -129,6 +129,16 @@ var RunStore = class {
129
129
  ).run(id, name, now);
130
130
  return { id, name, created_at: now };
131
131
  }
132
+ getSuite(id) {
133
+ const row = this.#stmt("SELECT * FROM suites WHERE id = ?").get(id);
134
+ return row ?? void 0;
135
+ }
136
+ renameSuite(id, name) {
137
+ this.#stmt("UPDATE suites SET name = ? WHERE id = ?").run(name, id);
138
+ }
139
+ renameRun(id, name) {
140
+ this.#stmt("UPDATE runs SET name = ? WHERE id = ?").run(name, id);
141
+ }
132
142
  createRun(run) {
133
143
  const id = crypto.randomUUID();
134
144
  const now = Date.now();