npm - patina-cli - Versions diffs - 3.11.0 → 4.0.0 - Mend

patina-cli 3.11.0 → 4.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (193) hide show

package/.patina.default.yaml +29 -29
package/CHANGELOG.md +53 -0
package/NOTICE +21 -0
package/README.md +117 -224
package/README_JA.md +134 -77
package/README_KR.md +132 -74
package/README_ZH.md +137 -80
package/SKILL.md +11 -20
package/artifacts/rebaseline-2025/README.md +147 -0
package/artifacts/rebaseline-2025/human-controls.public.jsonl +250 -0
package/artifacts/rebaseline-2025/intake.example.jsonl +2 -0
package/artifacts/rebaseline-2025/intake.local.example.jsonl +25 -0
package/artifacts/rebaseline-2025/prompts.template.jsonl +7 -0
package/artifacts/rebaseline-2025/sources.ko-public.jsonl +39 -0
package/assets/brand/patina-badge.svg +18 -0
package/assets/brand/patina-mark.svg +8 -0
package/assets/demo/README.md +79 -0
package/core/scoring.md +12 -12
package/core/standalone-prompt.md +3 -1
package/core/stylometry.md +93 -22
package/docs/API.md +1554 -0
package/docs/AUTHENTICATION.md +50 -26
package/docs/AUTHENTICATION_KR.md +54 -29
package/docs/BRANDING.md +9 -8
package/docs/CLI.md +55 -14
package/docs/COOKBOOK.md +8 -21
package/docs/DEMO.md +32 -5
package/docs/EXIT-CODES.md +2 -3
package/docs/FALSE-POSITIVES.md +63 -0
package/docs/FAQ.md +9 -1
package/docs/FAQ_KR.md +3 -1
package/docs/FLAG-PARITY.md +33 -47
package/docs/ISSUE-WAVES.md +57 -0
package/docs/PATTERNS-EN.md +67 -3
package/docs/PATTERNS-JA.md +68 -2
package/docs/PATTERNS-KO.md +70 -7
package/docs/PATTERNS-ZH.md +67 -3
package/docs/PATTERNS.md +5 -5
package/docs/RESEARCH-DOCS-PLATFORM.md +54 -0
package/docs/ROADMAP.md +46 -66
package/docs/TRANSLATIONESE-KO.md +51 -0
package/docs/audits/2026-05-deep-research.md +3 -1
package/docs/benchmarks/README.md +51 -0
package/docs/benchmarks/detector-comparison.json +69 -9
package/docs/benchmarks/detector-comparison.md +10 -5
package/docs/benchmarks/katfish-ko-latest.json +657 -0
package/docs/benchmarks/katfish-ko-latest.md +77 -0
package/docs/benchmarks/latest.json +1183 -108
package/docs/benchmarks/latest.md +84 -60
package/docs/benchmarks/lexicon-freshness-en-2026-05-22.json +1121 -0
package/docs/benchmarks/lexicon-freshness-en-2026-05-22.md +136 -0
package/docs/benchmarks/rebaseline-latest.json +381 -0
package/docs/benchmarks/rebaseline-latest.md +121 -0
package/docs/benchmarks/register-stratified-latest.json +164 -0
package/docs/benchmarks/register-stratified-latest.md +99 -0
package/docs/benchmarks/register-stratified.md +43 -0
package/docs/integrations/github-action.md +44 -11
package/docs/integrations/playground.md +58 -0
package/docs/integrations/pre-commit.md +5 -5
package/docs/integrations/release.md +5 -3
package/docs/integrations/static-sites.md +83 -0
package/docs/research/2025-rebaseline-plan.md +71 -2
package/docs/research/2026-rebaseline.md +102 -0
package/docs/research/adversarial-mps.md +41 -0
package/docs/research/ai-human-metrics.md +35 -23
package/docs/research/human-eval-panel.md +42 -0
package/docs/research/judge-agreement.md +24 -0
package/docs/research/ko-2025-corpus-sources.md +135 -0
package/docs/research/lexicon-freshness-audit.md +64 -0
package/docs/research/zh-ja-lexicon-calibration.md +60 -0
package/docs/social/patina-launch-copy.md +173 -100
package/docs/social/patina-launch-execution.md +94 -0
package/docs/social/patina-launch-korean-first.md +83 -0
package/docs/social/signs-of-ai-writing.md +26 -0
package/docs/social/signs-of-ai-writing_KR.md +26 -0
package/lexicon/ai-en.md +21 -24
package/lexicon/ai-ja.md +158 -0
package/lexicon/ai-ko.md +9 -9
package/lexicon/ai-zh.md +158 -0
package/lexicon/provenance/ai-en.json +970 -0
package/lexicon/provenance/ai-ja.json +542 -0
package/lexicon/provenance/ai-ko.json +866 -0
package/lexicon/provenance/ai-zh.json +542 -0
package/package.json +49 -8
package/patterns/en-communication.md +5 -0
package/patterns/en-content.md +5 -0
package/patterns/en-filler.md +5 -0
package/patterns/en-language.md +29 -1
package/patterns/en-structure.md +5 -0
package/patterns/en-style.md +5 -0
package/patterns/en-viral-hook.md +42 -2
package/patterns/ja-communication.md +5 -0
package/patterns/ja-content.md +5 -0
package/patterns/ja-filler.md +5 -0
package/patterns/ja-language.md +33 -1
package/patterns/ja-structure.md +12 -0
package/patterns/ja-style.md +5 -0
package/patterns/ja-viral-hook.md +41 -2
package/patterns/ko-communication.md +5 -0
package/patterns/ko-content.md +5 -0
package/patterns/ko-filler.md +5 -0
package/patterns/ko-language.md +33 -1
package/patterns/ko-structure.md +25 -6
package/patterns/ko-style.md +5 -0
package/patterns/ko-viral-hook.md +38 -2
package/patterns/zh-communication.md +5 -0
package/patterns/zh-content.md +5 -0
package/patterns/zh-filler.md +5 -0
package/patterns/zh-language.md +37 -1
package/patterns/zh-structure.md +12 -0
package/patterns/zh-style.md +5 -0
package/patterns/zh-viral-hook.md +38 -2
package/playground/README.md +55 -0
package/playground/analytics.js +4 -0
package/playground/analyzer.js +883 -0
package/playground/app.js +157 -0
package/playground/data/lexicons.js +343 -0
package/playground/index.html +138 -0
package/playground/styles.css +267 -0
package/profiles/namuwiki.md +111 -0
package/scripts/adversarial-mps-report.mjs +201 -0
package/scripts/badge-json.mjs +79 -0
package/scripts/benchmark-report.mjs +56 -9
package/scripts/check-release-metadata.mjs +0 -2
package/scripts/detector-comparison.mjs +7 -7
package/scripts/generate-playground-data.mjs +77 -0
package/scripts/katfish-calibration.mjs +464 -0
package/scripts/lexicon-freshness.mjs +485 -0
package/scripts/lint.mjs +1 -1
package/scripts/precommit-score.mjs +4 -3
package/scripts/prose-score.mjs +81 -5
package/scripts/rebaseline-intake.mjs +242 -0
package/scripts/rebaseline-score.mjs +268 -0
package/scripts/rebaseline-summary.mjs +773 -0
package/scripts/rebaseline-web-collect.mjs +410 -0
package/scripts/update-benchmark-ranges.mjs +1 -0
package/src/api.js +69 -105
package/src/auth.js +50 -2
package/src/backends/claude-cli.js +19 -4
package/src/backends/codex-cli.js +19 -3
package/src/backends/contract.js +230 -1
package/src/backends/gemini-cli.js +18 -5
package/src/backends/index.js +87 -12
package/src/backends/kimi-cli.js +161 -0
package/src/cli.js +577 -567
package/src/commands/doctor.js +2 -2
package/src/config.js +29 -0
package/src/errors.js +53 -1
package/src/features/discourse-tells.js +68 -0
package/src/features/index.js +82 -8
package/src/features/lexicon.js +40 -6
package/src/features/markup-leakage.js +69 -0
package/src/features/segment.js +41 -0
package/src/features/signal-strength.js +81 -0
package/src/features/stylometry.js +231 -1
package/src/features/translationese.js +127 -0
package/src/loader.js +76 -0
package/src/logger.js +22 -23
package/src/model-defaults.js +55 -0
package/src/ouroboros.js +31 -0
package/src/output.js +102 -90
package/src/prompt-builder.js +103 -68
package/src/providers.js +51 -4
package/src/scoring.js +210 -2
package/src/security.js +75 -0
package/tests/fixtures/live-quality/en/public-docs-01.md +26 -0
package/tests/fixtures/live-quality/ko/public-docs-01.md +26 -0
package/tests/fixtures/suspect-zones/expected-ranges.json +207 -16
package/tests/fixtures/suspect-zones/ja/ai/ja-ai-04-lexicon.md +11 -0
package/tests/fixtures/suspect-zones/ja/natural/ja-nat-04-lexicon-cold.md +11 -0
package/tests/fixtures/suspect-zones/ko/ai/ko-ai-02.md +4 -5
package/tests/fixtures/suspect-zones/ko/ai/ko-ai-07-ko-diagnostic.md +11 -0
package/tests/fixtures/suspect-zones/zh/ai/zh-ai-04-lexicon.md +11 -0
package/tests/fixtures/suspect-zones/zh/natural/zh-nat-04-lexicon-cold.md +11 -0
package/tests/quality/README.md +188 -11
package/tests/quality/adversarial-mps/fixtures.jsonl +10 -0
package/tests/quality/benchmark.mjs +39 -1
package/tests/quality/dogfood.mjs +5 -3
package/tests/quality/live-fixtures.jsonl +2 -0
package/tests/quality/live-quality.mjs +596 -0
package/tests/quality/ranking-metrics.mjs +136 -0
package/tests/quality/rebaseline-manifest.example.jsonl +5 -0
package/vercel.json +53 -0
package/SKILL-MAX.md +0 -455
package/docs/internal/HARNESS.md +0 -14
package/docs/internal/README.md +0 -14
package/docs/internal/WARP.md +0 -23
package/patina-max/SKILL.md +0 -523
package/patina-max/composite.py +0 -457
package/src/cache.js +0 -106
package/src/commands/init.js +0 -208
package/src/manifest.js +0 -162
package/src/max-mode.js +0 -207

package/scripts/rebaseline-web-collect.mjs ADDED Viewed

@@ -0,0 +1,410 @@
+#!/usr/bin/env node
+// Fetch public Korean web pages into the private 2025+ rebaseline workspace.
+//
+// The output intentionally keeps full text in an ignored private JSONL file.
+// Run scripts/rebaseline-score.mjs afterward to publish only hash/metadata and
+// deterministic outcome fields.
+import { createHash } from 'node:crypto';
+import { existsSync, mkdirSync, readFileSync, writeFileSync } from 'node:fs';
+import { dirname, relative, resolve } from 'node:path';
+import { fileURLToPath } from 'node:url';
+import { MATRIX } from './rebaseline-summary.mjs';
+// Directory containing this script, derived from the module URL.
+const __dirname = dirname(fileURLToPath(import.meta.url));
+// Parent of this script's directory; relative input/output paths are resolved against it.
+const REPO_ROOT = resolve(__dirname, '..');
+// Default JSONL source inventory, relative to REPO_ROOT.
+export const DEFAULT_SOURCE_INPUT = 'artifacts/rebaseline-2025/sources.ko-public.jsonl';
+// Default private output file (full raw text), relative to REPO_ROOT.
+export const DEFAULT_PRIVATE_OUTPUT = 'artifacts/rebaseline-2025/private/web-human-controls.generated.private.jsonl';
+// Paragraph length bounds, counted in code points by isUsefulKoreanParagraph.
+export const DEFAULT_MIN_CHARS = 90;
+export const DEFAULT_MAX_CHARS = 700;
+// Upper bound on paragraphs accepted from a single source.
+export const DEFAULT_MAX_PER_SOURCE = 8;
+// Sources are skipped once their register has this many accepted records.
+export const DEFAULT_TARGET_PER_REGISTER = 50;
+// Pause between sources, in milliseconds.
+export const DEFAULT_DELAY_MS = 250;
+// Hangul compatibility jamo (U+3131–U+318E) and syllables (U+AC00–U+D7A3); global so match() returns every hit.
+const HANGUL_RE = /[\u3131-\u318e\uac00-\ud7a3]/gu;
+// A paragraph containing any of these phrases (case-insensitive) is rejected as page boilerplate.
+const BAD_BOILERPLATE_RE = /(본문듣기|말하기 속도|글자크기|인쇄하기|공유하기|목록|검색|닫기|저작권자|무단 전재|재배포 금지|자료출처|문의:|페이스북|트위터|카카오|Copyright|All rights reserved|View all|Apply now)/iu;
+export function parseArgs(argv = process.argv.slice(2)) {
+  const args = {
+    input: DEFAULT_SOURCE_INPUT,
+    output: DEFAULT_PRIVATE_OUTPUT,
+    minChars: DEFAULT_MIN_CHARS,
+    maxChars: DEFAULT_MAX_CHARS,
+    maxPerSource: DEFAULT_MAX_PER_SOURCE,
+    targetPerRegister: DEFAULT_TARGET_PER_REGISTER,
+    delayMs: DEFAULT_DELAY_MS,
+    collectedAt: new Date().toISOString().slice(0, 10),
+    dryRun: false,
+    json: false,
+    help: false,
+  };
+  for (let i = 0; i < argv.length; i++) {
+    const arg = argv[i];
+    if (arg === '--input') args.input = argv[++i];
+    else if (arg === '--output') args.output = argv[++i];
+    else if (arg === '--min-chars') args.minChars = Number(argv[++i]);
+    else if (arg === '--max-chars') args.maxChars = Number(argv[++i]);
+    else if (arg === '--max-per-source') args.maxPerSource = Number(argv[++i]);
+    else if (arg === '--target-per-register') args.targetPerRegister = Number(argv[++i]);
+    else if (arg === '--delay-ms') args.delayMs = Number(argv[++i]);
+    else if (arg === '--collected-at') args.collectedAt = argv[++i];
+    else if (arg === '--dry-run') args.dryRun = true;
+    else if (arg === '--json') args.json = true;
+    else if (arg === '--help' || arg === '-h') args.help = true;
+    else throw new Error(`Unknown argument: ${arg}`);
+  }
+  for (const [name, value] of Object.entries({
+    minChars: args.minChars,
+    maxChars: args.maxChars,
+    maxPerSource: args.maxPerSource,
+    targetPerRegister: args.targetPerRegister,
+    delayMs: args.delayMs,
+  })) {
+    if (!Number.isFinite(value) || value < 0) throw new Error(`${name} must be a non-negative number`);
+  }
+  if (args.minChars > args.maxChars) throw new Error('minChars cannot exceed maxChars');
+  if (Number.isNaN(Date.parse(args.collectedAt))) throw new Error('collected-at must be an ISO-like date');
+  return args;
+}
+export function loadSourceRows(inputPath = DEFAULT_SOURCE_INPUT) {
+  const abs = resolveRepoPath(inputPath);
+  const result = {
+    path: abs,
+    relativePath: toRepoRelative(abs),
+    rows: [],
+    errors: [],
+  };
+  if (!existsSync(abs)) {
+    result.errors.push(`source input not found: ${result.relativePath}`);
+    return result;
+  }
+  const lines = readFileSync(abs, 'utf8').split(/\r?\n/u);
+  for (let index = 0; index < lines.length; index++) {
+    const lineNumber = index + 1;
+    const line = lines[index].trim();
+    if (!line || line.startsWith('#')) continue;
+    try {
+      result.rows.push({ lineNumber, value: normalizeSource(JSON.parse(line), lineNumber) });
+    } catch (error) {
+      result.errors.push(`line ${lineNumber}: ${error.message}`);
+    }
+  }
+  return result;
+}
+function normalizeSource(input, lineNumber) {
+  if (!input || typeof input !== 'object' || Array.isArray(input)) {
+    throw new Error('source row must be a JSON object');
+  }
+  const source = { ...input };
+  for (const field of ['source_id', 'url', 'register', 'source_title', 'source_license']) {
+    if (typeof source[field] !== 'string' || source[field].trim() === '') {
+      throw new Error(`${field} is required`);
+    }
+    source[field] = source[field].trim();
+  }
+  if (!MATRIX.registers.includes(source.register)) {
+    throw new Error(`register must be one of ${MATRIX.registers.join(', ')}`);
+  }
+  try {
+    const parsed = new URL(source.url);
+    if (parsed.protocol !== 'https:') throw new Error('source url must use https');
+  } catch (error) {
+    throw new Error(`invalid url on line ${lineNumber}: ${error.message}`);
+  }
+  if (source.source_published_at && Number.isNaN(Date.parse(source.source_published_at))) {
+    throw new Error('source_published_at must be an ISO-like date when present');
+  }
+  if (source.max_rows !== undefined && (!Number.isFinite(Number(source.max_rows)) || Number(source.max_rows) < 0)) {
+    throw new Error('max_rows must be a non-negative number when present');
+  }
+  source.max_rows = source.max_rows === undefined ? null : Number(source.max_rows);
+  source.sample_prefix = typeof source.sample_prefix === 'string' && source.sample_prefix.trim()
+    ? source.sample_prefix.trim()
+    : `ko-human-web-${slugify(source.source_id)}`;
+  source.source_kind = typeof source.source_kind === 'string' && source.source_kind.trim()
+    ? source.source_kind.trim()
+    : 'public-web';
+  return source;
+}
+export async function collectSources(sources, options = {}) {
+  const opts = {
+    minChars: options.minChars ?? DEFAULT_MIN_CHARS,
+    maxChars: options.maxChars ?? DEFAULT_MAX_CHARS,
+    maxPerSource: options.maxPerSource ?? DEFAULT_MAX_PER_SOURCE,
+    targetPerRegister: options.targetPerRegister ?? DEFAULT_TARGET_PER_REGISTER,
+    delayMs: options.delayMs ?? DEFAULT_DELAY_MS,
+    collectedAt: options.collectedAt || new Date().toISOString().slice(0, 10),
+    fetchImpl: options.fetchImpl || globalThis.fetch,
+  };
+  if (typeof opts.fetchImpl !== 'function') throw new Error('fetch is not available in this runtime');
+  const records = [];
+  const errors = [];
+  const warnings = [];
+  const seenHashes = new Set();
+  const registerCounts = Object.fromEntries(MATRIX.registers.map((register) => [register, 0]));
+  for (const source of sources) {
+    if (registerCounts[source.register] >= opts.targetPerRegister) continue;
+    let html;
+    try {
+      html = await fetchHtml(source.url, opts.fetchImpl);
+    } catch (error) {
+      warnings.push(`${source.source_id}: ${error.message}`);
+      continue;
+    }
+    const candidates = extractTextCandidates(html, opts);
+    const sourceLimit = Math.min(
+      source.max_rows ?? opts.maxPerSource,
+      opts.maxPerSource,
+      opts.targetPerRegister - registerCounts[source.register]
+    );
+    let acceptedFromSource = 0;
+    for (const text of candidates) {
+      if (acceptedFromSource >= sourceLimit) break;
+      const textHash = hashText(text);
+      if (seenHashes.has(textHash)) continue;
+      seenHashes.add(textHash);
+      acceptedFromSource++;
+      registerCounts[source.register]++;
+      records.push(buildPrivateRecord({
+        source,
+        text,
+        textHash,
+        ordinal: acceptedFromSource,
+        collectedAt: opts.collectedAt,
+      }));
+    }
+    if (acceptedFromSource === 0) {
+      warnings.push(`${source.source_id}: no paragraphs accepted from ${source.url}`);
+    }
+    if (opts.delayMs > 0) await sleep(opts.delayMs);
+  }
+  return {
+    records,
+    errors,
+    warnings,
+    registerCounts,
+    sources: sources.length,
+  };
+}
+async function fetchHtml(url, fetchImpl) {
+  const response = await fetchImpl(url, {
+    headers: {
+      'user-agent': 'patina-rebaseline-corpus-builder/1.0 (+https://github.com/devswha/patina)',
+      accept: 'text/html,application/xhtml+xml',
+    },
+  });
+  if (!response || !response.ok) {
+    throw new Error(`fetch failed: HTTP ${response?.status ?? 'unknown'}`);
+  }
+  const contentType = response.headers?.get?.('content-type') || '';
+  if (contentType && !/text\/html|application\/xhtml\+xml/iu.test(contentType)) {
+    throw new Error(`expected HTML but got ${contentType}`);
+  }
+  return response.text();
+}
+export function extractTextCandidates(html, options = {}) {
+  const minChars = options.minChars ?? DEFAULT_MIN_CHARS;
+  const maxChars = options.maxChars ?? DEFAULT_MAX_CHARS;
+  const plain = decodeHtmlEntities(String(html || ''))
+    .replace(/<!--[\s\S]*?-->/gu, ' ')
+    .replace(/<script\b[\s\S]*?<\/script>/giu, ' ')
+    .replace(/<style\b[\s\S]*?<\/style>/giu, ' ')
+    .replace(/<noscript\b[\s\S]*?<\/noscript>/giu, ' ')
+    .replace(/<(?:p|div|section|article|main|br|li|h[1-6]|tr|td|blockquote)\b[^>]*>/giu, '\n')
+    .replace(/<[^>]+>/gu, ' ')
+    .replace(/\u00a0/gu, ' ');
+  const seen = new Set();
+  const candidates = [];
+  for (const raw of plain.split(/\n+/u)) {
+    const text = normalizeParagraph(raw);
+    if (!isUsefulKoreanParagraph(text, { minChars, maxChars })) continue;
+    const key = text.toLowerCase();
+    if (seen.has(key)) continue;
+    seen.add(key);
+    candidates.push(text);
+  }
+  return candidates;
+}
+function isUsefulKoreanParagraph(text, { minChars, maxChars }) {
+  const chars = Array.from(text);
+  if (chars.length < minChars || chars.length > maxChars) return false;
+  if (BAD_BOILERPLATE_RE.test(text)) return false;
+  const hangulCount = (text.match(HANGUL_RE) || []).length;
+  if (hangulCount < 25) return false;
+  const letterish = chars.filter((char) => /[\p{L}\p{N}]/u.test(char)).length || 1;
+  if (hangulCount / letterish < 0.35) return false;
+  if ((text.match(/https?:\/\//giu) || []).length > 0) return false;
+  if ((text.match(/[|{}[\]<>]/gu) || []).length > 5) return false;
+  return true;
+}
+function buildPrivateRecord({ source, text, textHash, ordinal, collectedAt }) {
+  const suffix = String(ordinal).padStart(2, '0');
+  return {
+    language: 'ko',
+    class: 'natural-human',
+    model_family: 'human-reference',
+    provider: 'web-human-control',
+    model: 'human-authored-web-candidate',
+    generated_at: source.source_published_at || collectedAt,
+    decoding: 'not-applicable',
+    postprocess: {
+      editing_pass: 'none',
+      extraction: 'scripted web paragraph candidate',
+      source_kind: source.source_kind,
+    },
+    redistribution: 'hash-only',
+    source_review: source.source_review || {
+      status: 'hash-only-web-candidate',
+      rationale: 'Raw text stays in gitignored private intake. Commit only URL, license note, metadata, score, and sha256 digest until redistribution review is complete.',
+      license_basis: source.source_license,
+    },
+    reviewer_notes: source.reviewer_notes || 'Human-control candidate from public Korean web source; not a public benchmark claim.',
+    sample_id: `${source.sample_prefix}-${suffix}`,
+    register: source.register,
+    source_url: source.url,
+    source_title: source.source_title,
+    source_license: source.source_license,
+    ...(source.source_published_at ? { source_published_at: source.source_published_at } : {}),
+    prompt_id: `${source.sample_prefix}-${suffix}`,
+    text_hash: textHash,
+    text,
+  };
+}
+export function writePrivateOutput(result, outputPath = DEFAULT_PRIVATE_OUTPUT) {
+  if (result.errors.length) throw new Error('refusing to write web corpus output with collection errors');
+  const abs = resolveRepoPath(outputPath);
+  mkdirSync(dirname(abs), { recursive: true });
+  writeFileSync(abs, result.records.map((record) => JSON.stringify(record)).join('\n') + (result.records.length ? '\n' : ''));
+  return { output: toRepoRelative(abs) };
+}
+export function renderSummary(result, written = null) {
+  const lines = [
+    '# Rebaseline Web Collect Summary',
+    '',
+    `- Sources: ${result.sources}`,
+    `- Private rows: ${result.records.length}`,
+    `- Validation: **${result.errors.length ? 'FAIL' : 'PASS'}**`,
+  ];
+  if (written) lines.push(`- Private output: \`${written.output}\``);
+  lines.push('', '## Register counts');
+  for (const register of MATRIX.registers) {
+    lines.push(`- ${register}: ${result.registerCounts[register] || 0}`);
+  }
+  if (result.errors.length) lines.push('', '## Errors', ...result.errors.map((error) => `- ${escapeMarkdown(error)}`));
+  if (result.warnings.length) lines.push('', '## Warnings', ...result.warnings.map((warning) => `- ${escapeMarkdown(warning)}`));
+  return `${lines.join('\n')}\n`;
+}
+function normalizeParagraph(text) {
+  return String(text || '')
+    .replace(/\s+/gu, ' ')
+    .replace(/^[·•*\\-–—\s]+/u, '')
+    .trim();
+}
+function decodeHtmlEntities(text) {
+  return text
+    .replace(/&nbsp;/giu, ' ')
+    .replace(/&amp;/giu, '&')
+    .replace(/&lt;/giu, '<')
+    .replace(/&gt;/giu, '>')
+    .replace(/&quot;/giu, '"')
+    .replace(/&#39;/giu, "'")
+    .replace(/&#x([0-9a-f]+);/giu, (_, hex) => String.fromCodePoint(Number.parseInt(hex, 16)))
+    .replace(/&#([0-9]+);/gu, (_, num) => String.fromCodePoint(Number.parseInt(num, 10)));
+}
+function hashText(text) {
+  return `sha256:${createHash('sha256').update(String(text)).digest('hex')}`;
+}
+function slugify(value) {
+  return String(value || '')
+    .normalize('NFKD')
+    .toLowerCase()
+    .replace(/[^a-z0-9]+/gu, '-')
+    .replace(/^-+|-+$/gu, '')
+    .slice(0, 64) || 'source';
+}
+function sleep(ms) {
+  return new Promise((resolveSleep) => setTimeout(resolveSleep, ms));
+}
+function resolveRepoPath(path) {
+  return resolve(REPO_ROOT, path);
+}
+function toRepoRelative(path) {
+  return relative(REPO_ROOT, path) || path;
+}
+function escapeMarkdown(value) {
+  return String(value ?? '').replace(/\|/gu, '\\|').replace(/\n/gu, ' ');
+}
+function printHelp() {
+  console.log(`Usage: node scripts/rebaseline-web-collect.mjs [--input <sources.jsonl>] [--output <private.jsonl>] [--target-per-register <n>] [--max-per-source <n>] [--dry-run] [--json]
+Fetches public Korean web pages listed in a JSONL source inventory and writes
+private raw-text rows for the 2025+ rebaseline workflow. The output path should
+stay under artifacts/rebaseline-2025/private/ and must not be committed.
+Default input: ${DEFAULT_SOURCE_INPUT}
+Default output: ${DEFAULT_PRIVATE_OUTPUT}`);
+}
+async function main() {
+  const args = parseArgs();
+  if (args.help) {
+    printHelp();
+    return;
+  }
+  const loaded = loadSourceRows(args.input);
+  if (loaded.errors.length) {
+    const result = { sources: 0, records: [], registerCounts: {}, errors: loaded.errors, warnings: [] };
+    console.log(args.json ? JSON.stringify(result, null, 2) : renderSummary(result));
+    process.exitCode = 1;
+    return;
+  }
+  const result = await collectSources(loaded.rows.map((row) => row.value), args);
+  const written = !args.dryRun && result.errors.length === 0
+    ? writePrivateOutput(result, args.output)
+    : null;
+  if (args.json) console.log(JSON.stringify({ ...result, written }, null, 2));
+  else console.log(renderSummary(result, written));
+  if (result.errors.length) process.exitCode = 1;
+}
+// Run main() only when this file is the script passed to node, not when it is
+// imported by another module. A rejected main() is reported on stderr and
+// turned into a non-zero exit code.
+if (process.argv[1] && resolve(process.argv[1]) === fileURLToPath(import.meta.url)) {
+  main().catch((error) => {
+    console.error(`rebaseline-web-collect: ${error.message}`);
+    process.exitCode = 1;
+  });
+}

package/scripts/update-benchmark-ranges.mjs CHANGED Viewed

@@ -60,6 +60,7 @@ function range(value, tolerance, floor = 0) {
+// Report, per detector, whether at least one paragraph in the result triggers it:
+// a 'low' band for burstiness and mattr, a truthy `hot` flag for koDiagnostics and lexicon.
 function detectorHot(result) {
   return {
     burstiness: result.paragraphs.some((p) => p.burstiness?.band === 'low'),
+    koDiagnostics: result.paragraphs.some((p) => p.koDiagnostics?.hot),
     mattr: result.paragraphs.some((p) => p.mattr?.band === 'low'),
     lexicon: result.paragraphs.some((p) => p.lexicon?.hot),
   };

package/src/api.js CHANGED Viewed

@@ -1,9 +1,18 @@
+// @ts-check
 import { validateBaseURL } from './security.js';
+import { DEFAULT_BEST_MODELS } from './model-defaults.js';
 const DEFAULT_TIMEOUT = 120000;
 const DEFAULT_MAX_RETRIES = 2;
 const DEFAULT_BASE_BACKOFF_MS = 1000;
 const DEFAULT_MAX_BACKOFF_MS = 30000;
+/**
+ * Default sampling temperature for OpenAI-compatible chat completion calls.
+ *
+ * @type {number}
+ * @example
+ * const temperature = DEFAULT_TEMPERATURE; // 0.7
+ */
 export const DEFAULT_TEMPERATURE = 0.7;
 // Status codes that warrant a retry. Network errors (no status, AbortError)
@@ -12,6 +21,15 @@ const RETRYABLE_STATUS = new Set([408, 425, 429, 500, 502, 503, 504]);
 // Subclassed error so the retry loop can read `.status` + `.retryAfter`
 // without re-parsing strings.
+/**
+ * Error raised for non-2xx HTTP responses from an LLM provider.
+ *
+ * @param {number} status HTTP status code returned by the provider.
+ * @param {string} body Response body text, truncated in the message.
+ * @param {string|null} retryAfter Raw Retry-After response header, if present.
+ * @example
+ * throw new HttpError(429, 'rate limit', '2');
+ */
 export class HttpError extends Error {
   constructor(status, body, retryAfter) {
     super(`HTTP ${status}: ${truncate(body)}`);
@@ -67,6 +85,15 @@ function sleepWithSignal(sleep, ms, signal) {
   });
 }
+/**
+ * Decide whether an LLM call failure should be retried.
+ *
+ * @param {Error|Object} err Error thrown by fetch or {@link HttpError}.
+ * @returns {boolean} True for retryable HTTP statuses, aborts, and common network failures.
+ * @throws {Error} Does not intentionally throw; unexpected Error-like inputs may still propagate JavaScript runtime failures.
+ * @example
+ * const retry = isRetryable(new HttpError(429, 'rate limit', '1'));
+ */
 export function isRetryable(err) {
   if (!err) return false;
   if (err.name === 'AbortError') return true;
@@ -77,6 +104,21 @@ export function isRetryable(err) {
 // Honors Retry-After (seconds or HTTP-date). Falls back to exponential
 // backoff with up to 50% jitter, capped at maxDelay.
+/**
+ * Compute retry delay from Retry-After or exponential backoff with jitter.
+ *
+ * @param {number} attempt Zero-based retry attempt.
+ * @param {string|null|undefined} retryAfter Retry-After seconds or HTTP-date header.
+ * @param {object} [opts] Backoff tuning and deterministic test hooks.
+ * @param {number} [opts.base=1000] Initial exponential backoff in milliseconds.
+ * @param {number} [opts.max=30000] Maximum returned delay in milliseconds.
+ * @param {Function} [opts.now] Clock returning epoch milliseconds.
+ * @param {Function} [opts.random] Random number provider used for jitter.
+ * @returns {number} Delay in milliseconds, capped at opts.max.
+ * @throws {Error} Propagates validation, filesystem, network, or dependency failures when the underlying operation cannot complete.
+ * @example
+ * const delay = computeBackoffMs(1, '2'); // 2000
+ */
 export function computeBackoffMs(attempt, retryAfter, opts = {}) {
   const {
     base = DEFAULT_BASE_BACKOFF_MS,
@@ -101,39 +143,36 @@ export function computeBackoffMs(attempt, retryAfter, opts = {}) {
   return Math.min(exp + jitter, max);
 }
-// Bounded-concurrency semaphore. `max <= 0` yields a no-op gate for callers
-// that explicitly opt into unlimited fanout.
-export function createSemaphore(max) {
-  if (!max || max <= 0) {
-    return { acquire: () => Promise.resolve(() => {}) };
-  }
-  let active = 0;
-  const queue = [];
-  const drain = () => {
-    if (active < max && queue.length) {
-      active++;
-      const resolve = queue.shift();
-      resolve(() => {
-        active--;
-        drain();
-      });
-    }
-  };
-  return {
-    acquire() {
-      return new Promise((resolve) => {
-        queue.push(resolve);
-        if (active < max) drain();
-      });
-    },
-  };
-}
+/**
+ * Call an OpenAI-compatible chat completions endpoint with retries, timeout, and abort support.
+ *
+ * @param {object} options LLM request options.
+ * @param {string} options.prompt User prompt sent as the single chat message.
+ * @param {string} [options.apiKey] Bearer token for the provider.
+ * @param {string} [options.baseURL] OpenAI-compatible API base URL. Defaults to https://api.openai.com/v1.
+ * @param {string} [options.model] Model id to request. Defaults to gpt-5.5.
+ * @param {number} [options.temperature=DEFAULT_TEMPERATURE] Sampling temperature.
+ * @param {number|string} [options.seed] Optional deterministic seed forwarded to the provider.
+ * @param {number} [options.timeout=120000] Per-attempt timeout in milliseconds.
+ * @param {number} [options.maxRetries=2] Retry count after the first attempt.
+ * @param {number} [options.deadline] Absolute epoch-millisecond deadline for all attempts.
+ * @param {AbortSignal} [options.signal] External cancellation signal.
+ * @param {boolean} [options.allowInsecureBaseURL=false] Allow non-loopback HTTP base URLs.
+ * @param {Function} [options.onResponse] Callback receiving provider metadata.
+ * @param {Function} [options.sleep] Injectable sleep function for tests.
+ * @param {Function} [options.now] Clock returning epoch milliseconds.
+ * @returns {Promise<string>} Assistant message content.
+ * @throws {HttpError} When the provider returns a non-2xx response after retries.
+ * @throws {Error} On abort, timeout, malformed provider payload, or base URL validation failure.
+ * @example
+ * const text = await callLLM({ prompt: 'Rewrite this', apiKey: process.env.OPENAI_API_KEY });
+ */
 export async function callLLM({
   prompt,
   apiKey,
   baseURL = 'https://api.openai.com/v1',
-  model = 'gpt-4o',
+  model = DEFAULT_BEST_MODELS.openai,
   temperature = DEFAULT_TEMPERATURE,
   seed,
   timeout = DEFAULT_TIMEOUT,
@@ -142,7 +181,6 @@ export async function callLLM({
   signal,
   allowInsecureBaseURL = false,
   onResponse,
-  cache,
   // Allows tests to inject a deterministic delay function.
   sleep = (ms) => new Promise((r) => setTimeout(r, ms)),
   now = () => Date.now(),
@@ -156,21 +194,6 @@ export async function callLLM({
   };
   if (seed !== undefined && seed !== null) body.seed = seed;
-  const cached = cache?.get?.({ prompt, model, temperature, baseURL });
-  if (cached) {
-    onResponse?.({
-      provider: 'cache',
-      model: cached.responseModel ?? cached.model ?? model,
-      requestedModel: model,
-      temperature,
-      seed: seed ?? null,
-      usage: cached.usage ?? null,
-      rawResponse: null,
-      content: cached.content,
-      cache: { hit: true, key: cached.key, path: cached.path },
-    });
-    return cached.content;
-  }
   let lastError;
   let attemptsMade = 0;
@@ -234,9 +257,7 @@ export async function callLLM({
         usage: data.usage ?? null,
         rawResponse: data,
         content,
-        cache: cache ? { hit: false } : null,
       };
-      cache?.set?.({ prompt, model, temperature, baseURL }, content, metadata);
       onResponse?.(metadata);
       return content;
@@ -266,65 +287,8 @@ export async function callLLM({
   const err = new Error(`LLM API failed after ${attemptsMade || 1} attempts: ${lastError?.message ?? 'unknown'}`);
   if (lastError?.name === 'AbortError') err.name = 'AbortError';
-  if (typeof lastError?.status === 'number') err.status = lastError.status;
+  const lastStatus = lastError ? /** @type {any} */ (lastError).status : undefined;
+  if (typeof lastStatus === 'number') /** @type {any} */ (err).status = lastStatus;
   throw err;
 }
-export async function callLLMMultiple({
-  prompt,
-  models,
-  apiKey,
-  baseURL = 'https://api.openai.com/v1',
-  temperature = DEFAULT_TEMPERATURE,
-  seed,
-  timeout = DEFAULT_TIMEOUT,
-  allowInsecureBaseURL = false,
-  deadline,
-  signal,
-  maxConcurrency,
-  onStart,
-  onComplete,
-  onResponse,
-  cache,
-  callLLM: callLLMImpl = callLLM,
-  sleep,
-  now = () => Date.now(),
-}) {
-  validateBaseURL(baseURL, { allowInsecure: allowInsecureBaseURL });
-  const effectiveMaxConcurrency =
-    maxConcurrency === undefined || maxConcurrency === null
-      ? Math.min(models.length, 3)
-      : maxConcurrency;
-  const sem = createSemaphore(effectiveMaxConcurrency);
-  const promises = models.map(async (model) => {
-    const release = await sem.acquire();
-    if (onStart) onStart(model);
-    try {
-      const result = await callLLMImpl({
-        prompt,
-        apiKey,
-        baseURL,
-        model,
-        temperature,
-        seed,
-        timeout,
-        deadline,
-        signal,
-        allowInsecureBaseURL,
-        onResponse,
-        cache,
-        sleep,
-        now,
-      });
-      if (onComplete) onComplete(model, true);
-      return { model, result, ok: true };
-    } catch (err) {
-      if (onComplete) onComplete(model, false);
-      return { model, error: err.message, ok: false };
-    } finally {
-      release();
-    }
-  });
-  return Promise.all(promises);
-}