npm - @draig/lexis-two - Versions diffs - 1.0.2 → 1.0.4 - Mend

@draig/lexis-two 1.0.2 → 1.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (115) hide show

package/package.json +7 -1
package/.agents/plugins/marketplace.json +0 -21
package/.claude-plugin/marketplace.json +0 -29
package/.claude-plugin/plugin.json +0 -9
package/.clinerules/lexis-two.md +0 -163
package/.codex-plugin/plugin.json +0 -31
package/.cursor/rules/lexis-two.mdc +0 -169
package/.env.example +0 -8
package/.github/FUNDING.yml +0 -1
package/.github/copilot-instructions.md +0 -47
package/.github/plugin/marketplace.json +0 -20
package/.github/plugin/plugin.json +0 -16
package/.github/workflows/deploy-site.yml +0 -53
package/.github/workflows/test.yml +0 -29
package/.kiro/steering/lexis-two.md +0 -167
package/.nojekyll +0 -0
package/.windsurf/rules/lexis-two.md +0 -163
package/AGENTS.md +0 -163
package/AUDIT.md +0 -74
package/CNAME +0 -1
package/SPECXIS.md +0 -576
package/assets/benchmark-3model.svg +0 -21
package/assets/lexis-two-complete.webp +0 -0
package/assets/lexis-two-nobg.png +0 -0
package/assets/logo.png +0 -0
package/assets/social-preview.png +0 -0
package/benchmarks/README.md +0 -114
package/benchmarks/arms/baseline.js +0 -2
package/benchmarks/arms/caveman-SKILL.md +0 -67
package/benchmarks/arms/caveman.js +0 -8
package/benchmarks/arms/lexis-two.js +0 -10
package/benchmarks/arms/ponytail.js +0 -6
package/benchmarks/behavior.js +0 -58
package/benchmarks/behavior.yaml +0 -40
package/benchmarks/benchmark-local.py +0 -156
package/benchmarks/benchmark-opencode-go.js +0 -294
package/benchmarks/correctness.js +0 -294
package/benchmarks/lib/aggregate-opencode-go.js +0 -103
package/benchmarks/lib/load-env.js +0 -31
package/benchmarks/lib/opencode-go-client.js +0 -151
package/benchmarks/loc.js +0 -13
package/benchmarks/opencode-go-models.json +0 -31
package/benchmarks/promptfooconfig.yaml +0 -41
package/benchmarks/prompts.json +0 -15
package/benchmarks/render-opencode-go-report.js +0 -28
package/benchmarks/results/2026-06-15-llama3.2-local.md +0 -76
package/benchmarks/results/2026-06-16-opencode-go.md +0 -56
package/benchmarks/results/opencode-go-2026-06-16-report.html +0 -226
package/benchmarks/results/opencode-go-2026-06-16.json +0 -1339
package/commands/lexis-two-audit.toml +0 -3
package/commands/lexis-two-debt.toml +0 -3
package/commands/lexis-two-help.toml +0 -3
package/commands/lexis-two-plan.toml +0 -3
package/commands/lexis-two-review.toml +0 -3
package/commands/lexis-two-security.toml +0 -3
package/commands/lexis-two.toml +0 -3
package/docs/assets/lexis-two-nobg.png +0 -0
package/docs/assets/logo.png +0 -0
package/docs/assets/logo.svg +0 -4
package/docs/portability.md +0 -147
package/docs/site.md +0 -52
package/examples/api-endpoint.md +0 -68
package/examples/caching.md +0 -74
package/examples/date-picker.md +0 -48
package/examples/email-validation.md +0 -51
package/examples/sorting.md +0 -42
package/gemini-extension.json +0 -7
package/opencode.json +0 -4
package/pi-extension/index.js +0 -161
package/pi-extension/package.json +0 -8
package/pi-extension/test/extension.test.js +0 -89
package/pi-extension/test/helpers.test.js +0 -35
package/scripts/check-rule-copies.js +0 -82
package/site/astro.config.mjs +0 -18
package/site/package-lock.json +0 -4913
package/site/package.json +0 -14
package/site/public/CNAME +0 -1
package/site/public/assets/lexis-two-nobg.png +0 -0
package/site/public/assets/logo.png +0 -0
package/site/public/assets/logo.svg +0 -4
package/site/public/robots.txt +0 -4
package/site/src/components/Adapt.astro +0 -33
package/site/src/components/Benchmarks.astro +0 -232
package/site/src/components/Commands.astro +0 -33
package/site/src/components/Ecosystem.astro +0 -30
package/site/src/components/Example.astro +0 -77
package/site/src/components/Footer.astro +0 -28
package/site/src/components/Header.astro +0 -87
package/site/src/components/Hero.astro +0 -58
package/site/src/components/Home.astro +0 -46
package/site/src/components/Hosts.astro +0 -62
package/site/src/components/Install.astro +0 -139
package/site/src/components/LanguageSwitcher.astro +0 -82
package/site/src/components/Philosophy.astro +0 -23
package/site/src/components/Stacks.astro +0 -33
package/site/src/components/Suggested.astro +0 -39
package/site/src/data/opencode-go-benchmark.json +0 -230
package/site/src/i18n/en.ts +0 -155
package/site/src/i18n/es.ts +0 -158
package/site/src/i18n/index.ts +0 -14
package/site/src/layouts/Layout.astro +0 -114
package/site/src/pages/benchmarks.astro +0 -4
package/site/src/pages/es/benchmarks.astro +0 -4
package/site/src/pages/es/index.astro +0 -10
package/site/src/pages/index.astro +0 -10
package/site/src/styles/global.css +0 -780
package/site/tsconfig.json +0 -3
package/tests/behavior.test.js +0 -80
package/tests/commands.test.js +0 -40
package/tests/copilot-plugin.test.js +0 -33
package/tests/correctness.test.js +0 -191
package/tests/gemini-extension.test.js +0 -78
package/tests/hooks-windows.test.js +0 -48
package/tests/hooks.test.js +0 -177
package/tests/opencode-plugin.test.js +0 -64

package/benchmarks/lib/load-env.js DELETED Viewed

@@ -1,31 +0,0 @@
-// Load KEY=VALUE lines from a .env file into process.env (no dotenv dependency).
-const fs = require('fs');
-function loadEnvFile(envPath) { // Copies KEY=VALUE pairs from the file at envPath into process.env; returns false when the file does not exist, true otherwise.
-  if (!fs.existsSync(envPath)) return false;
-  const raw = fs.readFileSync(envPath, 'utf8').replace(/^\uFEFF/, ''); // drop a leading byte-order mark
-  for (const line of raw.split(/\r?\n/)) {
-    const trimmed = line.trim();
-    if (!trimmed || trimmed.startsWith('#')) continue; // skip blank lines and comment lines
-    const eq = trimmed.indexOf('=');
-    if (eq <= 0) continue; // no equals sign, or nothing before it: not an assignment
-    const key = trimmed.slice(0, eq).trim();
-    if (process.env[key] !== undefined) continue; // a variable already present in the environment is never overwritten
-    let value = trimmed.slice(eq + 1).trim();
-    if (
-      (value.startsWith('"') && value.endsWith('"')) ||
-      (value.startsWith("'") && value.endsWith("'"))
-    ) {
-      value = value.slice(1, -1); // strip one pair of matching surrounding quotes
-    }
-    process.env[key] = value;
-  }
-  return true;
-}
-module.exports = { loadEnvFile };

package/benchmarks/lib/opencode-go-client.js DELETED Viewed

@@ -1,151 +0,0 @@
-// OpenCode Go API client — OpenAI chat/completions + Anthropic /messages transports.
-// Docs: https://opencode.ai/docs/go/#endpoints
-const fs = require('fs');
-const path = require('path');
-const DEFAULT_BASE = 'https://opencode.ai/zen/go/v1';
-const ENV_PATH = path.join(__dirname, '..', '..', '.env');
-function getApiKey() { // Returns the trimmed key from OPENCODE_API_KEY, falling back to OPENCODE_GO_API_KEY; throws an Error when both are empty.
-  const key = (process.env.OPENCODE_API_KEY || process.env.OPENCODE_GO_API_KEY || '').trim();
-  if (!key) {
-    const hint = fs.existsSync(ENV_PATH) // word the hint according to whether the .env file already exists
-      ? `OPENCODE_API_KEY is empty in ${ENV_PATH}. Paste your OpenCode Go key after the = sign.`
-      : `Create ${ENV_PATH} from .env.example and set OPENCODE_API_KEY=your-key`;
-    throw new Error(`Missing OPENCODE_API_KEY. ${hint}`);
-  }
-  return key;
-}
-async function readJsonResponse(res) { // Reads the response body, parses it as JSON, and throws an Error prefixed with the HTTP status when res.ok is false; otherwise returns the parsed body.
-  const text = await res.text();
-  let body;
-  try {
-    body = text ? JSON.parse(text) : {}; // an empty body is treated as an empty object
-  } catch {
-    body = { raw: text }; // not valid JSON: keep the raw text instead of failing at this point
-  }
-  if (!res.ok) {
-    const msg = // the first truthy candidate below becomes the error message
-      body?.error?.message ||
-      body?.message ||
-      (typeof body?.error === 'string' ? body.error : null) ||
-      text.slice(0, 500) || // at most the first 500 characters of the raw body
-      res.statusText;
-    throw new Error(`HTTP ${res.status}: ${msg}`);
-  }
-  return body;
-}
-function extractOpenAiText(body) { // Returns the message content of the first choice, or an empty string when that path is null or undefined.
-  return body?.choices?.[0]?.message?.content ?? '';
-}
-function extractAnthropicText(body) { // Concatenates the text of every text-typed block in body.content; returns an empty string when body.content is not an array.
-  const blocks = body?.content;
-  if (!Array.isArray(blocks)) return '';
-  return blocks
-    .filter((b) => b?.type === 'text' && typeof b.text === 'string') // blocks of any other type are ignored
-    .map((b) => b.text)
-    .join('');
-}
-function extractUsage(body, transport) { // Normalises body.usage to { inputTokens, outputTokens }; returns null when body.usage is missing.
-  if (transport === 'openai-chat') { // this transport reports prompt_tokens and completion_tokens
-    const u = body?.usage;
-    if (!u) return null;
-    return {
-      inputTokens: u.prompt_tokens ?? 0, // a missing counter is reported as 0
-      outputTokens: u.completion_tokens ?? 0,
-    };
-  }
-  const u = body?.usage; // every other transport value is read as input_tokens and output_tokens
-  if (!u) return null;
-  return {
-    inputTokens: u.input_tokens ?? 0,
-    outputTokens: u.output_tokens ?? 0,
-  };
-}
-async function chatOpenAi({ baseUrl, apiKey, model, system, user, maxTokens, temperature }) { // POSTs one chat completion request to baseUrl + /chat/completions and resolves to { text, usage, raw }.
-  const messages = [];
-  if (system) messages.push({ role: 'system', content: system }); // the system message is sent only when system is truthy
-  messages.push({ role: 'user', content: user });
-  const res = await fetch(`${baseUrl}/chat/completions`, {
-    method: 'POST',
-    headers: {
-      Authorization: `Bearer ${apiKey}`,
-      'Content-Type': 'application/json',
-    },
-    body: JSON.stringify({
-      model,
-      messages,
-      max_tokens: maxTokens,
-      temperature, // passed through unchecked; JSON.stringify omits the key when the value is undefined
-    }),
-  });
-  const body = await readJsonResponse(res); // throws on a non-ok HTTP status
-  return {
-    text: extractOpenAiText(body),
-    usage: extractUsage(body, 'openai-chat'),
-    raw: body, // the full parsed response body
-  };
-}
-async function chatAnthropic({ baseUrl, apiKey, model, system, user, maxTokens, temperature }) { // POSTs one request to baseUrl + /messages and resolves to { text, usage, raw }.
-  const payload = {
-    model,
-    max_tokens: maxTokens,
-    messages: [{ role: 'user', content: user }],
-  };
-  if (system) payload.system = system; // the system prompt is a top-level payload field here, not a message
-  if (typeof temperature === 'number') payload.temperature = temperature; // non-numeric temperature values are left out of the payload
-  // lexis: Go /messages rejects Bearer — x-api-key only (qwen3.7-max, minimax-m3)
-  const res = await fetch(`${baseUrl}/messages`, {
-    method: 'POST',
-    headers: {
-      'x-api-key': apiKey,
-      'Content-Type': 'application/json',
-      'anthropic-version': '2023-06-01',
-    },
-    body: JSON.stringify(payload),
-  });
-  const body = await readJsonResponse(res); // throws on a non-ok HTTP status
-  return {
-    text: extractAnthropicText(body),
-    usage: extractUsage(body, 'anthropic-messages'),
-    raw: body, // the full parsed response body
-  };
-}
-async function complete({ // Runs one completion through the transport named in modelConfig.transport; throws an Error for any other transport value.
-  modelId,
-  modelConfig,
-  system,
-  user,
-  baseUrl = DEFAULT_BASE,
-  apiKey = getApiKey(), // evaluated only when the caller does not pass apiKey, so a missing key throws only in that case
-  temperature = 1,
-}) {
-  const maxTokens = modelConfig.maxTokens ?? 8192; // falls back to 8192 when the model config sets no maxTokens
-  const args = { baseUrl, apiKey, model: modelId, system, user, maxTokens, temperature };
-  if (modelConfig.transport === 'anthropic-messages') {
-    return chatAnthropic(args);
-  }
-  if (modelConfig.transport === 'openai-chat') {
-    return chatOpenAi(args);
-  }
-  throw new Error(`Unknown transport for ${modelId}: ${modelConfig.transport}`);
-}
-module.exports = {
-  DEFAULT_BASE,
-  getApiKey,
-  complete,
-};

package/benchmarks/loc.js DELETED Viewed

@@ -1,13 +0,0 @@
-// Deterministic code-size metric: non-blank, non-comment lines of code. Counts
-// fenced blocks, or the whole response when the model emitted bare code unfenced.
-// Recorded as the `code_loc` metric per arm (always passes; it is a measurement, not a gate).
-module.exports = (output) => { // Returns { pass, score, reason } where score is the number of counted code lines in output and pass is always true.
-  const text = String(output || ''); // falsy output is treated as an empty string
-  const blocks = [...text.matchAll(/```[a-zA-Z0-9_+-]*\n([\s\S]*?)```/g)].map((m) => m[1]);
-  const code = blocks.length ? blocks.join('\n') : text; // with no fenced blocks the whole response is counted
-  const loc = code
-    .split('\n')
-    .map((l) => l.trim())
-    .filter((l) => l && !l.startsWith('//') && !l.startsWith('#') && l !== '*/' && !l.startsWith('/*') && !l.startsWith('*')).length; // blank lines and lines that begin with a comment marker are not counted
-  return { pass: true, score: loc, reason: loc + ' code LOC' };
-};

package/benchmarks/opencode-go-models.json DELETED Viewed

@@ -1,31 +0,0 @@
-{
-  "baseUrl": "https://opencode.ai/zen/go/v1",
-  "defaultModels": [
-    "kimi-k2.6",
-    "deepseek-v4-pro",
-    "qwen3.7-max",
-    "minimax-m3"
-  ],
-  "models": {
-    "kimi-k2.6": {
-      "name": "Kimi K2.6",
-      "transport": "openai-chat",
-      "maxTokens": 8192
-    },
-    "deepseek-v4-pro": {
-      "name": "DeepSeek V4 Pro",
-      "transport": "openai-chat",
-      "maxTokens": 8192
-    },
-    "qwen3.7-max": {
-      "name": "Qwen3.7 Max",
-      "transport": "anthropic-messages",
-      "maxTokens": 8192
-    },
-    "minimax-m3": {
-      "name": "MiniMax M3",
-      "transport": "anthropic-messages",
-      "maxTokens": 8192
-    }
-  }
-}

package/benchmarks/promptfooconfig.yaml DELETED Viewed

@@ -1,41 +0,0 @@
-# Ponytail benchmark: code size + cost across three arms, same model, same tasks.
-#
-#   Run:   npx promptfoo@latest eval -c benchmarks/promptfooconfig.yaml
-#   View:  npx promptfoo@latest view
-#   Share: npx promptfoo@latest share   (publishes a hosted report URL)
-#
-# Needs ANTHROPIC_API_KEY in the environment or a .env file (see benchmarks/README.md).
-# Caveman arm uses JuliusBrussee/caveman SKILL.md (MIT), vendored at arms/caveman-SKILL.md.
-description: "Ponytail vs caveman vs no-skill: same model, same tasks. Measures code LOC (deterministic) and tokens/cost (API telemetry)."
-providers:
-  - id: anthropic:messages:claude-haiku-4-5-20251001
-    config: { max_tokens: 8192, temperature: 1 }
-  - id: anthropic:messages:claude-sonnet-4-6
-    config: { max_tokens: 8192, temperature: 1 }
-  - id: anthropic:messages:claude-opus-4-8
-    config: { max_tokens: 8192, temperature: 1 }
-prompts:
-  - id: file://arms/baseline.js
-    label: baseline (no skill)
-  - id: file://arms/caveman.js
-    label: caveman
-  - id: file://arms/ponytail.js
-    label: ponytail
-defaultTest:
-  assert:
-    - type: javascript
-      value: file://loc.js
-      metric: code_loc
-    - type: javascript
-      value: file://correctness.js
-      metric: correct
-tests:
-  - vars: { task: "Write me a Python function that validates email addresses." }
-  - vars: { task: "Add debounce to a search input in vanilla JavaScript. It currently fires an API call on every keystroke." }
-  - vars: { task: "Write Python code that reads sales.csv and sums the 'amount' column." }
-  - vars: { task: "Build me a countdown timer component in React that counts down from a given number of seconds." }
-  - vars: { task: "Add rate limiting to my FastAPI endpoint so users can't spam it." }

package/benchmarks/prompts.json DELETED Viewed

@@ -1,15 +0,0 @@
-{
-  "method": "One fresh Claude Code subagent per task x config, same model, no file outputs. Metrics from task telemetry: total tokens (includes thinking), duration. Code lines counted from fenced blocks in the deliverable.",
-  "configs": [
-    "baseline — no skill",
-    "caveman — caveman SKILL.md (full) as operating instructions",
-    "ponytail — ponytail SKILL.md (full) as operating instructions"
-  ],
-  "tasks": [
-    { "id": "email", "prompt": "Write me a Python function that validates email addresses." },
-    { "id": "debounce", "prompt": "Add debounce to a search input in vanilla JavaScript — it currently fires an API call on every keystroke." },
-    { "id": "csv-sum", "prompt": "Write Python code that reads sales.csv and sums the 'amount' column." },
-    { "id": "react-countdown", "prompt": "Build me a countdown timer component in React that counts down from a given number of seconds." },
-    { "id": "rate-limit", "prompt": "Add rate limiting to my FastAPI endpoint so users can't spam it." }
-  ]
-}

package/benchmarks/render-opencode-go-report.js DELETED Viewed

@@ -1,28 +0,0 @@
-#!/usr/bin/env node
-/**
- * Sync aggregated benchmark data for the Astro site.
- *
- * Usage:
- *   node benchmarks/render-opencode-go-report.js
- *   node benchmarks/render-opencode-go-report.js benchmarks/results/opencode-go-2026-06-16.json
- */
-const fs = require('fs');
-const path = require('path');
-const { aggregateOpencodeGo, findLatestJson } = require('./lib/aggregate-opencode-go.js');
-const SITE_DATA = path.join(__dirname, '..', 'site', 'src', 'data', 'opencode-go-benchmark.json');
-function main() { // Aggregates one benchmark results JSON file and writes the outcome to SITE_DATA.
-  const input = process.argv[2] ? path.resolve(process.argv[2]) : findLatestJson(); // first CLI argument if given, else whatever findLatestJson returns
-  const data = JSON.parse(fs.readFileSync(input, 'utf8'));
-  const chart = aggregateOpencodeGo(data);
-  fs.mkdirSync(path.dirname(SITE_DATA), { recursive: true }); // create the target directory when it is missing
-  fs.writeFileSync(SITE_DATA, `${JSON.stringify(chart, null, 2)}\n`, 'utf8'); // two-space indented JSON with a trailing newline
-  console.log(`Site data → ${SITE_DATA}`);
-  console.log('Preview charts: npm run site:dev → http://localhost:4321/benchmarks/');
-}
-main();

package/benchmarks/results/2026-06-15-llama3.2-local.md DELETED Viewed

@@ -1,76 +0,0 @@
-# Local model benchmark: llama3.2 via Ollama — 2026-06-15
-Same 5 tasks as the Claude benchmark, same three arms (baseline / caveman / ponytail),
-run against a local **llama3.2:latest** (3.2B, Q4_K_M) via Ollama on a Windows 11 machine.
-Tooling: `benchmarks/benchmark-local.py` (no promptfoo needed).
-> **Updated 2026-06-15:** the LOC counter now counts bare, unfenced code. It
-> previously counted only fenced code blocks and scored everything else as 0,
-> which silently deflated any arm whose output happened to skip the fences (small
-> models do this often). Numbers below use the corrected counter at n=5 median.
-> Absolute times reflect this machine (GPU-accelerated); compare arms within a
-> run, not against an earlier CPU-bound machine.
-## Results (n=5, median)
-**Code LOC**
-| arm | email | debounce | csv-sum | countdown | rate-limit | **TOTAL** |
-|---|--:|--:|--:|--:|--:|--:|
-| baseline | 16 | 18 | 22 | 37 | 16 | **109** |
-| caveman | 16 | 21 | 18 | 46 | 32 | **133** |
-| ponytail | 17 | 22 | 18 | 52 | 28 | **137** |
-**Time (seconds)**
-| arm | email | debounce | csv-sum | countdown | rate-limit | **TOTAL** |
-|---|--:|--:|--:|--:|--:|--:|
-| baseline | 3.1 | 3.7 | 3.6 | 4.2 | 4.8 | **19.4** |
-| caveman | 4.1 | 4.2 | 3.6 | 4.4 | 4.8 | **21.1** |
-| ponytail | 4.1 | 4.2 | 3.8 | 4.8 | 4.9 | **21.8** |
-## Key findings
-**On llama3.2 the LOC effect is inside the noise floor.** At temperature 0.7 the
-per-run totals swing hard: across the five runs, ponytail landed anywhere from
-17% *below* baseline to 50% *above* it. The n=5 median came out +26%; a separate
-n=3 median came out −17%. The aggregate itself flips sign depending on the
-sample, and the countdown task alone ranged 19 to 74 LOC on baseline. There is no
-stable LOC reduction to report.
-**Ponytail does not transfer to llama3.2.** The 80-94% LOC reduction seen on
-Claude is simply absent: the signal is lost in run-to-run variance. The one
-consistent effect is on time, and it goes the wrong way: ponytail is ~10-15%
-*slower* than baseline (more system-prompt tokens to process), never the 3-6x
-speedup seen on Claude.
-**Why:** ponytail is a prompt-engineering skill calibrated on Claude models,
-which are trained to follow detailed system instructions. A 3.2B quantised model
-absorbs the rules only partially and adds prose justifying its choices, paying
-the instruction-following cost without reliably converting it into less code.
-## Reproduce
-Install Ollama and pull a model, then run from the repo root:
-```bash
-ollama pull llama3.2
-python benchmarks/benchmark-local.py --model llama3.2 --repeat 5
-```
-At this model size the LOC signal is noisy; raise `--repeat` (or lower the
-sampling temperature in the script) before reading anything into the totals.
-Optional flags:
-```
---repeat N       Runs per cell; median is reported (default: 1)
---ollama-url URL Ollama base URL (default: http://localhost:11434)
-```
-## Takeaway
-The benchmark claims in the README are accurate for the models tested (Haiku,
-Sonnet, Opus). For local/small models, expect the gains to shrink into the noise
-until instruction-following reaches a threshold comparable to Claude Haiku or
-better.

package/benchmarks/results/2026-06-16-opencode-go.md DELETED Viewed

@@ -1,56 +0,0 @@
-# Lexis-Two benchmark — OpenCode Go (2026-06-16)
-Provider: [OpenCode Go](https://opencode.ai/docs/go/).
-Repeat: 3 per cell. Temperature: 1.
-## Kimi K2.6 (`kimi-k2.6`)
-Repeat: 3. Arms: baseline, lexis-two.
-**Code LOC (median)**
-| arm | email | debounce | csv-sum | countdown | rate-limit | TOTAL | correct |
-| --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| baseline | 46 | 63 | 18 | 413 | 62 | 602 | 12/15 |
-| lexis-two | 13 | 10 | 4 | 13 | 23 | 63 | 12/15 |
-**lexis-two vs baseline (median total LOC):** 90% less code.
-## DeepSeek V4 Pro (`deepseek-v4-pro`)
-Repeat: 3. Arms: baseline, lexis-two.
-**Code LOC (median)**
-| arm | email | debounce | csv-sum | countdown | rate-limit | TOTAL | correct |
-| --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| baseline | 36 | 61 | 25 | 113 | 53 | 288 | 14/15 |
-| lexis-two | 9 | 12 | 4 | 12 | 20 | 57 | 13/15 |
-**lexis-two vs baseline (median total LOC):** 80% less code.
-## Qwen3.7 Max (`qwen3.7-max`)
-Repeat: 3. Arms: baseline, lexis-two.
-**Code LOC (median)**
-| arm | email | debounce | csv-sum | countdown | rate-limit | TOTAL | correct |
-| --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| baseline | 39 | 48 | 19 | 124 | 40 | 270 | 12/15 |
-| lexis-two | 14 | 9 | 4 | 10 | 17 | 54 | 13/15 |
-**lexis-two vs baseline (median total LOC):** 80% less code.
-## MiniMax M3 (`minimax-m3`)
-Repeat: 3. Arms: baseline, lexis-two.
-**Code LOC (median)**
-| arm | email | debounce | csv-sum | countdown | rate-limit | TOTAL | correct |
-| --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| baseline | 55 | 66 | 33 | 112 | 59 | 325 | 11/15 |
-| lexis-two | 9 | 10 | 4 | 18 | 15 | 56 | 15/15 |
-**lexis-two vs baseline (median total LOC):** 83% less code.

package/benchmarks/results/opencode-go-2026-06-16-report.html DELETED Viewed

@@ -1,226 +0,0 @@
-<!DOCTYPE html>
-<html lang="en">
-<head>
-  <meta charset="utf-8" />
-  <meta name="viewport" content="width=device-width, initial-scale=1" />
-  <title>Lexis-Two benchmark — OpenCode Go (2026-06-16)</title>
-  <script src="https://cdn.jsdelivr.net/npm/chart.js@4.4.1/dist/chart.umd.min.js"></script>
-  <style>
-    :root {
-      --bg: #0b0d0c;
-      --panel: #121614;
-      --border: #1e2420;
-      --text: #e8ece9;
-      --muted: #8a948d;
-      --accent: #7cba8a;
-      --baseline: #c97a7a;
-    }
-    * { box-sizing: border-box; }
-    body {
-      margin: 0;
-      font-family: system-ui, sans-serif;
-      background: var(--bg);
-      color: var(--text);
-      line-height: 1.5;
-    }
-    .wrap { max-width: 1100px; margin: 0 auto; padding: 2rem 1rem 3rem; }
-    h1 { font-size: 1.75rem; margin: 0 0 0.25rem; }
-    .sub { color: var(--muted); margin-bottom: 2rem; font-size: 0.95rem; }
-    .grid {
-      display: grid;
-      gap: 1.25rem;
-      grid-template-columns: repeat(auto-fit, minmax(320px, 1fr));
-    }
-    .card {
-      background: var(--panel);
-      border: 1px solid var(--border);
-      border-radius: 0.5rem;
-      padding: 1rem 1rem 0.5rem;
-    }
-    .card h2 {
-      font-size: 0.85rem;
-      text-transform: uppercase;
-      letter-spacing: 0.06em;
-      color: var(--muted);
-      margin: 0 0 0.75rem;
-    }
-    .card canvas { max-height: 280px; }
-    .wide { grid-column: 1 / -1; }
-    table {
-      width: 100%;
-      border-collapse: collapse;
-      font-size: 0.875rem;
-    }
-    th, td {
-      padding: 0.5rem 0.75rem;
-      border-bottom: 1px solid var(--border);
-      text-align: right;
-    }
-    th:first-child, td:first-child { text-align: left; }
-    th { color: var(--muted); font-weight: 600; }
-    .good { color: var(--accent); }
-    footer { margin-top: 2rem; color: var(--muted); font-size: 0.8rem; }
-    a { color: var(--accent); }
-  </style>
-</head>
-<body>
-  <div class="wrap">
-    <h1>Lexis-Two × OpenCode Go</h1>
-    <p class="sub">
-      Source: <code>opencode-go-2026-06-16.json</code> · 3 runs/cell · median LOC ·
-      arms: baseline, lexis-two
-    </p>
-    <div class="grid">
-      <div class="card wide">
-        <h2>Total code LOC (median, 5 tasks)</h2>
-        <canvas id="chart-total-loc"></canvas>
-      </div>
-      <div class="card">
-        <h2>LOC reduction vs baseline</h2>
-        <canvas id="chart-reduction"></canvas>
-      </div>
-      <div class="card">
-        <h2>Wall time (median total seconds)</h2>
-        <canvas id="chart-time"></canvas>
-      </div>
-      <div class="card wide">
-        <h2>LOC by task — lexis-two arm</h2>
-        <canvas id="chart-by-task"></canvas>
-      </div>
-      <div class="card wide">
-        <h2>Summary table</h2>
-        <table id="summary-table">
-          <thead>
-            <tr>
-              <th>Model</th>
-              <th>Baseline LOC</th>
-              <th>Lexis-Two LOC</th>
-              <th>Reduction</th>
-              <th>Correct (lexis)</th>
-            </tr>
-          </thead>
-          <tbody></tbody>
-        </table>
-      </div>
-    </div>
-    <footer>
-      Regenerate: <code>node benchmarks/render-opencode-go-report.js</code>
-    </footer>
-  </div>
-  <script>
-    const DATA = {"date":"2026-06-16","repeat":3,"models":[{"id":"kimi-k2.6","locByArmTask":{"baseline":{"email":56,"debounce":71,"csv-sum":19,"countdown":366,"rate-limit":49},"lexis-two":{"email":10,"debounce":5,"csv-sum":4,"countdown":16,"rate-limit":14}},"timeByArmTask":{"baseline":{"email":12.973,"debounce":14.098,"csv-sum":5.08,"countdown":21.987,"rate-limit":16.836},"lexis-two":{"email":16.23,"debounce":8.363,"csv-sum":9.846,"countdown":18.389,"rate-limit":16.189}},"correctByArm":{"baseline":{"pass":11,"total":15},"lexis-two":{"pass":10,"total":15}},"totals":{"baselineLoc":561,"lexisLoc":49,"reductionPct":91,"baselineTimeSec":71,"lexisTimeSec":69}},{"id":"deepseek-v4-pro","locByArmTask":{"baseline":{"email":60,"debounce":39,"csv-sum":26,"countdown":90,"rate-limit":66},"lexis-two":{"email":7,"debounce":7,"csv-sum":4,"countdown":10,"rate-limit":18}},"timeByArmTask":{"baseline":{"email":35.051,"debounce":14.509,"csv-sum":13.422,"countdown":46.762,"rate-limit":32.401},"lexis-two":{"email":27.456,"debounce":16.982,"csv-sum":24.931,"countdown":36.191,"rate-limit":39.952}},"correctByArm":{"baseline":{"pass":13,"total":15},"lexis-two":{"pass":12,"total":15}},"totals":{"baselineLoc":281,"lexisLoc":46,"reductionPct":84,"baselineTimeSec":142.1,"lexisTimeSec":145.5}},{"id":"qwen3.7-max","locByArmTask":{"baseline":{"email":34,"debounce":44,"csv-sum":17,"countdown":128,"rate-limit":47},"lexis-two":{"email":7,"debounce":5,"csv-sum":3,"countdown":10,"rate-limit":13}},"timeByArmTask":{"baseline":{"email":43.542,"debounce":17.58,"csv-sum":25.876,"countdown":32.586,"rate-limit":41.602},"lexis-two":{"email":39.323,"debounce":28.275,"csv-sum":23.769,"countdown":28.775,"rate-limit":40.786}},"correctByArm":{"baseline":{"pass":14,"total":15},"lexis-two":{"pass":11,"total":15}},"totals":{"baselineLoc":270,"lexisLoc":38,"reductionPct":86,"baselineTimeSec":161.2,"lexisTimeSec":160.9}},{"id":"minimax-m3","locByArmTask":{"baseline":{"email":62,"debounce":58,"csv-sum":43,"countdown":117,"rate-limit":76},"lexis-two":{"email":12,"debounce":6,"csv-sum":2,"countdown":13,"rate-limit":14}},"timeByArmTask":{"baseline":{"email":18.398,"debounce":14.916,"csv-sum":10.237,"countdown":19.516,"rate-limit":22.131},"lexis-two":{"email":8.002,"debounce":2.393,"csv-sum":2.423,"countdown":2.753,"rate-limit":4.209}},"correctByArm":{"baseline":{"pass":12,"total":15},"lexis-two":{"pass":9,"total":15}},"totals":{"baselineLoc":356,"lexisLoc":47,"reductionPct":87,"baselineTimeSec":85.2,"lexisTimeSec":19.8}}],"tasks":["email","debounce","csv-sum","countdown","rate-limit"],"arms":["baseline","lexis-two"]};
-    const labels = DATA.models.map((m) => m.id.replace('kimi-k2.6','Kimi K2.6').replace('deepseek-v4-pro','DeepSeek V4').replace('qwen3.7-max','Qwen3.7 Max').replace('minimax-m3','MiniMax M3')); // display name per model id; an id with no replacement here is shown unchanged
-    Chart.defaults.color = '#8a948d'; // same value as the --muted CSS variable
-    Chart.defaults.borderColor = '#1e2420'; // same value as the --border CSS variable
-    Chart.defaults.font.family = 'system-ui, sans-serif';
-    new Chart(document.getElementById('chart-total-loc'), { // bar chart of total LOC per model, one dataset per arm
-      type: 'bar',
-      data: {
-        labels,
-        datasets: [
-          {
-            label: 'baseline',
-            data: DATA.models.map((m) => m.totals.baselineLoc),
-            backgroundColor: '#c97a7a', // same value as the --baseline CSS variable
-          },
-          {
-            label: 'lexis-two',
-            data: DATA.models.map((m) => m.totals.lexisLoc),
-            backgroundColor: '#7cba8a', // same value as the --accent CSS variable
-          },
-        ],
-      },
-      options: {
-        responsive: true,
-        plugins: { legend: { position: 'bottom' } },
-        scales: { y: { beginAtZero: true, title: { display: true, text: 'lines of code' } } },
-      },
-    });
-    new Chart(document.getElementById('chart-reduction'), { // bar chart of totals.reductionPct per model
-      type: 'bar',
-      data: {
-        labels,
-        datasets: [{
-          label: '% less code',
-          data: DATA.models.map((m) => m.totals.reductionPct),
-          backgroundColor: '#7cba8a',
-        }],
-      },
-      options: {
-        indexAxis: 'y', // models run along the y axis, so the bars are horizontal
-        responsive: true,
-        plugins: { legend: { display: false } }, // a single dataset needs no legend
-        scales: {
-          x: { beginAtZero: true, max: 100, ticks: { callback: (v) => v + '%' } }, // fixed 0 to 100 scale with a percent sign on each tick
-        },
-      },
-    });
-    new Chart(document.getElementById('chart-time'), { // bar chart of total time per model, one dataset per arm
-      type: 'bar',
-      data: {
-        labels,
-        datasets: [
-          {
-            label: 'baseline',
-            data: DATA.models.map((m) => m.totals.baselineTimeSec),
-            backgroundColor: '#c97a7a', // same colours as the total LOC chart: baseline first, lexis-two second
-          },
-          {
-            label: 'lexis-two',
-            data: DATA.models.map((m) => m.totals.lexisTimeSec),
-            backgroundColor: '#7cba8a',
-          },
-        ],
-      },
-      options: {
-        responsive: true,
-        plugins: { legend: { position: 'bottom' } },
-        scales: { y: { beginAtZero: true, title: { display: true, text: 'seconds' } } },
-      },
-    });
-    const taskLabels = DATA.tasks; // task ids, in the order listed in DATA
-    const taskColors = ['#7cba8a', '#5a9a6a', '#9fd4a8', '#4a7356', '#3d5f48'];
-    new Chart(document.getElementById('chart-by-task'), { // bar chart of lexis-two LOC per model, one dataset per task
-      type: 'bar',
-      data: {
-        labels,
-        datasets: taskLabels.map((taskId, i) => ({
-          label: taskId,
-          data: DATA.models.map((m) => m.locByArmTask['lexis-two'][taskId]), // only the lexis-two arm is plotted
-          backgroundColor: taskColors[i % taskColors.length], // colours repeat when there are more tasks than colours
-        })),
-      },
-      options: {
-        responsive: true,
-        plugins: { legend: { position: 'bottom' } },
-        scales: {
-          x: { stacked: false },
-          y: { beginAtZero: true, title: { display: true, text: 'LOC (lexis-two)' } },
-        },
-      },
-    });
-    const tbody = document.querySelector('#summary-table tbody'); // the tbody is empty in the markup; rows are added below
-    for (const m of DATA.models) { // one table row per model
-      const c = m.correctByArm['lexis-two']; // the correctness column shows the lexis-two arm only
-      const tr = document.createElement('tr');
-      tr.innerHTML = `
-        <td>${m.id}</td>
-        <td>${m.totals.baselineLoc}</td>
-        <td class="good">${m.totals.lexisLoc}</td>
-        <td class="good">${m.totals.reductionPct}%</td>
-        <td>${c.pass}/${c.total}</td>
-      `;
-      tbody.appendChild(tr); // NOTE(review): values are interpolated into innerHTML unescaped; they come from the inline DATA constant in this page
-    }
-  </script>
-</body>
-</html>