npm - benchforge - Versions diffs - 0.1.9 → 0.2.4 - Mend

benchforge 0.1.9 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (253)

package/LICENSE +20 -0
package/README.md +99 -260
package/bin/benchforge +1 -2
package/dist/AnalyzeArchive-8NCJhmhS.mjs +145 -0
package/dist/AnalyzeArchive-8NCJhmhS.mjs.map +1 -0
package/dist/BenchMatrix-BZVrBB_h.mjs +1050 -0
package/dist/BenchMatrix-BZVrBB_h.mjs.map +1 -0
package/dist/BenchRunner-DglX1NOn.d.mts +302 -0
package/dist/CoverageSampler-D5T9DRqe.mjs +27 -0
package/dist/CoverageSampler-D5T9DRqe.mjs.map +1 -0
package/dist/Formatters-BWj3d4sv.mjs +95 -0
package/dist/Formatters-BWj3d4sv.mjs.map +1 -0
package/dist/{HeapSampler-B8dtKHn1.mjs → HeapSampler-Dq-hpXem.mjs} +4 -4
package/dist/HeapSampler-Dq-hpXem.mjs.map +1 -0
package/dist/RunBenchCLI-C17DrJz8.mjs +3075 -0
package/dist/RunBenchCLI-C17DrJz8.mjs.map +1 -0
package/dist/StatisticalUtils-BD92crgM.mjs +255 -0
package/dist/StatisticalUtils-BD92crgM.mjs.map +1 -0
package/dist/TimeSampler-Ds8n7l2B.mjs +29 -0
package/dist/TimeSampler-Ds8n7l2B.mjs.map +1 -0
package/dist/ViewerServer-BJhdnxlN.mjs +639 -0
package/dist/ViewerServer-BJhdnxlN.mjs.map +1 -0
package/dist/ViewerServer-CuMNdNBz.mjs +2 -0
package/dist/bin/benchforge.mjs +4 -5
package/dist/bin/benchforge.mjs.map +1 -1
package/dist/index.d.mts +731 -522
package/dist/index.mjs +98 -3
package/dist/index.mjs.map +1 -0
package/dist/runners/WorkerScript.d.mts +12 -4
package/dist/runners/WorkerScript.mjs +92 -120
package/dist/runners/WorkerScript.mjs.map +1 -1
package/dist/viewer/assets/CIPlot-BkOvMoMa.js +1 -0
package/dist/viewer/assets/HistogramKde-CmSyUFY0.js +1 -0
package/dist/viewer/assets/LegendUtils-BJpbn_jr.js +55 -0
package/dist/viewer/assets/SampleTimeSeries-C4VBhXr3.js +1 -0
package/dist/viewer/assets/index-Br9bp_cX.js +153 -0
package/dist/viewer/assets/index-NzXXe_CC.css +1 -0
package/dist/viewer/index.html +19 -0
package/dist/viewer/speedscope/LICENSE +21 -0
package/dist/viewer/speedscope/SourceCodePro-Regular.ttf-ILST5JV6.woff2 +0 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js +2 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js.map +7 -0
package/dist/viewer/speedscope/favicon-16x16-VSI62OPJ.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-3EB2YCUY.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js +2 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js.map +7 -0
package/dist/viewer/speedscope/favicon-FOKUP5Y5.ico +0 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js +2 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js.map +7 -0
package/dist/viewer/speedscope/file-format-schema.json +274 -0
package/dist/viewer/speedscope/index.html +19 -0
package/dist/viewer/speedscope/jfrview_bg-BLJXNNQB.wasm +0 -0
package/dist/viewer/speedscope/perf-vertx-stacks-01-collapsed-all-ZNUIGAJL.txt +199 -0
package/dist/viewer/speedscope/release.txt +3 -0
package/dist/viewer/speedscope/source-code-pro.LICENSE.md +93 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css +2 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css.map +7 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js +212 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js.map +7 -0
package/package.json +52 -26
package/src/bin/benchforge.ts +2 -2
package/src/cli/AnalyzeArchive.ts +232 -0
package/src/cli/BrowserBench.ts +322 -0
package/src/cli/CliArgs.ts +164 -48
package/src/cli/CliExport.ts +179 -0
package/src/cli/CliOptions.ts +147 -0
package/src/cli/CliReport.ts +197 -0
package/src/cli/FilterBenchmarks.ts +18 -30
package/src/cli/RunBenchCLI.ts +138 -844
package/src/cli/SuiteRunner.ts +160 -0
package/src/cli/ViewerServer.ts +282 -0
package/src/export/AllocExport.ts +121 -0
package/src/export/ArchiveExport.ts +146 -0
package/src/export/ArchiveFormat.ts +50 -0
package/src/export/CoverageExport.ts +148 -0
package/src/export/EditorUri.ts +10 -0
package/src/export/PerfettoExport.ts +91 -126
package/src/export/SpeedscopeTypes.ts +98 -0
package/src/export/TimeExport.ts +115 -0
package/src/index.ts +87 -62
package/src/matrix/BenchMatrix.ts +230 -0
package/src/matrix/CaseLoader.ts +8 -6
package/src/matrix/MatrixDirRunner.ts +153 -0
package/src/matrix/MatrixFilter.ts +55 -53
package/src/matrix/MatrixInlineRunner.ts +50 -0
package/src/matrix/MatrixReport.ts +94 -254
package/src/matrix/VariantLoader.ts +9 -9
package/src/profiling/browser/BenchLoop.ts +51 -0
package/src/profiling/browser/BrowserCDP.ts +133 -0
package/src/profiling/browser/BrowserGcStats.ts +33 -0
package/src/profiling/browser/BrowserProfiler.ts +160 -0
package/src/profiling/browser/CdpClient.ts +82 -0
package/src/profiling/browser/CdpPage.ts +138 -0
package/src/profiling/browser/ChromeLauncher.ts +158 -0
package/src/profiling/browser/ChromeTraceEvent.ts +28 -0
package/src/profiling/browser/PageLoadMode.ts +61 -0
package/src/profiling/node/CoverageSampler.ts +27 -0
package/src/profiling/node/CoverageTypes.ts +23 -0
package/src/profiling/node/HeapSampleReport.ts +261 -0
package/src/{heap-sample → profiling/node}/HeapSampler.ts +55 -13
package/src/profiling/node/ResolvedProfile.ts +98 -0
package/src/profiling/node/TimeSampler.ts +57 -0
package/src/report/BenchmarkReport.ts +146 -0
package/src/report/Colors.ts +9 -0
package/src/report/Formatters.ts +110 -0
package/src/report/GcSections.ts +151 -0
package/src/{GitUtils.ts → report/GitUtils.ts} +18 -19
package/src/report/HtmlReport.ts +223 -0
package/src/report/ParseStats.ts +73 -0
package/src/report/StandardSections.ts +147 -0
package/src/report/ViewerSections.ts +286 -0
package/src/report/text/TableReport.ts +253 -0
package/src/report/text/TextReport.ts +123 -0
package/src/runners/AdaptiveWrapper.ts +167 -287
package/src/runners/BenchRunner.ts +27 -22
package/src/{Benchmark.ts → runners/BenchmarkSpec.ts} +5 -6
package/src/runners/CreateRunner.ts +5 -7
package/src/runners/GcStats.ts +58 -61
package/src/{MeasuredResults.ts → runners/MeasuredResults.ts} +43 -37
package/src/runners/MergeBatches.ts +123 -0
package/src/{NodeGC.ts → runners/NodeGC.ts} +2 -3
package/src/runners/RunnerOrchestrator.ts +180 -296
package/src/runners/RunnerUtils.ts +75 -1
package/src/runners/SampleStats.ts +100 -0
package/src/runners/TimingRunner.ts +244 -0
package/src/runners/TimingUtils.ts +3 -2
package/src/runners/WorkerScript.ts +162 -178
package/src/stats/BootstrapDifference.ts +282 -0
package/src/{PermutationTest.ts → stats/PermutationTest.ts} +31 -40
package/src/stats/StatisticalUtils.ts +445 -0
package/src/{tests → test}/AdaptiveConvergence.test.ts +10 -10
package/src/test/AdaptiveRunner.test.ts +39 -41
package/src/{tests → test}/AdaptiveSampling.test.ts +9 -9
package/src/test/AdaptiveStatistics.integration.ts +9 -41
package/src/{tests → test}/BenchMatrix.test.ts +31 -28
package/src/test/BenchmarkReport.test.ts +63 -13
package/src/test/BrowserBench.e2e.test.ts +186 -17
package/src/test/BrowserBench.test.ts +10 -5
package/src/test/BuildTimeSection.test.ts +130 -0
package/src/test/CapSamples.test.ts +82 -0
package/src/test/CoverageExport.test.ts +115 -0
package/src/test/CoverageSampler.test.ts +33 -0
package/src/test/HeapAttribution.test.ts +51 -0
package/src/{tests → test}/MatrixFilter.test.ts +16 -16
package/src/{tests → test}/MatrixReport.test.ts +1 -1
package/src/test/PermutationTest.test.ts +1 -1
package/src/{tests → test}/RealDataValidation.test.ts +6 -6
package/src/test/RunBenchCLI.test.ts +57 -56
package/src/test/RunnerOrchestrator.test.ts +12 -12
package/src/test/StatisticalUtils.test.ts +48 -12
package/src/{table-util/test → test}/TableReport.test.ts +2 -2
package/src/test/TestUtils.ts +35 -30
package/src/test/TimeExport.test.ts +139 -0
package/src/test/TimeSampler.test.ts +37 -0
package/src/test/ViewerLive.e2e.test.ts +159 -0
package/src/test/ViewerStatic.static.e2e.test.ts +137 -0
package/src/{tests → test}/fixtures/baseline/impl.ts +1 -1
package/src/{tests → test}/fixtures/bevy30-samples.ts +3 -1
package/src/test/fixtures/cases/asyncCases.ts +9 -0
package/src/{tests → test}/fixtures/cases/cases.ts +5 -2
package/src/test/fixtures/cases/variants/product.ts +2 -0
package/src/test/fixtures/cases/variants/sum.ts +2 -0
package/src/test/fixtures/discover/fast.ts +1 -0
package/src/{tests → test}/fixtures/discover/slow.ts +1 -1
package/src/test/fixtures/invalid/bad.ts +1 -0
package/src/test/fixtures/loader/fast.ts +1 -0
package/src/{tests → test}/fixtures/loader/slow.ts +1 -1
package/src/test/fixtures/loader/stateful.ts +2 -0
package/src/test/fixtures/stateful/stateful.ts +2 -0
package/src/test/fixtures/variants/extra.ts +1 -0
package/src/test/fixtures/variants/impl.ts +1 -0
package/src/test/fixtures/worker/fast.ts +1 -0
package/src/{tests → test}/fixtures/worker/slow.ts +1 -1
package/src/viewer/DateFormat.ts +30 -0
package/src/viewer/Helpers.ts +23 -0
package/src/viewer/LineData.ts +120 -0
package/src/viewer/Providers.ts +191 -0
package/src/viewer/ReportData.ts +123 -0
package/src/viewer/State.ts +49 -0
package/src/viewer/Theme.ts +15 -0
package/src/viewer/components/App.tsx +73 -0
package/src/viewer/components/DropZone.tsx +71 -0
package/src/viewer/components/LazyPlot.ts +33 -0
package/src/viewer/components/SamplesPanel.tsx +214 -0
package/src/viewer/components/Shell.tsx +26 -0
package/src/viewer/components/SourcePanel.tsx +216 -0
package/src/viewer/components/SummaryPanel.tsx +332 -0
package/src/viewer/components/TabBar.tsx +131 -0
package/src/viewer/components/TabContent.tsx +46 -0
package/src/viewer/components/ThemeToggle.tsx +50 -0
package/src/viewer/index.html +20 -0
package/src/viewer/main.tsx +4 -0
package/src/viewer/plots/CIPlot.ts +313 -0
package/src/{html/browser → viewer/plots}/HistogramKde.ts +42 -47
package/src/viewer/plots/LegendUtils.ts +134 -0
package/src/viewer/plots/PlotTypes.ts +85 -0
package/src/viewer/plots/RenderPlots.ts +230 -0
package/src/viewer/plots/SampleTimeSeries.ts +306 -0
package/src/viewer/plots/SvgHelpers.ts +136 -0
package/src/viewer/plots/TimeSeriesMarks.ts +319 -0
package/src/viewer/report.css +427 -0
package/src/viewer/shell.css +357 -0
package/src/viewer/tsconfig.json +11 -0
package/dist/BenchRunner-CSKN9zPy.d.mts +0 -225
package/dist/BrowserHeapSampler-DCeL42RE.mjs +0 -202
package/dist/BrowserHeapSampler-DCeL42RE.mjs.map +0 -1
package/dist/GcStats-ByEovUi1.mjs +0 -77
package/dist/GcStats-ByEovUi1.mjs.map +0 -1
package/dist/HeapSampler-B8dtKHn1.mjs.map +0 -1
package/dist/TimingUtils-ClclVQ7E.mjs +0 -597
package/dist/TimingUtils-ClclVQ7E.mjs.map +0 -1
package/dist/browser/index.js +0 -914
package/dist/src-Cf_LXwlp.mjs +0 -2873
package/dist/src-Cf_LXwlp.mjs.map +0 -1
package/src/BenchMatrix.ts +0 -380
package/src/BenchmarkReport.ts +0 -156
package/src/HtmlDataPrep.ts +0 -148
package/src/StandardSections.ts +0 -261
package/src/StatisticalUtils.ts +0 -176
package/src/TypeUtil.ts +0 -8
package/src/browser/BrowserGcStats.ts +0 -44
package/src/browser/BrowserHeapSampler.ts +0 -271
package/src/export/JsonExport.ts +0 -103
package/src/export/JsonFormat.ts +0 -91
package/src/heap-sample/HeapSampleReport.ts +0 -196
package/src/html/HtmlReport.ts +0 -131
package/src/html/HtmlTemplate.ts +0 -284
package/src/html/Types.ts +0 -88
package/src/html/browser/CIPlot.ts +0 -287
package/src/html/browser/LegendUtils.ts +0 -163
package/src/html/browser/RenderPlots.ts +0 -263
package/src/html/browser/SampleTimeSeries.ts +0 -389
package/src/html/browser/Types.ts +0 -96
package/src/html/browser/index.ts +0 -1
package/src/html/index.ts +0 -17
package/src/runners/BasicRunner.ts +0 -364
package/src/table-util/ConvergenceFormatters.ts +0 -19
package/src/table-util/Formatters.ts +0 -152
package/src/table-util/README.md +0 -70
package/src/table-util/TableReport.ts +0 -293
package/src/tests/fixtures/cases/asyncCases.ts +0 -7
package/src/tests/fixtures/cases/variants/product.ts +0 -2
package/src/tests/fixtures/cases/variants/sum.ts +0 -2
package/src/tests/fixtures/discover/fast.ts +0 -1
package/src/tests/fixtures/invalid/bad.ts +0 -1
package/src/tests/fixtures/loader/fast.ts +0 -1
package/src/tests/fixtures/loader/stateful.ts +0 -2
package/src/tests/fixtures/stateful/stateful.ts +0 -2
package/src/tests/fixtures/variants/extra.ts +0 -1
package/src/tests/fixtures/variants/impl.ts +0 -1
package/src/tests/fixtures/worker/fast.ts +0 -1
package/src/{table-util/test → test}/TableValueExtractor.test.ts +0 -0
package/src/{table-util/test → test}/TableValueExtractor.ts +9 -9

package/src/report/text/TextReport.ts ADDED

@@ -0,0 +1,123 @@
+import {
+  type BenchmarkReport,
+  type ComparisonOptions,
+  computeDiffCI,
+  extractSectionValues,
+  findPrimaryColumn,
+  isHigherIsBetter,
+  type ReportColumn,
+  type ReportGroup,
+  type ReportSection,
+} from "../BenchmarkReport.ts";
+import { formatDiffWithCI, truncate } from "../Formatters.ts";
+import {
+  buildTable,
+  type ColumnGroup,
+  type ResultGroup,
+} from "./TableReport.ts";
+/** Options for text report rendering, including baseline comparison settings. */
+export interface TextReportOptions extends ComparisonOptions {}
+type Row = Record<string, unknown> & { name: string };
+/** Build a formatted text table from benchmark groups, with baseline diff columns when present. */
+export function reportResults(
+  groups: ReportGroup[],
+  sections: ReportSection[],
+  options?: TextReportOptions,
+): string {
+  const primary = findPrimaryColumn(sections);
+  const results = groups.map(g =>
+    resultGroupValues(g, sections, primary, options),
+  );
+  const hasBaseline = results.some(g => g.baseline);
+  const table = buildTable(sectionColumnGroups(sections, hasBaseline), results);
+  const hasSampleCI = results.some(g =>
+    g.results.some(r => r.diffCI && (r.diffCI as any).ciLevel === "sample"),
+  );
+  if (!hasSampleCI) return table;
+  return (
+    table +
+    "\n* Confidence intervals may be too narrow (single batch)." +
+    " Use --batches for more accurate intervals.\n"
+  );
+}
+/** Extract stats from all sections into row objects for each report. */
+export function valuesForReports(
+  reports: BenchmarkReport[],
+  sections: ReportSection[],
+): Row[] {
+  return reports.map(r => ({
+    name: truncate(r.name),
+    ...extractSectionValues(r.measuredResults, sections, r.metadata),
+  }));
+}
+/** Insert a "delta% CI" column after the first comparable column. */
+export function injectDiffColumns(
+  groups: ColumnGroup<Row>[],
+): ColumnGroup<Row>[] {
+  const asSections = groups.map(g => ({
+    title: g.groupTitle ?? "",
+    columns: g.columns as ReportColumn[],
+  }));
+  const higher = isHigherIsBetter(asSections);
+  const fmt = (v: unknown) => formatDiffWithCI(v, higher);
+  const ciCol = { title: "Δ% CI", key: "diffCI" as keyof Row, formatter: fmt };
+  let ciAdded = false;
+  return groups.map(group => ({
+    groupTitle: group.groupTitle,
+    columns: group.columns.flatMap(col => {
+      if ((col as ReportColumn).comparable && !ciAdded) {
+        ciAdded = true;
+        return [col, ciCol];
+      }
+      return [col];
+    }),
+  }));
+}
+/** Build table columns from sections, with name column and optional CI diff columns. */
+export function sectionColumnGroups(
+  sections: ReportSection[],
+  hasBaseline: boolean,
+  nameTitle = "name",
+): ColumnGroup<Row>[] {
+  const nameCol: ColumnGroup<Row> = {
+    columns: [{ key: "name" as keyof Row, title: nameTitle }],
+  };
+  const groups: ColumnGroup<Row>[] = sections.map(s => ({
+    groupTitle: s.title || undefined,
+    columns: s.columns.map(c => ({
+      ...c,
+      key: (c.key ?? c.title) as keyof Row,
+    })),
+  }));
+  const cols = hasBaseline ? injectDiffColumns(groups) : groups;
+  return [nameCol, ...cols];
+}
+/** Extract section stats and bootstrap CI diffs for all reports in a group. */
+function resultGroupValues(
+  group: ReportGroup,
+  sections: ReportSection[],
+  primary?: ReportColumn,
+  options?: TextReportOptions,
+): ResultGroup<Row> {
+  const { reports, baseline } = group;
+  const baseM = baseline?.measuredResults;
+  const { statKind, higherIsBetter } = primary ?? {};
+  const results = reports.map(r => {
+    const { measuredResults: m, metadata } = r;
+    const diffCI = statKind
+      ? computeDiffCI(baseM, m, statKind, options, higherIsBetter)
+      : undefined;
+    const values = extractSectionValues(m, sections, metadata);
+    return { name: truncate(r.name), ...values, ...(diffCI && { diffCI }) };
+  });
+  const baseRow = baseline && valuesForReports([baseline], sections)[0];
+  return { results, baseline: baseRow };
+}

package/src/runners/AdaptiveWrapper.ts CHANGED

@@ -1,22 +1,23 @@
-import type { BenchmarkSpec } from "../Benchmark.ts";
-import type { MeasuredResults } from "../MeasuredResults.ts";
-import {
-  coefficientOfVariation,
-  medianAbsoluteDeviation,
-  percentile,
-} from "../StatisticalUtils.ts";
+import { median } from "../stats/StatisticalUtils.ts";
+import type { BenchmarkSpec } from "./BenchmarkSpec.ts";
 import type { BenchRunner, RunnerOptions } from "./BenchRunner.ts";
+import type { MeasuredResults } from "./MeasuredResults.ts";
 import { msToNs } from "./RunnerUtils.ts";
+import { computeStats, outlierImpactRatio } from "./SampleStats.ts";
-const minTime = 1000;
-const maxTime = 10000;
-const targetConfidence = 95;
-const fallbackThreshold = 80;
-const windowSize = 50;
-const stability = 0.05; // 5% drift threshold (was 2%, too strict for real benchmarks)
-const initialBatch = 100;
-const continueBatch = 100;
-const continueIterations = 10;
+/** Options for adaptive sampling: collects until statistical convergence or timeout. */
+export interface AdaptiveOptions extends RunnerOptions {
+  /** Enable adaptive sampling (default: true when using adaptive runner) */
+  adaptive?: boolean;
+  /** Minimum measurement time in ms before convergence can stop sampling (default: 1000) */
+  minTime?: number;
+  /** Maximum measurement time in ms, hard stop (default: 10000) */
+  maxTime?: number;
+  /** Target confidence percentage to stop early (default: 95) */
+  targetConfidence?: number;
+  /** Confidence threshold 0-100 (alias for targetConfidence) */
+  convergence?: number;
+}
 type Metrics = {
   medianDrift: number;
@@ -31,112 +32,163 @@ interface ConvergenceResult {
   reason: string;
 }
-export interface AdaptiveOptions extends RunnerOptions {
-  adaptive?: boolean;
-  minTime?: number;
-  maxTime?: number;
-  targetConfidence?: number;
-  convergence?: number; // Confidence threshold (0-100)
-}
+const minTime = 1000;
+const maxTime = 10000;
+const targetConfidence = 95;
+const fallbackThreshold = 80;
+const windowSize = 50;
+const stability = 0.05; // 5% drift threshold (was 2%, too strict for real benchmarks)
+const initialBatch = 100;
+const continueBatch = 100;
+const continueIterations = 10;
-/** @return adaptive sampling runner wrapper */
+/** Wrap a runner with adaptive sampling (convergence detection or timeout). */
 export function createAdaptiveWrapper(
   baseRunner: BenchRunner,
   options: AdaptiveOptions,
 ): BenchRunner {
   return {
     async runBench<T = unknown>(
-      benchmark: BenchmarkSpec<T>,
-      runnerOptions: RunnerOptions,
+      bench: BenchmarkSpec<T>,
+      opts: RunnerOptions,
       params?: T,
     ): Promise<MeasuredResults[]> {
-      return runAdaptiveBench(
-        baseRunner,
-        benchmark,
-        runnerOptions,
-        options,
-        params,
-      );
+      return runAdaptiveBench(baseRunner, bench, opts, options, params);
     },
   };
 }
-/** @return results using adaptive sampling strategy */
+/** Check convergence by comparing sliding windows of samples for stability. */
+export function checkConvergence(samples: number[]): ConvergenceResult {
+  const windowSize = getWindowSize(samples);
+  const minSamples = windowSize * 2;
+  if (samples.length < minSamples) {
+    const confidence = (samples.length / minSamples) * 100;
+    const reason = `Collecting samples: ${samples.length}/${minSamples}`;
+    return { converged: false, confidence, reason };
+  }
+  return buildConvergence(getStability(samples, windowSize));
+}
+/** Run benchmark with adaptive sampling until convergence or timeout. */
 async function runAdaptiveBench<T>(
-  baseRunner: BenchRunner,
-  benchmark: BenchmarkSpec<T>,
-  runnerOptions: RunnerOptions,
-  options: AdaptiveOptions,
+  runner: BenchRunner,
+  bench: BenchmarkSpec<T>,
+  opts: RunnerOptions,
+  adaptive: AdaptiveOptions,
   params?: T,
 ): Promise<MeasuredResults[]> {
-  const {
-    minTime: min = options.minTime ?? minTime,
-    maxTime: max = options.maxTime ?? maxTime,
-    targetConfidence: target = options.convergence ?? targetConfidence,
-  } = runnerOptions as AdaptiveOptions;
+  const overrides = opts as AdaptiveOptions;
+  const min = overrides.minTime ?? adaptive.minTime ?? minTime;
+  const max = overrides.maxTime ?? adaptive.maxTime ?? maxTime;
+  const target =
+    overrides.convergence ?? adaptive.convergence ?? targetConfidence;
   const allSamples: number[] = [];
-  // Collect initial batch (includes warmup + settle)
-  const warmup = await collectInitial(
-    baseRunner,
-    benchmark,
-    runnerOptions,
+  const { warmup, startTime: hrtimeStart } = await collectInitial(
+    runner,
+    bench,
+    opts,
     params,
     allSamples,
   );
-  // Start timing AFTER warmup - warmup time doesn't count against maxTime
+  // Start timing after warmup so warmup time doesn't count against maxTime
   const startTime = performance.now();
   const limits = {
     minTime: min,
     maxTime: max,
     targetConfidence: target,
     startTime,
   };
-  await collectAdaptive(
-    baseRunner,
-    benchmark,
-    runnerOptions,
-    params,
-    allSamples,
-    limits,
-  );
+  await collectAdaptive(runner, bench, opts, params, allSamples, limits);
-  const convergence = checkConvergence(allSamples.map(s => s * msToNs));
+  const samplesNs = allSamples.map(s => s * msToNs);
+  const convergence = checkConvergence(samplesNs);
   return buildResults(
     allSamples,
     startTime,
     convergence,
-    benchmark.name,
+    bench.name,
     warmup,
+    hrtimeStart,
   );
 }
-/** @return warmupSamples from initial batch */
+/** Scale window size inversely with execution time -- fast ops need more samples. */
+function getWindowSize(samples: number[]): number {
+  if (samples.length < 20) return windowSize;
+  const recentMs = samples.slice(-20).map(s => s / msToNs);
+  const recentMedian = median(recentMs);
+  if (recentMedian < 0.01) return 200; // <10μs
+  if (recentMedian < 0.1) return 100; // <100μs
+  if (recentMedian < 1) return 50; // <1ms
+  if (recentMedian < 10) return 30; // <10ms
+  return 20; // >10ms
+}
+/** Convert stability metrics to a convergence result with confidence score. */
+function buildConvergence(metrics: Metrics): ConvergenceResult {
+  const { medianDrift, impactDrift, medianStable, impactStable } = metrics;
+  if (medianStable && impactStable)
+    return {
+      converged: true,
+      confidence: 100,
+      reason: "Stable performance pattern",
+    };
+  const raw =
+    (1 - medianDrift / stability) * 50 + (1 - impactDrift / stability) * 50;
+  const confidence = Math.max(0, Math.min(100, raw));
+  const reason =
+    medianDrift > impactDrift
+      ? `Median drifting: ${(medianDrift * 100).toFixed(1)}%`
+      : `Outlier impact changing: ${(impactDrift * 100).toFixed(1)}%`;
+  return { converged: false, confidence, reason };
+}
+/** Compare median and outlier-impact drift between recent and previous windows. */
+function getStability(samples: number[], windowSize: number): Metrics {
+  const toMs = (s: number) => s / msToNs;
+  const recentMs = samples.slice(-windowSize).map(toMs);
+  const previousMs = samples.slice(-windowSize * 2, -windowSize).map(toMs);
+  const medianRecent = median(recentMs);
+  const medianPrevious = median(previousMs);
+  const medianDrift = Math.abs(medianRecent - medianPrevious) / medianPrevious;
+  const impactRecent = outlierImpactRatio(recentMs);
+  const impactPrevious = outlierImpactRatio(previousMs);
+  const impactDrift = Math.abs(impactRecent - impactPrevious);
+  const medianStable = medianDrift < stability;
+  const impactStable = impactDrift < stability;
+  return { medianDrift, impactDrift, medianStable, impactStable };
+}
+/** Collect the initial batch (warmup + settle), returning warmup samples. */
 async function collectInitial<T>(
-  baseRunner: BenchRunner,
-  benchmark: BenchmarkSpec<T>,
-  runnerOptions: RunnerOptions,
+  runner: BenchRunner,
+  bench: BenchmarkSpec<T>,
+  opts: RunnerOptions,
   params: T | undefined,
   allSamples: number[],
-): Promise<number[] | undefined> {
-  // Don't pass adaptive flag to base runner to avoid double wrapping
-  const opts = {
-    ...(runnerOptions as any),
+): Promise<{ warmup?: number[]; startTime?: number }> {
+  const batchOpts = {
+    ...(opts as any),
     maxTime: initialBatch,
     maxIterations: undefined,
   };
-  const results = await baseRunner.runBench(benchmark, opts, params);
+  const results = await runner.runBench(bench, batchOpts, params);
   appendSamples(results[0], allSamples);
-  return results[0].warmupSamples;
+  return { warmup: results[0].warmupSamples, startTime: results[0].startTime };
 }
-/** @return samples until convergence or timeout */
+/** Collect batches until convergence or timeout, with progress logging. */
 async function collectAdaptive<T>(
-  baseRunner: BenchRunner,
-  benchmark: BenchmarkSpec<T>,
-  runnerOptions: RunnerOptions,
+  runner: BenchRunner,
+  bench: BenchmarkSpec<T>,
+  opts: RunnerOptions,
   params: T | undefined,
   allSamples: number[],
   limits: {
@@ -153,239 +205,67 @@ async function collectAdaptive<T>(
     const convergence = checkConvergence(samplesNs);
     const elapsed = performance.now() - startTime;
-    if (elapsed - lastLog > 1000) {
-      const elapsedSec = (elapsed / 1000).toFixed(1);
-      const conf = convergence.confidence.toFixed(0);
-      process.stderr.write(
-        `\r◊ ${benchmark.name}: ${conf}% confident (${elapsedSec}s)   `,
-      );
-      lastLog = elapsed;
-    }
-    if (shouldStop(convergence, targetConfidence, elapsed, minTime)) {
-      break;
-    }
+    lastLog = logProgress(bench.name, convergence, elapsed, lastLog);
+    if (shouldStop(convergence, targetConfidence, elapsed, minTime)) break;
-    // Skip warmup for continuation batches (warmup done in initial batch)
-    const opts = {
-      ...(runnerOptions as any),
+    const batch = {
+      ...(opts as any),
       maxTime: continueBatch,
       maxIterations: continueIterations,
       skipWarmup: true,
     };
-    const batchResults = await baseRunner.runBench(benchmark, opts, params);
-    appendSamples(batchResults[0], allSamples);
+    const results = await runner.runBench(bench, batch, params);
+    appendSamples(results[0], allSamples);
   }
   process.stderr.write("\r" + " ".repeat(60) + "\r");
 }
-/** Append samples one-by-one to avoid stack overflow from spread on large arrays */
-function appendSamples(result: MeasuredResults, samples: number[]): void {
-  if (!result.samples?.length) return;
-  for (const sample of result.samples) samples.push(sample);
-}
-/** @return true if convergence reached or timeout */
-function shouldStop(
-  convergence: ConvergenceResult,
-  targetConfidence: number,
-  elapsedTime: number,
-  minTime: number,
-): boolean {
-  if (convergence.converged && convergence.confidence >= targetConfidence) {
-    return true;
-  }
-  // After minTime, accept whichever is higher: targetConfidence or fallbackThreshold
-  const threshold = Math.max(targetConfidence, fallbackThreshold);
-  return elapsedTime >= minTime && convergence.confidence >= threshold;
-}
-/** @return measured results with convergence metrics */
+/** Build final MeasuredResults from collected samples and convergence state. */
 function buildResults(
-  samplesMs: number[],
-  startTime: number,
+  samples: number[],
+  elapsedStart: number,
   convergence: ConvergenceResult,
   name: string,
   warmupSamples?: number[],
+  startTime?: number,
 ): MeasuredResults[] {
-  const totalTime = (performance.now() - startTime) / 1000;
-  const samplesNs = samplesMs.map(s => s * msToNs);
-  const timeStats = computeTimeStats(samplesNs);
+  const totalTime = (performance.now() - elapsedStart) / 1000;
+  const time = computeStats(samples);
   return [
-    {
-      name,
-      samples: samplesMs,
-      warmupSamples,
-      time: timeStats,
-      totalTime,
-      convergence,
-    },
+    { name, samples, warmupSamples, time, totalTime, startTime, convergence },
   ];
 }
-/** @return time percentiles and statistics in ms */
-function computeTimeStats(samplesNs: number[]) {
-  const samplesMs = samplesNs.map(s => s / msToNs);
-  const { min, max, sum } = getMinMaxSum(samplesNs);
-  const percentiles = getPercentiles(samplesNs);
-  const robust = getRobustMetrics(samplesMs);
-  return {
-    min: min / msToNs,
-    max: max / msToNs,
-    avg: sum / samplesNs.length / msToNs,
-    ...percentiles,
-    ...robust,
-  };
-}
-/** @return min, max, sum of samples */
-function getMinMaxSum(samples: number[]) {
-  const min = samples.reduce(
-    (a, b) => Math.min(a, b),
-    Number.POSITIVE_INFINITY,
-  );
-  const max = samples.reduce(
-    (a, b) => Math.max(a, b),
-    Number.NEGATIVE_INFINITY,
-  );
-  const sum = samples.reduce((a, b) => a + b, 0);
-  return { min, max, sum };
-}
-/** @return percentiles in ms */
-function getPercentiles(samples: number[]) {
-  return {
-    p25: percentile(samples, 0.25) / msToNs,
-    p50: percentile(samples, 0.5) / msToNs,
-    p75: percentile(samples, 0.75) / msToNs,
-    p95: percentile(samples, 0.95) / msToNs,
-    p99: percentile(samples, 0.99) / msToNs,
-    p999: percentile(samples, 0.999) / msToNs,
-  };
-}
-/** @return robust variability metrics */
-function getRobustMetrics(samplesMs: number[]) {
-  const impact = getOutlierImpact(samplesMs);
-  return {
-    cv: coefficientOfVariation(samplesMs),
-    mad: medianAbsoluteDeviation(samplesMs),
-    outlierRate: impact.ratio,
-  };
-}
-/** @return outlier impact as proportion of total time */
-function getOutlierImpact(samples: number[]): { ratio: number; count: number } {
-  if (samples.length === 0) return { ratio: 0, count: 0 };
-  const median = percentile(samples, 0.5);
-  const q75 = percentile(samples, 0.75);
-  const threshold = median + 1.5 * (q75 - median);
-  let excessTime = 0;
-  let count = 0;
-  for (const sample of samples) {
-    if (sample > threshold) {
-      excessTime += sample - median;
-      count++;
-    }
-  }
-  const totalTime = samples.reduce((a, b) => a + b, 0);
-  return {
-    ratio: totalTime > 0 ? excessTime / totalTime : 0,
-    count,
-  };
-}
-/** @return convergence based on window stability */
-export function checkConvergence(samples: number[]): ConvergenceResult {
-  const windowSize = getWindowSize(samples);
-  const minSamples = windowSize * 2;
-  if (samples.length < minSamples) {
-    return buildProgressResult(samples.length, minSamples);
-  }
-  const metrics = getStability(samples, windowSize);
-  return buildConvergence(metrics);
-}
-/** @return progress when samples insufficient */
-function buildProgressResult(
-  currentSamples: number,
-  minSamples: number,
-): ConvergenceResult {
-  return {
-    converged: false,
-    confidence: (currentSamples / minSamples) * 100,
-    reason: `Collecting samples: ${currentSamples}/${minSamples}`,
-  };
+/** Append samples one-by-one to avoid stack overflow from spread on large arrays. */
+function appendSamples(result: MeasuredResults, samples: number[]): void {
+  if (!result.samples?.length) return;
+  for (const sample of result.samples) samples.push(sample);
 }
-/** @return stability metrics between windows */
-function getStability(samples: number[], windowSize: number): Metrics {
-  const recent = samples.slice(-windowSize);
-  const previous = samples.slice(-windowSize * 2, -windowSize);
-  const recentMs = recent.map(s => s / msToNs);
-  const previousMs = previous.map(s => s / msToNs);
-  const medianRecent = percentile(recentMs, 0.5);
-  const medianPrevious = percentile(previousMs, 0.5);
-  const medianDrift = Math.abs(medianRecent - medianPrevious) / medianPrevious;
-  const impactRecent = getOutlierImpact(recentMs);
-  const impactPrevious = getOutlierImpact(previousMs);
-  const impactDrift = Math.abs(impactRecent.ratio - impactPrevious.ratio);
-  return {
-    medianDrift,
-    impactDrift,
-    medianStable: medianDrift < stability,
-    impactStable: impactDrift < stability,
-  };
+/** Log adaptive sampling progress at ~1s intervals. */
+function logProgress(
+  name: string,
+  convergence: ConvergenceResult,
+  elapsed: number,
+  lastLog: number,
+): number {
+  if (elapsed - lastLog <= 1000) return lastLog;
+  const sec = (elapsed / 1000).toFixed(1);
+  const conf = convergence.confidence.toFixed(0);
+  process.stderr.write(`\r◊ ${name}: ${conf}% confident (${sec}s)   `);
+  return elapsed;
 }
-/** @return convergence from stability metrics */
-function buildConvergence(metrics: Metrics): ConvergenceResult {
-  const { medianDrift, impactDrift, medianStable, impactStable } = metrics;
-  if (medianStable && impactStable) {
-    return {
-      converged: true,
-      confidence: 100,
-      reason: "Stable performance pattern",
-    };
-  }
-  const confidence = Math.min(
-    100,
-    (1 - medianDrift / stability) * 50 + (1 - impactDrift / stability) * 50,
+/** @return true if convergence target met, or minTime elapsed with fallback confidence. */
+function shouldStop(
+  convergence: ConvergenceResult,
+  target: number,
+  elapsed: number,
+  minElapsed: number,
+): boolean {
+  if (convergence.converged && convergence.confidence >= target) return true;
+  return (
+    elapsed >= minElapsed &&
+    convergence.confidence >= Math.max(target, fallbackThreshold)
   );
-  const reason =
-    medianDrift > impactDrift
-      ? `Median drifting: ${(medianDrift * 100).toFixed(1)}%`
-      : `Outlier impact changing: ${(impactDrift * 100).toFixed(1)}%`;
-  return { converged: false, confidence: Math.max(0, confidence), reason };
-}
-/** @return window size scaled to execution time */
-function getWindowSize(samples: number[]): number {
-  if (samples.length < 20) return windowSize; // Default for initial samples
-  const recentMs = samples.slice(-20).map(s => s / msToNs);
-  const recentMedian = percentile(recentMs, 0.5);
-  // Inverse scaling with execution time
-  if (recentMedian < 0.01) return 200; // <10μs
-  if (recentMedian < 0.1) return 100; // <100μs
-  if (recentMedian < 1) return 50; // <1ms
-  if (recentMedian < 10) return 30; // <10ms
-  return 20; // >10ms
 }