npm - benchforge - Versions diffs - 0.1.11 → 0.2.4 - Mend

benchforge 0.1.11 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (253)

package/LICENSE +20 -0
package/README.md +99 -294
package/bin/benchforge +1 -2
package/dist/AnalyzeArchive-8NCJhmhS.mjs +145 -0
package/dist/AnalyzeArchive-8NCJhmhS.mjs.map +1 -0
package/dist/BenchMatrix-BZVrBB_h.mjs +1050 -0
package/dist/BenchMatrix-BZVrBB_h.mjs.map +1 -0
package/dist/{BenchRunner-BzyUfiyB.d.mts → BenchRunner-DglX1NOn.d.mts} +119 -66
package/dist/CoverageSampler-D5T9DRqe.mjs +27 -0
package/dist/CoverageSampler-D5T9DRqe.mjs.map +1 -0
package/dist/Formatters-BWj3d4sv.mjs +95 -0
package/dist/Formatters-BWj3d4sv.mjs.map +1 -0
package/dist/{HeapSampler-B8dtKHn1.mjs → HeapSampler-Dq-hpXem.mjs} +4 -4
package/dist/HeapSampler-Dq-hpXem.mjs.map +1 -0
package/dist/RunBenchCLI-C17DrJz8.mjs +3075 -0
package/dist/RunBenchCLI-C17DrJz8.mjs.map +1 -0
package/dist/StatisticalUtils-BD92crgM.mjs +255 -0
package/dist/StatisticalUtils-BD92crgM.mjs.map +1 -0
package/dist/TimeSampler-Ds8n7l2B.mjs +29 -0
package/dist/TimeSampler-Ds8n7l2B.mjs.map +1 -0
package/dist/ViewerServer-BJhdnxlN.mjs +639 -0
package/dist/ViewerServer-BJhdnxlN.mjs.map +1 -0
package/dist/ViewerServer-CuMNdNBz.mjs +2 -0
package/dist/bin/benchforge.mjs +4 -5
package/dist/bin/benchforge.mjs.map +1 -1
package/dist/index.d.mts +711 -558
package/dist/index.mjs +98 -3
package/dist/index.mjs.map +1 -0
package/dist/runners/WorkerScript.d.mts +12 -4
package/dist/runners/WorkerScript.mjs +77 -105
package/dist/runners/WorkerScript.mjs.map +1 -1
package/dist/viewer/assets/CIPlot-BkOvMoMa.js +1 -0
package/dist/viewer/assets/HistogramKde-CmSyUFY0.js +1 -0
package/dist/viewer/assets/LegendUtils-BJpbn_jr.js +55 -0
package/dist/viewer/assets/SampleTimeSeries-C4VBhXr3.js +1 -0
package/dist/viewer/assets/index-Br9bp_cX.js +153 -0
package/dist/viewer/assets/index-NzXXe_CC.css +1 -0
package/dist/viewer/index.html +19 -0
package/dist/viewer/speedscope/LICENSE +21 -0
package/dist/viewer/speedscope/SourceCodePro-Regular.ttf-ILST5JV6.woff2 +0 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js +2 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js.map +7 -0
package/dist/viewer/speedscope/favicon-16x16-VSI62OPJ.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-3EB2YCUY.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js +2 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js.map +7 -0
package/dist/viewer/speedscope/favicon-FOKUP5Y5.ico +0 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js +2 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js.map +7 -0
package/dist/viewer/speedscope/file-format-schema.json +274 -0
package/dist/viewer/speedscope/index.html +19 -0
package/dist/viewer/speedscope/jfrview_bg-BLJXNNQB.wasm +0 -0
package/dist/viewer/speedscope/perf-vertx-stacks-01-collapsed-all-ZNUIGAJL.txt +199 -0
package/dist/viewer/speedscope/release.txt +3 -0
package/dist/viewer/speedscope/source-code-pro.LICENSE.md +93 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css +2 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css.map +7 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js +212 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js.map +7 -0
package/package.json +52 -27
package/src/bin/benchforge.ts +2 -2
package/src/cli/AnalyzeArchive.ts +232 -0
package/src/cli/BrowserBench.ts +322 -0
package/src/cli/CliArgs.ts +164 -51
package/src/cli/CliExport.ts +179 -0
package/src/cli/CliOptions.ts +147 -0
package/src/cli/CliReport.ts +197 -0
package/src/cli/FilterBenchmarks.ts +18 -30
package/src/cli/RunBenchCLI.ts +132 -866
package/src/cli/SuiteRunner.ts +160 -0
package/src/cli/ViewerServer.ts +282 -0
package/src/export/AllocExport.ts +121 -0
package/src/export/ArchiveExport.ts +146 -0
package/src/export/ArchiveFormat.ts +50 -0
package/src/export/CoverageExport.ts +148 -0
package/src/export/EditorUri.ts +10 -0
package/src/export/PerfettoExport.ts +64 -99
package/src/export/SpeedscopeTypes.ts +98 -0
package/src/export/TimeExport.ts +115 -0
package/src/index.ts +86 -67
package/src/matrix/BenchMatrix.ts +230 -0
package/src/matrix/CaseLoader.ts +8 -6
package/src/matrix/MatrixDirRunner.ts +153 -0
package/src/matrix/MatrixFilter.ts +49 -47
package/src/matrix/MatrixInlineRunner.ts +50 -0
package/src/matrix/MatrixReport.ts +90 -250
package/src/matrix/VariantLoader.ts +5 -5
package/src/profiling/browser/BenchLoop.ts +51 -0
package/src/profiling/browser/BrowserCDP.ts +133 -0
package/src/profiling/browser/BrowserGcStats.ts +33 -0
package/src/profiling/browser/BrowserProfiler.ts +160 -0
package/src/profiling/browser/CdpClient.ts +82 -0
package/src/profiling/browser/CdpPage.ts +138 -0
package/src/profiling/browser/ChromeLauncher.ts +158 -0
package/src/profiling/browser/ChromeTraceEvent.ts +28 -0
package/src/profiling/browser/PageLoadMode.ts +61 -0
package/src/profiling/node/CoverageSampler.ts +27 -0
package/src/profiling/node/CoverageTypes.ts +23 -0
package/src/profiling/node/HeapSampleReport.ts +261 -0
package/src/{heap-sample → profiling/node}/HeapSampler.ts +1 -2
package/src/{heap-sample → profiling/node}/ResolvedProfile.ts +18 -9
package/src/profiling/node/TimeSampler.ts +57 -0
package/src/report/BenchmarkReport.ts +146 -0
package/src/report/Colors.ts +9 -0
package/src/report/Formatters.ts +110 -0
package/src/report/GcSections.ts +151 -0
package/src/{GitUtils.ts → report/GitUtils.ts} +18 -19
package/src/report/HtmlReport.ts +223 -0
package/src/report/ParseStats.ts +73 -0
package/src/report/StandardSections.ts +147 -0
package/src/report/ViewerSections.ts +286 -0
package/src/report/text/TableReport.ts +253 -0
package/src/report/text/TextReport.ts +123 -0
package/src/runners/AdaptiveWrapper.ts +116 -236
package/src/runners/BenchRunner.ts +20 -15
package/src/{Benchmark.ts → runners/BenchmarkSpec.ts} +5 -6
package/src/runners/CreateRunner.ts +5 -7
package/src/runners/GcStats.ts +47 -50
package/src/{MeasuredResults.ts → runners/MeasuredResults.ts} +43 -37
package/src/runners/MergeBatches.ts +123 -0
package/src/{NodeGC.ts → runners/NodeGC.ts} +2 -3
package/src/runners/RunnerOrchestrator.ts +127 -243
package/src/runners/RunnerUtils.ts +75 -1
package/src/runners/SampleStats.ts +100 -0
package/src/runners/TimingRunner.ts +244 -0
package/src/runners/TimingUtils.ts +3 -2
package/src/runners/WorkerScript.ts +135 -151
package/src/stats/BootstrapDifference.ts +282 -0
package/src/{PermutationTest.ts → stats/PermutationTest.ts} +8 -17
package/src/stats/StatisticalUtils.ts +445 -0
package/src/{tests → test}/AdaptiveConvergence.test.ts +10 -10
package/src/test/AdaptiveRunner.test.ts +39 -41
package/src/{tests → test}/AdaptiveSampling.test.ts +9 -9
package/src/test/AdaptiveStatistics.integration.ts +2 -2
package/src/{tests → test}/BenchMatrix.test.ts +19 -16
package/src/test/BenchmarkReport.test.ts +63 -13
package/src/test/BrowserBench.e2e.test.ts +186 -17
package/src/test/BrowserBench.test.ts +10 -5
package/src/test/BuildTimeSection.test.ts +130 -0
package/src/test/CapSamples.test.ts +82 -0
package/src/test/CoverageExport.test.ts +115 -0
package/src/test/CoverageSampler.test.ts +33 -0
package/src/test/HeapAttribution.test.ts +14 -14
package/src/{tests → test}/MatrixFilter.test.ts +1 -1
package/src/{tests → test}/MatrixReport.test.ts +1 -1
package/src/test/PermutationTest.test.ts +1 -1
package/src/{tests → test}/RealDataValidation.test.ts +6 -6
package/src/test/RunBenchCLI.test.ts +39 -38
package/src/test/RunnerOrchestrator.test.ts +12 -12
package/src/test/StatisticalUtils.test.ts +48 -12
package/src/{table-util/test → test}/TableReport.test.ts +2 -2
package/src/test/TestUtils.ts +12 -7
package/src/test/TimeExport.test.ts +139 -0
package/src/test/TimeSampler.test.ts +37 -0
package/src/test/ViewerLive.e2e.test.ts +159 -0
package/src/test/ViewerStatic.static.e2e.test.ts +137 -0
package/src/{tests → test}/fixtures/baseline/impl.ts +1 -1
package/src/{tests → test}/fixtures/bevy30-samples.ts +3 -1
package/src/test/fixtures/cases/asyncCases.ts +9 -0
package/src/{tests → test}/fixtures/cases/cases.ts +5 -2
package/src/test/fixtures/cases/variants/product.ts +2 -0
package/src/test/fixtures/cases/variants/sum.ts +2 -0
package/src/test/fixtures/discover/fast.ts +1 -0
package/src/{tests → test}/fixtures/discover/slow.ts +1 -1
package/src/test/fixtures/invalid/bad.ts +1 -0
package/src/test/fixtures/loader/fast.ts +1 -0
package/src/{tests → test}/fixtures/loader/slow.ts +1 -1
package/src/test/fixtures/loader/stateful.ts +2 -0
package/src/test/fixtures/stateful/stateful.ts +2 -0
package/src/test/fixtures/variants/extra.ts +1 -0
package/src/test/fixtures/variants/impl.ts +1 -0
package/src/test/fixtures/worker/fast.ts +1 -0
package/src/{tests → test}/fixtures/worker/slow.ts +1 -1
package/src/viewer/DateFormat.ts +30 -0
package/src/viewer/Helpers.ts +23 -0
package/src/viewer/LineData.ts +120 -0
package/src/viewer/Providers.ts +191 -0
package/src/viewer/ReportData.ts +123 -0
package/src/viewer/State.ts +49 -0
package/src/viewer/Theme.ts +15 -0
package/src/viewer/components/App.tsx +73 -0
package/src/viewer/components/DropZone.tsx +71 -0
package/src/viewer/components/LazyPlot.ts +33 -0
package/src/viewer/components/SamplesPanel.tsx +214 -0
package/src/viewer/components/Shell.tsx +26 -0
package/src/viewer/components/SourcePanel.tsx +216 -0
package/src/viewer/components/SummaryPanel.tsx +332 -0
package/src/viewer/components/TabBar.tsx +131 -0
package/src/viewer/components/TabContent.tsx +46 -0
package/src/viewer/components/ThemeToggle.tsx +50 -0
package/src/viewer/index.html +20 -0
package/src/viewer/main.tsx +4 -0
package/src/viewer/plots/CIPlot.ts +313 -0
package/src/{html/browser → viewer/plots}/HistogramKde.ts +33 -38
package/src/viewer/plots/LegendUtils.ts +134 -0
package/src/viewer/plots/PlotTypes.ts +85 -0
package/src/viewer/plots/RenderPlots.ts +230 -0
package/src/viewer/plots/SampleTimeSeries.ts +306 -0
package/src/viewer/plots/SvgHelpers.ts +136 -0
package/src/viewer/plots/TimeSeriesMarks.ts +319 -0
package/src/viewer/report.css +427 -0
package/src/viewer/shell.css +357 -0
package/src/viewer/tsconfig.json +11 -0
package/dist/BrowserHeapSampler-B6asLKWQ.mjs +0 -202
package/dist/BrowserHeapSampler-B6asLKWQ.mjs.map +0 -1
package/dist/GcStats-wX7Xyblu.mjs +0 -77
package/dist/GcStats-wX7Xyblu.mjs.map +0 -1
package/dist/HeapSampler-B8dtKHn1.mjs.map +0 -1
package/dist/TimingUtils-DwOwkc8G.mjs +0 -597
package/dist/TimingUtils-DwOwkc8G.mjs.map +0 -1
package/dist/browser/index.js +0 -914
package/dist/src-B-DDaCa9.mjs +0 -3108
package/dist/src-B-DDaCa9.mjs.map +0 -1
package/src/BenchMatrix.ts +0 -380
package/src/BenchmarkReport.ts +0 -161
package/src/HtmlDataPrep.ts +0 -148
package/src/StandardSections.ts +0 -261
package/src/StatisticalUtils.ts +0 -175
package/src/TypeUtil.ts +0 -8
package/src/browser/BrowserGcStats.ts +0 -44
package/src/browser/BrowserHeapSampler.ts +0 -271
package/src/export/JsonExport.ts +0 -103
package/src/export/JsonFormat.ts +0 -91
package/src/export/SpeedscopeExport.ts +0 -202
package/src/heap-sample/HeapSampleReport.ts +0 -269
package/src/html/HtmlReport.ts +0 -131
package/src/html/HtmlTemplate.ts +0 -284
package/src/html/Types.ts +0 -88
package/src/html/browser/CIPlot.ts +0 -287
package/src/html/browser/LegendUtils.ts +0 -163
package/src/html/browser/RenderPlots.ts +0 -263
package/src/html/browser/SampleTimeSeries.ts +0 -389
package/src/html/browser/Types.ts +0 -96
package/src/html/browser/index.ts +0 -1
package/src/html/index.ts +0 -17
package/src/runners/BasicRunner.ts +0 -364
package/src/table-util/ConvergenceFormatters.ts +0 -19
package/src/table-util/Formatters.ts +0 -157
package/src/table-util/README.md +0 -70
package/src/table-util/TableReport.ts +0 -293
package/src/tests/fixtures/cases/asyncCases.ts +0 -7
package/src/tests/fixtures/cases/variants/product.ts +0 -2
package/src/tests/fixtures/cases/variants/sum.ts +0 -2
package/src/tests/fixtures/discover/fast.ts +0 -1
package/src/tests/fixtures/invalid/bad.ts +0 -1
package/src/tests/fixtures/loader/fast.ts +0 -1
package/src/tests/fixtures/loader/stateful.ts +0 -2
package/src/tests/fixtures/stateful/stateful.ts +0 -2
package/src/tests/fixtures/variants/extra.ts +0 -1
package/src/tests/fixtures/variants/impl.ts +0 -1
package/src/tests/fixtures/worker/fast.ts +0 -1
package/src/{table-util/test → test}/TableValueExtractor.test.ts +0 -0
package/src/{table-util/test → test}/TableValueExtractor.ts +0 -0

package/src/runners/AdaptiveWrapper.ts CHANGED Viewed

@@ -1,19 +1,22 @@
-import type { BenchmarkSpec } from "../Benchmark.ts";
-import type { MeasuredResults } from "../MeasuredResults.ts";
-import {
-  coefficientOfVariation,
-  medianAbsoluteDeviation,
-  percentile,
-} from "../StatisticalUtils.ts";
+import { median } from "../stats/StatisticalUtils.ts";
+import type { BenchmarkSpec } from "./BenchmarkSpec.ts";
 import type { BenchRunner, RunnerOptions } from "./BenchRunner.ts";
+import type { MeasuredResults } from "./MeasuredResults.ts";
 import { msToNs } from "./RunnerUtils.ts";
+import { computeStats, outlierImpactRatio } from "./SampleStats.ts";
+/** Options for adaptive sampling: collects until statistical convergence or timeout. */
 export interface AdaptiveOptions extends RunnerOptions {
+  /** Enable adaptive sampling (default: true when using adaptive runner) */
   adaptive?: boolean;
+  /** Minimum measurement time in ms before convergence can stop sampling (default: 1000) */
   minTime?: number;
+  /** Maximum measurement time in ms, hard stop (default: 10000) */
   maxTime?: number;
+  /** Target confidence percentage to stop early (default: 95) */
   targetConfidence?: number;
-  convergence?: number; // Confidence threshold (0-100)
+  /** Confidence threshold 0-100 (alias for targetConfidence) */
+  convergence?: number;
 }
 type Metrics = {
@@ -39,101 +42,85 @@ const initialBatch = 100;
 const continueBatch = 100;
 const continueIterations = 10;
-/** @return adaptive sampling runner wrapper */
+/** Wrap a runner with adaptive sampling (convergence detection or timeout). */
 export function createAdaptiveWrapper(
   baseRunner: BenchRunner,
   options: AdaptiveOptions,
 ): BenchRunner {
   return {
     async runBench<T = unknown>(
-      benchmark: BenchmarkSpec<T>,
-      runnerOptions: RunnerOptions,
+      bench: BenchmarkSpec<T>,
+      opts: RunnerOptions,
       params?: T,
     ): Promise<MeasuredResults[]> {
-      return runAdaptiveBench(
-        baseRunner,
-        benchmark,
-        runnerOptions,
-        options,
-        params,
-      );
+      return runAdaptiveBench(baseRunner, bench, opts, options, params);
     },
   };
 }
-/** @return convergence based on window stability */
+/** Check convergence by comparing sliding windows of samples for stability. */
 export function checkConvergence(samples: number[]): ConvergenceResult {
   const windowSize = getWindowSize(samples);
   const minSamples = windowSize * 2;
   if (samples.length < minSamples) {
-    return buildProgressResult(samples.length, minSamples);
+    const confidence = (samples.length / minSamples) * 100;
+    const reason = `Collecting samples: ${samples.length}/${minSamples}`;
+    return { converged: false, confidence, reason };
   }
-  const metrics = getStability(samples, windowSize);
-  return buildConvergence(metrics);
+  return buildConvergence(getStability(samples, windowSize));
 }
-/** @return results using adaptive sampling strategy */
+/** Run benchmark with adaptive sampling until convergence or timeout. */
 async function runAdaptiveBench<T>(
-  baseRunner: BenchRunner,
-  benchmark: BenchmarkSpec<T>,
-  runnerOptions: RunnerOptions,
-  options: AdaptiveOptions,
+  runner: BenchRunner,
+  bench: BenchmarkSpec<T>,
+  opts: RunnerOptions,
+  adaptive: AdaptiveOptions,
   params?: T,
 ): Promise<MeasuredResults[]> {
-  const {
-    minTime: min = options.minTime ?? minTime,
-    maxTime: max = options.maxTime ?? maxTime,
-    targetConfidence: target = options.convergence ?? targetConfidence,
-  } = runnerOptions as AdaptiveOptions;
+  const overrides = opts as AdaptiveOptions;
+  const min = overrides.minTime ?? adaptive.minTime ?? minTime;
+  const max = overrides.maxTime ?? adaptive.maxTime ?? maxTime;
+  const target =
+    overrides.convergence ?? adaptive.convergence ?? targetConfidence;
   const allSamples: number[] = [];
-  // Collect initial batch (includes warmup + settle)
-  const warmup = await collectInitial(
-    baseRunner,
-    benchmark,
-    runnerOptions,
+  const { warmup, startTime: hrtimeStart } = await collectInitial(
+    runner,
+    bench,
+    opts,
     params,
     allSamples,
   );
-  // Start timing AFTER warmup - warmup time doesn't count against maxTime
+  // Start timing after warmup so warmup time doesn't count against maxTime
   const startTime = performance.now();
   const limits = {
     minTime: min,
     maxTime: max,
     targetConfidence: target,
     startTime,
   };
-  await collectAdaptive(
-    baseRunner,
-    benchmark,
-    runnerOptions,
-    params,
-    allSamples,
-    limits,
-  );
+  await collectAdaptive(runner, bench, opts, params, allSamples, limits);
-  const convergence = checkConvergence(allSamples.map(s => s * msToNs));
+  const samplesNs = allSamples.map(s => s * msToNs);
+  const convergence = checkConvergence(samplesNs);
   return buildResults(
     allSamples,
     startTime,
     convergence,
-    benchmark.name,
+    bench.name,
     warmup,
+    hrtimeStart,
   );
 }
-/** @return window size scaled to execution time */
+/** Scale window size inversely with execution time -- fast ops need more samples. */
 function getWindowSize(samples: number[]): number {
-  if (samples.length < 20) return windowSize; // Default for initial samples
+  if (samples.length < 20) return windowSize;
   const recentMs = samples.slice(-20).map(s => s / msToNs);
-  const recentMedian = percentile(recentMs, 0.5);
+  const recentMedian = median(recentMs);
-  // Inverse scaling with execution time
   if (recentMedian < 0.01) return 200; // <10μs
   if (recentMedian < 0.1) return 100; // <100μs
   if (recentMedian < 1) return 50; // <1ms
@@ -141,91 +128,67 @@ function getWindowSize(samples: number[]): number {
   return 20; // >10ms
 }
-/** @return progress when samples insufficient */
-function buildProgressResult(
-  currentSamples: number,
-  minSamples: number,
-): ConvergenceResult {
-  return {
-    converged: false,
-    confidence: (currentSamples / minSamples) * 100,
-    reason: `Collecting samples: ${currentSamples}/${minSamples}`,
-  };
-}
-/** @return stability metrics between windows */
-function getStability(samples: number[], windowSize: number): Metrics {
-  const recent = samples.slice(-windowSize);
-  const previous = samples.slice(-windowSize * 2, -windowSize);
-  const recentMs = recent.map(s => s / msToNs);
-  const previousMs = previous.map(s => s / msToNs);
-  const medianRecent = percentile(recentMs, 0.5);
-  const medianPrevious = percentile(previousMs, 0.5);
-  const medianDrift = Math.abs(medianRecent - medianPrevious) / medianPrevious;
-  const impactRecent = getOutlierImpact(recentMs);
-  const impactPrevious = getOutlierImpact(previousMs);
-  const impactDrift = Math.abs(impactRecent.ratio - impactPrevious.ratio);
-  return {
-    medianDrift,
-    impactDrift,
-    medianStable: medianDrift < stability,
-    impactStable: impactDrift < stability,
-  };
-}
-/** @return convergence from stability metrics */
+/** Convert stability metrics to a convergence result with confidence score. */
 function buildConvergence(metrics: Metrics): ConvergenceResult {
   const { medianDrift, impactDrift, medianStable, impactStable } = metrics;
-  if (medianStable && impactStable) {
+  if (medianStable && impactStable)
     return {
       converged: true,
       confidence: 100,
       reason: "Stable performance pattern",
     };
-  }
-  const confidence = Math.min(
-    100,
-    (1 - medianDrift / stability) * 50 + (1 - impactDrift / stability) * 50,
-  );
+  const raw =
+    (1 - medianDrift / stability) * 50 + (1 - impactDrift / stability) * 50;
+  const confidence = Math.max(0, Math.min(100, raw));
   const reason =
     medianDrift > impactDrift
       ? `Median drifting: ${(medianDrift * 100).toFixed(1)}%`
       : `Outlier impact changing: ${(impactDrift * 100).toFixed(1)}%`;
+  return { converged: false, confidence, reason };
+}
+/** Compare median and outlier-impact drift between recent and previous windows. */
+function getStability(samples: number[], windowSize: number): Metrics {
+  const toMs = (s: number) => s / msToNs;
+  const recentMs = samples.slice(-windowSize).map(toMs);
+  const previousMs = samples.slice(-windowSize * 2, -windowSize).map(toMs);
-  return { converged: false, confidence: Math.max(0, confidence), reason };
+  const medianRecent = median(recentMs);
+  const medianPrevious = median(previousMs);
+  const medianDrift = Math.abs(medianRecent - medianPrevious) / medianPrevious;
+  const impactRecent = outlierImpactRatio(recentMs);
+  const impactPrevious = outlierImpactRatio(previousMs);
+  const impactDrift = Math.abs(impactRecent - impactPrevious);
+  const medianStable = medianDrift < stability;
+  const impactStable = impactDrift < stability;
+  return { medianDrift, impactDrift, medianStable, impactStable };
 }
-/** @return warmupSamples from initial batch */
+/** Collect the initial batch (warmup + settle), returning warmup samples. */
 async function collectInitial<T>(
-  baseRunner: BenchRunner,
-  benchmark: BenchmarkSpec<T>,
-  runnerOptions: RunnerOptions,
+  runner: BenchRunner,
+  bench: BenchmarkSpec<T>,
+  opts: RunnerOptions,
   params: T | undefined,
   allSamples: number[],
-): Promise<number[] | undefined> {
-  // Don't pass adaptive flag to base runner to avoid double wrapping
-  const opts = {
-    ...(runnerOptions as any),
+): Promise<{ warmup?: number[]; startTime?: number }> {
+  const batchOpts = {
+    ...(opts as any),
     maxTime: initialBatch,
     maxIterations: undefined,
   };
-  const results = await baseRunner.runBench(benchmark, opts, params);
+  const results = await runner.runBench(bench, batchOpts, params);
   appendSamples(results[0], allSamples);
-  return results[0].warmupSamples;
+  return { warmup: results[0].warmupSamples, startTime: results[0].startTime };
 }
-/** @return samples until convergence or timeout */
+/** Collect batches until convergence or timeout, with progress logging. */
 async function collectAdaptive<T>(
-  baseRunner: BenchRunner,
-  benchmark: BenchmarkSpec<T>,
-  runnerOptions: RunnerOptions,
+  runner: BenchRunner,
+  bench: BenchmarkSpec<T>,
+  opts: RunnerOptions,
   params: T | undefined,
   allSamples: number[],
   limits: {
@@ -242,150 +205,67 @@ async function collectAdaptive<T>(
     const convergence = checkConvergence(samplesNs);
     const elapsed = performance.now() - startTime;
-    if (elapsed - lastLog > 1000) {
-      const elapsedSec = (elapsed / 1000).toFixed(1);
-      const conf = convergence.confidence.toFixed(0);
-      process.stderr.write(
-        `\r◊ ${benchmark.name}: ${conf}% confident (${elapsedSec}s)   `,
-      );
-      lastLog = elapsed;
-    }
-    if (shouldStop(convergence, targetConfidence, elapsed, minTime)) {
-      break;
-    }
+    lastLog = logProgress(bench.name, convergence, elapsed, lastLog);
+    if (shouldStop(convergence, targetConfidence, elapsed, minTime)) break;
-    // Skip warmup for continuation batches (warmup done in initial batch)
-    const opts = {
-      ...(runnerOptions as any),
+    const batch = {
+      ...(opts as any),
       maxTime: continueBatch,
       maxIterations: continueIterations,
       skipWarmup: true,
     };
-    const batchResults = await baseRunner.runBench(benchmark, opts, params);
-    appendSamples(batchResults[0], allSamples);
+    const results = await runner.runBench(bench, batch, params);
+    appendSamples(results[0], allSamples);
   }
   process.stderr.write("\r" + " ".repeat(60) + "\r");
 }
-/** @return measured results with convergence metrics */
+/** Build final MeasuredResults from collected samples and convergence state. */
 function buildResults(
-  samplesMs: number[],
-  startTime: number,
+  samples: number[],
+  elapsedStart: number,
   convergence: ConvergenceResult,
   name: string,
   warmupSamples?: number[],
+  startTime?: number,
 ): MeasuredResults[] {
-  const totalTime = (performance.now() - startTime) / 1000;
-  const samplesNs = samplesMs.map(s => s * msToNs);
-  const timeStats = computeTimeStats(samplesNs);
+  const totalTime = (performance.now() - elapsedStart) / 1000;
+  const time = computeStats(samples);
   return [
-    {
-      name,
-      samples: samplesMs,
-      warmupSamples,
-      time: timeStats,
-      totalTime,
-      convergence,
-    },
+    { name, samples, warmupSamples, time, totalTime, startTime, convergence },
   ];
 }
-/** @return outlier impact as proportion of total time */
-function getOutlierImpact(samples: number[]): { ratio: number; count: number } {
-  if (samples.length === 0) return { ratio: 0, count: 0 };
-  const median = percentile(samples, 0.5);
-  const q75 = percentile(samples, 0.75);
-  const threshold = median + 1.5 * (q75 - median);
-  let excessTime = 0;
-  let count = 0;
-  for (const sample of samples) {
-    if (sample > threshold) {
-      excessTime += sample - median;
-      count++;
-    }
-  }
-  const totalTime = samples.reduce((a, b) => a + b, 0);
-  return {
-    ratio: totalTime > 0 ? excessTime / totalTime : 0,
-    count,
-  };
-}
-/** Append samples one-by-one to avoid stack overflow from spread on large arrays */
+/** Append samples one-by-one to avoid stack overflow from spread on large arrays. */
 function appendSamples(result: MeasuredResults, samples: number[]): void {
   if (!result.samples?.length) return;
   for (const sample of result.samples) samples.push(sample);
 }
-/** @return true if convergence reached or timeout */
-function shouldStop(
+/** Log adaptive sampling progress at ~1s intervals. */
+function logProgress(
+  name: string,
   convergence: ConvergenceResult,
-  targetConfidence: number,
-  elapsedTime: number,
-  minTime: number,
-): boolean {
-  if (convergence.converged && convergence.confidence >= targetConfidence) {
-    return true;
-  }
-  // After minTime, accept whichever is higher: targetConfidence or fallbackThreshold
-  const threshold = Math.max(targetConfidence, fallbackThreshold);
-  return elapsedTime >= minTime && convergence.confidence >= threshold;
+  elapsed: number,
+  lastLog: number,
+): number {
+  if (elapsed - lastLog <= 1000) return lastLog;
+  const sec = (elapsed / 1000).toFixed(1);
+  const conf = convergence.confidence.toFixed(0);
+  process.stderr.write(`\r◊ ${name}: ${conf}% confident (${sec}s)   `);
+  return elapsed;
 }
-/** @return time percentiles and statistics in ms */
-function computeTimeStats(samplesNs: number[]) {
-  const samplesMs = samplesNs.map(s => s / msToNs);
-  const { min, max, sum } = getMinMaxSum(samplesNs);
-  const percentiles = getPercentiles(samplesNs);
-  const robust = getRobustMetrics(samplesMs);
-  return {
-    min: min / msToNs,
-    max: max / msToNs,
-    avg: sum / samplesNs.length / msToNs,
-    ...percentiles,
-    ...robust,
-  };
-}
-/** @return min, max, sum of samples */
-function getMinMaxSum(samples: number[]) {
-  const min = samples.reduce(
-    (a, b) => Math.min(a, b),
-    Number.POSITIVE_INFINITY,
-  );
-  const max = samples.reduce(
-    (a, b) => Math.max(a, b),
-    Number.NEGATIVE_INFINITY,
+/** @return true if convergence target met, or minTime elapsed with fallback confidence. */
+function shouldStop(
+  convergence: ConvergenceResult,
+  target: number,
+  elapsed: number,
+  minElapsed: number,
+): boolean {
+  if (convergence.converged && convergence.confidence >= target) return true;
+  return (
+    elapsed >= minElapsed &&
+    convergence.confidence >= Math.max(target, fallbackThreshold)
   );
-  const sum = samples.reduce((a, b) => a + b, 0);
-  return { min, max, sum };
-}
-/** @return percentiles in ms */
-function getPercentiles(samples: number[]) {
-  return {
-    p25: percentile(samples, 0.25) / msToNs,
-    p50: percentile(samples, 0.5) / msToNs,
-    p75: percentile(samples, 0.75) / msToNs,
-    p95: percentile(samples, 0.95) / msToNs,
-    p99: percentile(samples, 0.99) / msToNs,
-    p999: percentile(samples, 0.999) / msToNs,
-  };
-}
-/** @return robust variability metrics */
-function getRobustMetrics(samplesMs: number[]) {
-  const impact = getOutlierImpact(samplesMs);
-  return {
-    cv: coefficientOfVariation(samplesMs),
-    mad: medianAbsoluteDeviation(samplesMs),
-    outlierRate: impact.ratio,
-  };
 }

package/src/runners/BenchRunner.ts CHANGED Viewed

@@ -1,7 +1,7 @@
-import type { BenchmarkSpec } from "../Benchmark.ts";
-import type { MeasuredResults } from "../MeasuredResults.ts";
+import type { BenchmarkSpec } from "./BenchmarkSpec.ts";
+import type { MeasuredResults } from "./MeasuredResults.ts";
-/** Interface for benchmark execution libraries */
+/** Benchmark execution strategy that collects timing samples. */
 export interface BenchRunner {
   runBench<T = unknown>(
     benchmark: BenchmarkSpec<T>,
@@ -10,6 +10,7 @@ export interface BenchRunner {
   ): Promise<MeasuredResults[]>;
 }
+/** Configuration for benchmark execution: timing limits, warmup, profiling, and V8 options. */
 export interface RunnerOptions {
   /** Minimum time to run each benchmark (milliseconds) */
   minTime?: number;
@@ -28,13 +29,11 @@ export interface RunnerOptions {
   /** Minimum samples required - mitata only */
   minSamples?: number;
   /** Force GC after each iteration (requires --expose-gc) */
-  collect?: boolean;
-  /** Enable CPU performance counters (requires root access) */
-  cpuCounters?: boolean;
+  gcForce?: boolean;
   /** Trace V8 optimization tiers (requires --allow-natives-syntax) */
   traceOpt?: boolean;
-  /** Skip post-warmup settle time (default: false) */
-  noSettle?: boolean;
+  /** Post-warmup settle time in ms for V8 background compilation (0 to skip) */
+  pauseWarmup?: number;
   /** Iterations before first pause (then pauseInterval applies) */
   pauseFirst?: number;
   /** Iterations between pauses for V8 optimization (0 to disable) */
@@ -43,15 +42,21 @@ export interface RunnerOptions {
   pauseDuration?: number;
   /** Collect GC stats via --trace-gc-nvp (requires worker mode) */
   gcStats?: boolean;
-  /** Heap sampling allocation attribution */
-  heapSample?: boolean;
-  /** Heap sampling interval in bytes */
-  heapInterval?: number;
-  /** Heap sampling stack depth */
-  heapDepth?: number;
+  /** Allocation sampling attribution */
+  alloc?: boolean;
+  /** Allocation sampling interval in bytes */
+  allocInterval?: number;
+  /** Allocation sampling stack depth */
+  allocDepth?: number;
+  /** V8 CPU time sampling */
+  profile?: boolean;
+  /** CPU sampling interval in microseconds (default 1000) */
+  profileInterval?: number;
+  /** Collect per-function execution counts via V8 precise coverage */
+  callCounts?: boolean;
 }
-/** Execute benchmark with optional parameters */
+/** Invoke the benchmark function, forwarding setup params. */
 export function executeBenchmark<T>(
   benchmark: BenchmarkSpec<T>,
   params?: T,

package/src/{Benchmark.ts → runners/BenchmarkSpec.ts} RENAMED Viewed

@@ -1,4 +1,4 @@
-/** Single benchmark function specification */
+/** Benchmark function with optional module path for worker-mode serialization. */
 export interface BenchmarkSpec<T = unknown> {
   name: string;
   fn: BenchmarkFunction<T>;
@@ -10,23 +10,22 @@ export interface BenchmarkSpec<T = unknown> {
   setupExportName?: string;
 }
+/** Benchmark function, optionally receiving setup parameters from the group. */
 export type BenchmarkFunction<T = unknown> =
   | ((params: T) => void)
   | (() => void);
-/** Group of benchmarks with shared setup */
+/** Group of benchmarks with shared setup and optional baseline. */
 export interface BenchGroup<T = unknown> {
   name: string;
-  /** Prepare parameters for all benchmarks in this group */
   setup?: () => T | Promise<T>;
   benchmarks: BenchmarkSpec<T>[];
-  /** Baseline benchmark for comparison */
   baseline?: BenchmarkSpec<T>;
-  /** Metadata for reporting (e.g., lines of code) */
+  /** Metadata for reporting (e.g. lines of code). */
   metadata?: Record<string, any>;
 }
-/** Collection of benchmark groups */
+/** Named collection of benchmark groups. */
 export interface BenchSuite {
   name: string;
   groups: BenchGroup<any>[];

package/src/runners/CreateRunner.ts CHANGED Viewed

@@ -1,11 +1,9 @@
-import { BasicRunner } from "./BasicRunner.ts";
 import type { BenchRunner } from "./BenchRunner.ts";
+import { TimingRunner } from "./TimingRunner.ts";
-export type KnownRunner = "basic";
+export type KnownRunner = "timing";
-/** @return benchmark runner */
-export async function createRunner(
-  _runnerName: KnownRunner,
-): Promise<BenchRunner> {
-  return new BasicRunner();
+/** Create a benchmark runner by name. */
+export async function createRunner(_name: KnownRunner): Promise<BenchRunner> {
+  return new TimingRunner();
 }