npm - benchforge - Versions diffs - 0.1.11 → 0.2.4 - Mend

benchforge 0.1.11 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (253) hide show

package/LICENSE +20 -0
package/README.md +99 -294
package/bin/benchforge +1 -2
package/dist/AnalyzeArchive-8NCJhmhS.mjs +145 -0
package/dist/AnalyzeArchive-8NCJhmhS.mjs.map +1 -0
package/dist/BenchMatrix-BZVrBB_h.mjs +1050 -0
package/dist/BenchMatrix-BZVrBB_h.mjs.map +1 -0
package/dist/{BenchRunner-BzyUfiyB.d.mts → BenchRunner-DglX1NOn.d.mts} +119 -66
package/dist/CoverageSampler-D5T9DRqe.mjs +27 -0
package/dist/CoverageSampler-D5T9DRqe.mjs.map +1 -0
package/dist/Formatters-BWj3d4sv.mjs +95 -0
package/dist/Formatters-BWj3d4sv.mjs.map +1 -0
package/dist/{HeapSampler-B8dtKHn1.mjs → HeapSampler-Dq-hpXem.mjs} +4 -4
package/dist/HeapSampler-Dq-hpXem.mjs.map +1 -0
package/dist/RunBenchCLI-C17DrJz8.mjs +3075 -0
package/dist/RunBenchCLI-C17DrJz8.mjs.map +1 -0
package/dist/StatisticalUtils-BD92crgM.mjs +255 -0
package/dist/StatisticalUtils-BD92crgM.mjs.map +1 -0
package/dist/TimeSampler-Ds8n7l2B.mjs +29 -0
package/dist/TimeSampler-Ds8n7l2B.mjs.map +1 -0
package/dist/ViewerServer-BJhdnxlN.mjs +639 -0
package/dist/ViewerServer-BJhdnxlN.mjs.map +1 -0
package/dist/ViewerServer-CuMNdNBz.mjs +2 -0
package/dist/bin/benchforge.mjs +4 -5
package/dist/bin/benchforge.mjs.map +1 -1
package/dist/index.d.mts +711 -558
package/dist/index.mjs +98 -3
package/dist/index.mjs.map +1 -0
package/dist/runners/WorkerScript.d.mts +12 -4
package/dist/runners/WorkerScript.mjs +77 -105
package/dist/runners/WorkerScript.mjs.map +1 -1
package/dist/viewer/assets/CIPlot-BkOvMoMa.js +1 -0
package/dist/viewer/assets/HistogramKde-CmSyUFY0.js +1 -0
package/dist/viewer/assets/LegendUtils-BJpbn_jr.js +55 -0
package/dist/viewer/assets/SampleTimeSeries-C4VBhXr3.js +1 -0
package/dist/viewer/assets/index-Br9bp_cX.js +153 -0
package/dist/viewer/assets/index-NzXXe_CC.css +1 -0
package/dist/viewer/index.html +19 -0
package/dist/viewer/speedscope/LICENSE +21 -0
package/dist/viewer/speedscope/SourceCodePro-Regular.ttf-ILST5JV6.woff2 +0 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js +2 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js.map +7 -0
package/dist/viewer/speedscope/favicon-16x16-VSI62OPJ.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-3EB2YCUY.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js +2 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js.map +7 -0
package/dist/viewer/speedscope/favicon-FOKUP5Y5.ico +0 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js +2 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js.map +7 -0
package/dist/viewer/speedscope/file-format-schema.json +274 -0
package/dist/viewer/speedscope/index.html +19 -0
package/dist/viewer/speedscope/jfrview_bg-BLJXNNQB.wasm +0 -0
package/dist/viewer/speedscope/perf-vertx-stacks-01-collapsed-all-ZNUIGAJL.txt +199 -0
package/dist/viewer/speedscope/release.txt +3 -0
package/dist/viewer/speedscope/source-code-pro.LICENSE.md +93 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css +2 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css.map +7 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js +212 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js.map +7 -0
package/package.json +52 -27
package/src/bin/benchforge.ts +2 -2
package/src/cli/AnalyzeArchive.ts +232 -0
package/src/cli/BrowserBench.ts +322 -0
package/src/cli/CliArgs.ts +164 -51
package/src/cli/CliExport.ts +179 -0
package/src/cli/CliOptions.ts +147 -0
package/src/cli/CliReport.ts +197 -0
package/src/cli/FilterBenchmarks.ts +18 -30
package/src/cli/RunBenchCLI.ts +132 -866
package/src/cli/SuiteRunner.ts +160 -0
package/src/cli/ViewerServer.ts +282 -0
package/src/export/AllocExport.ts +121 -0
package/src/export/ArchiveExport.ts +146 -0
package/src/export/ArchiveFormat.ts +50 -0
package/src/export/CoverageExport.ts +148 -0
package/src/export/EditorUri.ts +10 -0
package/src/export/PerfettoExport.ts +64 -99
package/src/export/SpeedscopeTypes.ts +98 -0
package/src/export/TimeExport.ts +115 -0
package/src/index.ts +86 -67
package/src/matrix/BenchMatrix.ts +230 -0
package/src/matrix/CaseLoader.ts +8 -6
package/src/matrix/MatrixDirRunner.ts +153 -0
package/src/matrix/MatrixFilter.ts +49 -47
package/src/matrix/MatrixInlineRunner.ts +50 -0
package/src/matrix/MatrixReport.ts +90 -250
package/src/matrix/VariantLoader.ts +5 -5
package/src/profiling/browser/BenchLoop.ts +51 -0
package/src/profiling/browser/BrowserCDP.ts +133 -0
package/src/profiling/browser/BrowserGcStats.ts +33 -0
package/src/profiling/browser/BrowserProfiler.ts +160 -0
package/src/profiling/browser/CdpClient.ts +82 -0
package/src/profiling/browser/CdpPage.ts +138 -0
package/src/profiling/browser/ChromeLauncher.ts +158 -0
package/src/profiling/browser/ChromeTraceEvent.ts +28 -0
package/src/profiling/browser/PageLoadMode.ts +61 -0
package/src/profiling/node/CoverageSampler.ts +27 -0
package/src/profiling/node/CoverageTypes.ts +23 -0
package/src/profiling/node/HeapSampleReport.ts +261 -0
package/src/{heap-sample → profiling/node}/HeapSampler.ts +1 -2
package/src/{heap-sample → profiling/node}/ResolvedProfile.ts +18 -9
package/src/profiling/node/TimeSampler.ts +57 -0
package/src/report/BenchmarkReport.ts +146 -0
package/src/report/Colors.ts +9 -0
package/src/report/Formatters.ts +110 -0
package/src/report/GcSections.ts +151 -0
package/src/{GitUtils.ts → report/GitUtils.ts} +18 -19
package/src/report/HtmlReport.ts +223 -0
package/src/report/ParseStats.ts +73 -0
package/src/report/StandardSections.ts +147 -0
package/src/report/ViewerSections.ts +286 -0
package/src/report/text/TableReport.ts +253 -0
package/src/report/text/TextReport.ts +123 -0
package/src/runners/AdaptiveWrapper.ts +116 -236
package/src/runners/BenchRunner.ts +20 -15
package/src/{Benchmark.ts → runners/BenchmarkSpec.ts} +5 -6
package/src/runners/CreateRunner.ts +5 -7
package/src/runners/GcStats.ts +47 -50
package/src/{MeasuredResults.ts → runners/MeasuredResults.ts} +43 -37
package/src/runners/MergeBatches.ts +123 -0
package/src/{NodeGC.ts → runners/NodeGC.ts} +2 -3
package/src/runners/RunnerOrchestrator.ts +127 -243
package/src/runners/RunnerUtils.ts +75 -1
package/src/runners/SampleStats.ts +100 -0
package/src/runners/TimingRunner.ts +244 -0
package/src/runners/TimingUtils.ts +3 -2
package/src/runners/WorkerScript.ts +135 -151
package/src/stats/BootstrapDifference.ts +282 -0
package/src/{PermutationTest.ts → stats/PermutationTest.ts} +8 -17
package/src/stats/StatisticalUtils.ts +445 -0
package/src/{tests → test}/AdaptiveConvergence.test.ts +10 -10
package/src/test/AdaptiveRunner.test.ts +39 -41
package/src/{tests → test}/AdaptiveSampling.test.ts +9 -9
package/src/test/AdaptiveStatistics.integration.ts +2 -2
package/src/{tests → test}/BenchMatrix.test.ts +19 -16
package/src/test/BenchmarkReport.test.ts +63 -13
package/src/test/BrowserBench.e2e.test.ts +186 -17
package/src/test/BrowserBench.test.ts +10 -5
package/src/test/BuildTimeSection.test.ts +130 -0
package/src/test/CapSamples.test.ts +82 -0
package/src/test/CoverageExport.test.ts +115 -0
package/src/test/CoverageSampler.test.ts +33 -0
package/src/test/HeapAttribution.test.ts +14 -14
package/src/{tests → test}/MatrixFilter.test.ts +1 -1
package/src/{tests → test}/MatrixReport.test.ts +1 -1
package/src/test/PermutationTest.test.ts +1 -1
package/src/{tests → test}/RealDataValidation.test.ts +6 -6
package/src/test/RunBenchCLI.test.ts +39 -38
package/src/test/RunnerOrchestrator.test.ts +12 -12
package/src/test/StatisticalUtils.test.ts +48 -12
package/src/{table-util/test → test}/TableReport.test.ts +2 -2
package/src/test/TestUtils.ts +12 -7
package/src/test/TimeExport.test.ts +139 -0
package/src/test/TimeSampler.test.ts +37 -0
package/src/test/ViewerLive.e2e.test.ts +159 -0
package/src/test/ViewerStatic.static.e2e.test.ts +137 -0
package/src/{tests → test}/fixtures/baseline/impl.ts +1 -1
package/src/{tests → test}/fixtures/bevy30-samples.ts +3 -1
package/src/test/fixtures/cases/asyncCases.ts +9 -0
package/src/{tests → test}/fixtures/cases/cases.ts +5 -2
package/src/test/fixtures/cases/variants/product.ts +2 -0
package/src/test/fixtures/cases/variants/sum.ts +2 -0
package/src/test/fixtures/discover/fast.ts +1 -0
package/src/{tests → test}/fixtures/discover/slow.ts +1 -1
package/src/test/fixtures/invalid/bad.ts +1 -0
package/src/test/fixtures/loader/fast.ts +1 -0
package/src/{tests → test}/fixtures/loader/slow.ts +1 -1
package/src/test/fixtures/loader/stateful.ts +2 -0
package/src/test/fixtures/stateful/stateful.ts +2 -0
package/src/test/fixtures/variants/extra.ts +1 -0
package/src/test/fixtures/variants/impl.ts +1 -0
package/src/test/fixtures/worker/fast.ts +1 -0
package/src/{tests → test}/fixtures/worker/slow.ts +1 -1
package/src/viewer/DateFormat.ts +30 -0
package/src/viewer/Helpers.ts +23 -0
package/src/viewer/LineData.ts +120 -0
package/src/viewer/Providers.ts +191 -0
package/src/viewer/ReportData.ts +123 -0
package/src/viewer/State.ts +49 -0
package/src/viewer/Theme.ts +15 -0
package/src/viewer/components/App.tsx +73 -0
package/src/viewer/components/DropZone.tsx +71 -0
package/src/viewer/components/LazyPlot.ts +33 -0
package/src/viewer/components/SamplesPanel.tsx +214 -0
package/src/viewer/components/Shell.tsx +26 -0
package/src/viewer/components/SourcePanel.tsx +216 -0
package/src/viewer/components/SummaryPanel.tsx +332 -0
package/src/viewer/components/TabBar.tsx +131 -0
package/src/viewer/components/TabContent.tsx +46 -0
package/src/viewer/components/ThemeToggle.tsx +50 -0
package/src/viewer/index.html +20 -0
package/src/viewer/main.tsx +4 -0
package/src/viewer/plots/CIPlot.ts +313 -0
package/src/{html/browser → viewer/plots}/HistogramKde.ts +33 -38
package/src/viewer/plots/LegendUtils.ts +134 -0
package/src/viewer/plots/PlotTypes.ts +85 -0
package/src/viewer/plots/RenderPlots.ts +230 -0
package/src/viewer/plots/SampleTimeSeries.ts +306 -0
package/src/viewer/plots/SvgHelpers.ts +136 -0
package/src/viewer/plots/TimeSeriesMarks.ts +319 -0
package/src/viewer/report.css +427 -0
package/src/viewer/shell.css +357 -0
package/src/viewer/tsconfig.json +11 -0
package/dist/BrowserHeapSampler-B6asLKWQ.mjs +0 -202
package/dist/BrowserHeapSampler-B6asLKWQ.mjs.map +0 -1
package/dist/GcStats-wX7Xyblu.mjs +0 -77
package/dist/GcStats-wX7Xyblu.mjs.map +0 -1
package/dist/HeapSampler-B8dtKHn1.mjs.map +0 -1
package/dist/TimingUtils-DwOwkc8G.mjs +0 -597
package/dist/TimingUtils-DwOwkc8G.mjs.map +0 -1
package/dist/browser/index.js +0 -914
package/dist/src-B-DDaCa9.mjs +0 -3108
package/dist/src-B-DDaCa9.mjs.map +0 -1
package/src/BenchMatrix.ts +0 -380
package/src/BenchmarkReport.ts +0 -161
package/src/HtmlDataPrep.ts +0 -148
package/src/StandardSections.ts +0 -261
package/src/StatisticalUtils.ts +0 -175
package/src/TypeUtil.ts +0 -8
package/src/browser/BrowserGcStats.ts +0 -44
package/src/browser/BrowserHeapSampler.ts +0 -271
package/src/export/JsonExport.ts +0 -103
package/src/export/JsonFormat.ts +0 -91
package/src/export/SpeedscopeExport.ts +0 -202
package/src/heap-sample/HeapSampleReport.ts +0 -269
package/src/html/HtmlReport.ts +0 -131
package/src/html/HtmlTemplate.ts +0 -284
package/src/html/Types.ts +0 -88
package/src/html/browser/CIPlot.ts +0 -287
package/src/html/browser/LegendUtils.ts +0 -163
package/src/html/browser/RenderPlots.ts +0 -263
package/src/html/browser/SampleTimeSeries.ts +0 -389
package/src/html/browser/Types.ts +0 -96
package/src/html/browser/index.ts +0 -1
package/src/html/index.ts +0 -17
package/src/runners/BasicRunner.ts +0 -364
package/src/table-util/ConvergenceFormatters.ts +0 -19
package/src/table-util/Formatters.ts +0 -157
package/src/table-util/README.md +0 -70
package/src/table-util/TableReport.ts +0 -293
package/src/tests/fixtures/cases/asyncCases.ts +0 -7
package/src/tests/fixtures/cases/variants/product.ts +0 -2
package/src/tests/fixtures/cases/variants/sum.ts +0 -2
package/src/tests/fixtures/discover/fast.ts +0 -1
package/src/tests/fixtures/invalid/bad.ts +0 -1
package/src/tests/fixtures/loader/fast.ts +0 -1
package/src/tests/fixtures/loader/stateful.ts +0 -2
package/src/tests/fixtures/stateful/stateful.ts +0 -2
package/src/tests/fixtures/variants/extra.ts +0 -1
package/src/tests/fixtures/variants/impl.ts +0 -1
package/src/tests/fixtures/worker/fast.ts +0 -1
/package/src/{table-util/test → test}/TableValueExtractor.test.ts +0 -0
/package/src/{table-util/test → test}/TableValueExtractor.ts +0 -0

package/src/stats/StatisticalUtils.ts ADDED Viewed

@@ -0,0 +1,445 @@
+/** Whether CI was computed from block-level or sample-level resampling */
+export type CILevel = "block" | "sample";
+/**
+ * Stat descriptor for multi-bootstrap: known stat kinds enable zero-alloc inner loops.
+ * The object form selects a percentile; its `percentile` value is handed
+ * unchanged to percentile(), which documents p as a fraction in 0-1.
+ */
+export type StatKind = "mean" | "min" | "max" | { percentile: number };
+/** Bootstrap estimate with confidence interval and raw resample distribution */
+export interface BootstrapResult {
+  /** Point estimate from the original sample */
+  estimate: number;
+  /** Confidence interval [lower, upper] from bootstrap resampling */
+  ci: [number, number];
+  /** Bootstrap resample distribution (for visualization): one statistic value per resample */
+  samples: number[];
+  /** Block-level (between-run) or sample-level (within-run) resampling */
+  ciLevel: CILevel;
+  /** Original sample count before subsampling (set only when cap applied) */
+  subsampled?: number;
+}
+export type CIDirection = "faster" | "slower" | "uncertain" | "equivalent"; // verdict labels; swapDirection exchanges faster/slower and keeps the other two
+/** Binned histogram for efficient transfer to browser */
+export interface HistogramBin {
+  /** Bin center value */
+  x: number;
+  count: number; // presumably how many bootstrap values fall in this bin — the producer is not in this file, confirm there
+}
+/**
+ * Bootstrap confidence interval for percentage difference between two sample medians.
+ * Used for baseline comparisons: negative percent means current is faster.
+ * NOTE(review): the `label` example below mentions a mean, so the compared
+ * statistic may not always be the median — confirm against the code that
+ * builds these objects (not in this file).
+ */
+export interface DifferenceCI {
+  /** Observed percentage difference (current - baseline) / baseline */
+  percent: number;
+  /** Confidence interval [lower, upper] in percent */
+  ci: [number, number];
+  /**
+   * Whether the CI excludes zero: "faster", "slower", or "uncertain".
+   * The CIDirection type also allows "equivalent"; how that value gets
+   * assigned is not shown in this file.
+   */
+  direction: CIDirection;
+  /** Bootstrap distribution histogram for visualization */
+  histogram?: HistogramBin[];
+  /** Label for the CI plot title (e.g. "mean Δ%") */
+  label?: string;
+  /** Blocks trimmed per side [baseline, current] via Tukey fences */
+  trimmed?: [number, number];
+  /** Block-level (between-run) or sample-level (within-run) resampling */
+  ciLevel?: CILevel;
+  /** false when batch count is too low for reliable CI */
+  ciReliable?: boolean;
+  /** Original sample count before subsampling (set only when cap applied) */
+  subsampled?: number;
+}
+/** Options for bootstrap resampling */
+type BootstrapOptions = {
+  /** Number of bootstrap resamples (default: 10000) */
+  resamples?: number;
+  /** Confidence level 0-1 (default: 0.95) */
+  confidence?: number;
+};
+interface StatOp { // one scheduled statistic inside multiSampleBootstrap (built by buildStatOps)
+  origIndex: number; // position of this stat in the caller's `stats` array; used to restore caller order
+  compute: (buf: number[]) => number; // evaluated on the shared resample buffer each iteration
+  pointEstimate: (s: number[]) => number; // evaluated once on the original samples
+}
+export const defaultConfidence = 0.95; // confidence level used when options.confidence is omitted
+export const bootstrapSamples = 10000; // resample count used when options.resamples is omitted
+export const maxBootstrapInput = 10_000; // inputs longer than this are randomly subsampled before sample-level bootstrap
+const outlierMultiplier = 1.5; // IQR multiplier that findOutliers passes to tukeyFences
+/**
+ * Exchange the "faster" and "slower" labels for higher-is-better metrics
+ * (positive = faster). "uncertain" and "equivalent" are left as they are.
+ * @return a shallow copy of `ci` in which only `direction` may differ
+ */
+export function swapDirection(ci: DifferenceCI): DifferenceCI {
+  const { direction } = ci;
+  let swapped: CIDirection = direction;
+  if (direction === "faster") swapped = "slower";
+  else if (direction === "slower") swapped = "faster";
+  return { ...ci, direction: swapped };
+}
+/**
+ * Mirror a difference CI around zero for "higher is better" metrics
+ * (e.g., throughput): percent is negated, the interval bounds are negated and
+ * exchanged so the lower bound stays first, and histogram bin centers are negated.
+ * @return a shallow copy of `ci`; `direction` is not touched
+ */
+export function flipCI(ci: DifferenceCI): DifferenceCI {
+  const [lower, upper] = ci.ci;
+  const mirrored = ci.histogram?.map(({ x, count }) => ({ x: -x, count }));
+  return {
+    ...ci,
+    percent: -ci.percent,
+    ci: [-upper, -lower],
+    histogram: mirrored,
+  };
+}
+/**
+ * Evaluate the statistic named by `kind` on `samples`.
+ * String kinds dispatch to average/minOf/maxOf; the object form dispatches to
+ * percentile() with its `percentile` fraction.
+ */
+export function computeStat(samples: number[], kind: StatKind): number {
+  switch (kind) {
+    case "mean":
+      return average(samples);
+    case "min":
+      return minOf(samples);
+    case "max":
+      return maxOf(samples);
+    default:
+      return percentile(samples, kind.percentile);
+  }
+}
+/** @return false for the extreme stats "min" and "max" (no bootstrap CI), true for every other kind */
+export function isBootstrappable(kind: StatKind): boolean {
+  const isExtreme = kind === "min" || kind === "max";
+  return !isExtreme;
+}
+/**
+ * @return smallest value in samples. Scans with a plain loop instead of
+ * Math.min(...samples) to avoid spread-argument limits on large arrays.
+ */
+export function minOf(samples: number[]): number {
+  let smallest = samples[0];
+  for (const value of samples) {
+    if (value < smallest) smallest = value;
+  }
+  return smallest;
+}
+/**
+ * @return largest value in samples. Scans with a plain loop instead of
+ * Math.max(...samples) to avoid spread-argument limits on large arrays.
+ */
+export function maxOf(samples: number[]): number {
+  let largest = samples[0];
+  for (const value of samples) {
+    if (value > largest) largest = value;
+  }
+  return largest;
+}
+/**
+ * @return coefficient of variation: standard deviation divided by the mean.
+ * A mean of exactly zero yields 0 instead of dividing by zero.
+ */
+export function coefficientOfVariation(samples: number[]): number {
+  const mean = average(samples);
+  return mean === 0 ? 0 : standardDeviation(samples) / mean;
+}
+/**
+ * @return median absolute deviation: the median of each sample's absolute
+ * distance from the sample median (a robust variability measure)
+ */
+export function medianAbsoluteDeviation(samples: number[]): number {
+  const center = median(samples);
+  const distances: number[] = [];
+  for (const value of samples) {
+    distances.push(Math.abs(value - center));
+  }
+  return median(distances);
+}
+/**
+ * Detect outliers with Tukey's interquartile range method, using the
+ * module-level outlierMultiplier as the IQR multiplier.
+ * @param samples values to inspect (not modified)
+ * @return `indices` of the values strictly outside the fences, and `rate`, the
+ *   fraction of samples flagged. An empty input yields rate 0 instead of NaN.
+ */
+export function findOutliers(samples: number[]): {
+  rate: number;
+  indices: number[];
+} {
+  // Guard the division below: with no samples it would be 0/0 and return NaN.
+  if (samples.length === 0) return { rate: 0, indices: [] };
+  const [lo, hi] = tukeyFences(samples, outlierMultiplier);
+  const indices = samples.flatMap((v, i) => (v < lo || v > hi ? [i] : []));
+  return { rate: indices.length / samples.length, indices };
+}
+/**
+ * Sample-level bootstrap CI: draw individual samples with replacement and
+ * evaluate `statFn` on every draw.
+ * Inputs longer than maxBootstrapInput are randomly subsampled first; the
+ * point estimate is still taken from the full input, and `subsampled` then
+ * records the original length.
+ */
+export function sampleBootstrap(
+  samples: number[],
+  statFn: (s: number[]) => number,
+  options: BootstrapOptions = {},
+): BootstrapResult {
+  const { resamples: rounds = bootstrapSamples } = options;
+  const { confidence = defaultConfidence } = options;
+  const pool = subsample(samples, maxBootstrapInput);
+  const scratch = new Array(pool.length);
+  // One resample per call; the scratch buffer is reused across calls.
+  const drawStat = (): number => {
+    resampleInto(pool, scratch);
+    return statFn(scratch);
+  };
+  const distribution = Array.from({ length: rounds }, drawStat);
+  const result: BootstrapResult = {
+    estimate: statFn(samples),
+    ci: computeInterval(distribution, confidence),
+    samples: distribution,
+    ciLevel: "sample",
+  };
+  if (pool !== samples) result.subsampled = samples.length;
+  return result;
+}
+/** Shared-resample bootstrap: one resample per iteration, all stats computed on it.
+ *  Mean is computed first (non-destructive), then percentiles via in-place quickSelect.
+ *
+ *  @param samples original observations; inputs longer than maxBootstrapInput are
+ *    randomly subsampled before resampling
+ *  @param stats statistics to bootstrap
+ *  @param options resample count and confidence level (defaults: bootstrapSamples,
+ *    defaultConfidence)
+ *  @return one result per entry of `stats`, in the caller's order; every result has
+ *    ciLevel "sample", and `subsampled` is set only when the input was capped */
+export function multiSampleBootstrap(
+  samples: number[],
+  stats: StatKind[],
+  options: BootstrapOptions = {},
+): BootstrapResult[] {
+  const { resamples = bootstrapSamples, confidence: conf = defaultConfidence } =
+    options;
+  const sub = subsample(samples, maxBootstrapInput);
+  const n = sub.length;
+  const buf = new Array(n); // scratch buffer, refilled on every iteration
+  const ops = buildStatOps(stats, n); // sorted: mean/min/max before percentiles
+  const allStats = ops.map(() => new Array<number>(resamples)); // allStats[j][i] = op j on resample i
+  for (let i = 0; i < resamples; i++) {
+    resampleInto(sub, buf);
+    for (let j = 0; j < ops.length; j++) {
+      allStats[j][i] = ops[j].compute(buf);
+    }
+  }
+  const capped = sub !== samples; // subsample returns the same array when no cap was needed
+  const results = new Array<BootstrapResult>(stats.length);
+  for (let j = 0; j < ops.length; j++) {
+    results[ops[j].origIndex] = { // write back at the caller's original position
+      estimate: ops[j].pointEstimate(samples), // point estimate uses the full, un-capped input
+      ci: computeInterval(allStats[j], conf),
+      samples: allStats[j],
+      ciLevel: "sample",
+      ...(capped && { subsampled: samples.length }),
+    };
+  }
+  return results;
+}
+/**
+ * Bootstrap CIs for several stats at once.
+ * With two or more batch offsets each bootstrappable stat goes through
+ * blockBootstrap; otherwise all of them share one multiSampleBootstrap run.
+ * @return array aligned with `stats`; entries for non-bootstrappable stats
+ *   (min/max) are undefined
+ */
+export function bootstrapCIs(
+  samples: number[],
+  batchOffsets: number[] | undefined,
+  stats: StatKind[],
+  options?: BootstrapOptions,
+): (BootstrapResult | undefined)[] {
+  const eligible = stats.filter(isBootstrappable);
+  if (eligible.length === 0) return stats.map(() => undefined);
+  const blockCount = batchOffsets?.length ?? 0;
+  let computed: BootstrapResult[];
+  if (blockCount >= 2) {
+    computed = eligible.map(kind =>
+      blockBootstrap(samples, batchOffsets!, statKindToFn(kind), options),
+    );
+  } else {
+    computed = multiSampleBootstrap(samples, eligible, options);
+  }
+  // `computed` follows the order of the eligible stats; consume it in sequence.
+  let next = 0;
+  return stats.map(kind =>
+    isBootstrappable(kind) ? computed[next++] : undefined,
+  );
+}
+/**
+ * Map a StatKind to the function that computes it.
+ * @return average, minOf or maxOf for the string kinds; for the object form,
+ *   a closure calling percentile() with the fraction captured at call time
+ */
+export function statKindToFn(kind: StatKind): (s: number[]) => number {
+  switch (kind) {
+    case "mean":
+      return average;
+    case "min":
+      return minOf;
+    case "max":
+      return maxOf;
+    default: {
+      const fraction = kind.percentile;
+      return (s: number[]) => percentile(s, fraction);
+    }
+  }
+}
+/**
+ * Block bootstrap CI. Outlier batches are Tukey-trimmed by prepareBlocks, then
+ * the per-block statFn values are resampled as independent observations and
+ * each resample is averaged. Requires 2+ blocks.
+ * The point estimate is statFn over the samples of the kept blocks.
+ */
+export function blockBootstrap(
+  samples: number[],
+  blocks: number[],
+  statFn: (s: number[]) => number,
+  options: BootstrapOptions = {},
+): BootstrapResult {
+  const { resamples: rounds = bootstrapSamples } = options;
+  const { confidence = defaultConfidence } = options;
+  const { blockVals, filtered } = prepareBlocks(samples, blocks, statFn);
+  const drawMean = (): number => average(createResample(blockVals));
+  const distribution = Array.from({ length: rounds }, drawMean);
+  return {
+    estimate: statFn(filtered),
+    ci: computeInterval(distribution, confidence),
+    samples: distribution,
+    ciLevel: "block",
+  };
+}
+/** @return arithmetic mean of values (NaN for an empty array, since 0 / 0) */
+export function average(values: number[]): number {
+  let total = 0;
+  values.forEach(v => {
+    total += v;
+  });
+  return total / values.length;
+}
+/** @return the 50th percentile of values, as computed by percentile() */
+export function median(values: number[]): number {
+  const midpoint = 0.5;
+  return percentile(values, midpoint);
+}
+/**
+ * @return sample standard deviation (Bessel's correction: divides by n - 1);
+ * 0 when there are fewer than two samples
+ */
+export function standardDeviation(samples: number[]): number {
+  const n = samples.length;
+  if (n <= 1) return 0;
+  const mean = average(samples);
+  let squares = 0;
+  samples.forEach(x => {
+    squares += (x - mean) ** 2;
+  });
+  return Math.sqrt(squares / (n - 1));
+}
+/**
+ * @return value at percentile p (0-1), found with O(N) quickselect on a copy,
+ * so `values` is left untouched. The rank is ceil(n * p) - 1, floored at 0.
+ */
+export function percentile(values: number[], p: number): number {
+  const scratch = values.slice();
+  const rank = Math.ceil(scratch.length * p) - 1;
+  const k = rank < 0 ? 0 : rank;
+  return quickSelect(scratch, k);
+}
+/** Hoare's selection: O(N) average k-th smallest element. Mutates arr.
+ *  @param arr values to select from; reordered in place by partition()
+ *  @param k zero-based rank of the wanted element (no bounds check is done here)
+ *  @return arr[k] once the search window has closed around k */
+export function quickSelect(arr: number[], k: number): number {
+  let lo = 0;
+  let hi = arr.length - 1;
+  while (lo < hi) {
+    const [i, j] = partition(arr, lo, hi); // partition returns with j < i
+    if (k <= j) hi = j; // rank k is in the left part: shrink the window to lo..j
+    else if (k >= i) lo = i; // rank k is in the right part: shrink the window to i..hi
+    else break; // j < k < i: neither side needs narrowing, stop
+  }
+  return arr[k];
+}
+/**
+ * Overwrite the first source.length slots of `buf` with values drawn
+ * uniformly at random, with replacement, from `source` (a bootstrap resample).
+ * Nothing is allocated; `buf` is written in place.
+ */
+export function resampleInto(source: number[], buf: number[]): void {
+  const size = source.length;
+  let slot = 0;
+  while (slot < size) {
+    const pick = Math.floor(Math.random() * size);
+    buf[slot] = source[pick];
+    slot += 1;
+  }
+}
+/** @return new array of samples.length values drawn from samples with replacement */
+export function createResample(samples: number[]): number[] {
+  const size = samples.length;
+  const drawn: number[] = [];
+  for (let i = 0; i < size; i++) {
+    drawn.push(samples[Math.floor(Math.random() * size)]);
+  }
+  return drawn;
+}
+/**
+ * @return Tukey fence bounds [lo, hi]: the quartiles pushed outward by
+ * `multiplier` times the IQR. `minIqr` is a floor on the IQR so the fences do
+ * not collapse when values are tightly clustered.
+ */
+export function tukeyFences(
+  values: number[],
+  multiplier = 3,
+  minIqr = 0,
+): [lo: number, hi: number] {
+  const lowerQuartile = percentile(values, 0.25);
+  const upperQuartile = percentile(values, 0.75);
+  const spread = Math.max(upperQuartile - lowerQuartile, minIqr);
+  const reach = multiplier * spread;
+  return [lowerQuartile - reach, upperQuartile + reach];
+}
+/**
+ * @return indices of values at or below the upper 3x IQR Tukey fence.
+ * Only slow outliers are trimmed — fast batches reflect less environmental
+ * noise, not errors. The IQR is floored at 2% of the median to avoid
+ * over-trimming tightly clustered batch means. With fewer than 4 values
+ * every index is kept.
+ */
+export function tukeyKeep(values: number[]): number[] {
+  if (values.length < 4) return Array.from(values, (_, i) => i);
+  const iqrFloor = median(values) * 0.02;
+  const upper = tukeyFences(values, 3, iqrFloor)[1];
+  const kept: number[] = [];
+  values.forEach((v, i) => {
+    if (v <= upper) kept.push(i);
+  });
+  return kept;
+}
+/**
+ * @return one slice of samples per offset: block i starts at offsets[i] and
+ * ends where the next block starts (the last block runs to the end of samples)
+ */
+export function splitByOffsets(
+  samples: number[],
+  offsets: number[],
+): number[][] {
+  const blocks: number[][] = [];
+  for (let b = 0; b < offsets.length; b++) {
+    const isLast = b === offsets.length - 1;
+    const stop = isLast ? samples.length : offsets[b + 1];
+    blocks.push(samples.slice(offsets[b], stop));
+  }
+  return blocks;
+}
+/** @return `fn` applied to each block obtained by splitting samples at offsets */
+export function blockValues(
+  samples: number[],
+  offsets: number[],
+  fn: (s: number[]) => number,
+): number[] {
+  const blocks = splitByOffsets(samples, offsets);
+  return blocks.map(fn);
+}
+/**
+ * Split one side's samples into blocks, drop outlier blocks (judged on block
+ * means via tukeyKeep, unless `noTrim` is set) and evaluate `fn` per kept block.
+ * @return blockVals: fn of each kept block; filtered: samples of the kept
+ *   blocks, concatenated; trimCount: number of blocks dropped
+ */
+export function prepareBlocks(
+  samples: number[],
+  offsets: number[],
+  fn: (s: number[]) => number,
+  noTrim?: boolean,
+): { blockVals: number[]; filtered: number[]; trimCount: number } {
+  const blocks = splitByOffsets(samples, offsets);
+  const blockMeans = blocks.map(average);
+  const kept = noTrim ? blockMeans.map((_, i) => i) : tukeyKeep(blockMeans);
+  const blockVals = kept.map(i => fn(blocks[i]));
+  const filtered = kept.flatMap(i => blocks[i]);
+  const trimCount = blockMeans.length - kept.length;
+  return { blockVals, filtered, trimCount };
+}
+/**
+ * Random subsample without replacement (partial Fisher-Yates on a copy).
+ * @return the original array itself when it has at most `max` elements,
+ *   otherwise a new array of `max` randomly chosen elements
+ */
+export function subsample(samples: number[], max: number): number[] {
+  const total = samples.length;
+  if (total <= max) return samples;
+  const shuffled = samples.slice();
+  for (let i = 0; i < max; i++) {
+    const j = i + Math.floor(Math.random() * (total - i));
+    const picked = shuffled[j];
+    shuffled[j] = shuffled[i];
+    shuffled[i] = picked;
+  }
+  return shuffled.slice(0, max);
+}
+/**
+ * @return percentile confidence interval [lower, upper]: the (1 - conf) / 2
+ * and 1 - (1 - conf) / 2 percentiles of values
+ */
+export function computeInterval(
+  values: number[],
+  conf: number,
+): [number, number] {
+  const tail = (1 - conf) / 2;
+  const lower = percentile(values, tail);
+  const upper = percentile(values, 1 - tail);
+  return [lower, upper];
+}
+/** Build stat operations in safe order: mean/min/max first (non-destructive),
+ *  then percentiles ascending (use quickSelect which mutates buf)
+ *  @param stats requested statistics, in caller order
+ *  @param n length of the resample buffer; used to precompute each percentile's rank
+ *  @return ops sorted by `order`; `origIndex` keeps each op's position in `stats` */
+function buildStatOps(stats: StatKind[], n: number): StatOp[] {
+  const simple = (order: number, i: number, fn: (s: number[]) => number) => ({ // for stats whose compute and pointEstimate are the same function
+    order,
+    compute: fn,
+    pointEstimate: fn,
+    origIndex: i,
+  });
+  const ops = stats.map((s, i): StatOp & { order: number } => {
+    if (s === "mean") return simple(-3, i, average); // fixed negative orders: -3, -2, -1
+    if (s === "min") return simple(-2, i, minOf);
+    if (s === "max") return simple(-1, i, maxOf);
+    const p = s.percentile;
+    const k = Math.max(0, Math.ceil(n * p) - 1); // same rank formula as percentile(), computed once for length n
+    return {
+      order: p, // percentile ops sort by their fraction
+      origIndex: i,
+      compute: (buf: number[]) => quickSelect(buf, k), // reorders buf in place
+      pointEstimate: (v: number[]) => percentile(v, p), // percentile() works on a copy of v
+    };
+  });
+  ops.sort((a, b) => a.order - b.order);
+  return ops;
+}
+/** Hoare partition around the midpoint pivot. @return [i, j] boundary indices.
+ *  Reorders arr[lo..hi] in place. The scan loop runs while i <= j, so the
+ *  returned pair always satisfies j < i. */
+function partition(arr: number[], lo: number, hi: number): [number, number] {
+  const pivot = arr[lo + ((hi - lo) >> 1)]; // pivot value read from the middle index of lo..hi
+  let i = lo;
+  let j = hi;
+  while (i <= j) {
+    while (arr[i] < pivot) i++; // skip values already smaller than the pivot
+    while (arr[j] > pivot) j--; // skip values already larger than the pivot
+    if (i <= j) {
+      [arr[i], arr[j]] = [arr[j], arr[i]]; // swap the out-of-place pair, then step both cursors
+      i++;
+      j--;
+    }
+  }
+  return [i, j];
+}

package/src/{tests → test}/AdaptiveConvergence.test.ts RENAMED Viewed

@@ -2,7 +2,7 @@ import { test } from "vitest";
 import { checkConvergence } from "../runners/AdaptiveWrapper.ts";
 import { bevy30SamplesNs } from "./fixtures/bevy30-samples.ts";
-test("convergence with insufficient samples", () => {
+test.skip("convergence with insufficient samples", () => {
   const samples = [1e6, 2e6, 3e6]; // 3 samples in nanoseconds
   const result = checkConvergence(samples);
@@ -14,7 +14,7 @@ test("convergence with insufficient samples", () => {
   }
 });
-test("convergence with stable samples", () => {
+test.skip("convergence with stable samples", () => {
   // Create very stable samples (all within 1% of each other)
   const base = 50e6; // 50ms in nanoseconds
   const samples = Array.from(
@@ -30,7 +30,7 @@ test("convergence with stable samples", () => {
   }
 });
-test("convergence with drifting median", () => {
+test.skip("convergence with drifting median", () => {
   // Create samples with increasing median over time
   const samples = Array.from(
     { length: 200 },
@@ -48,7 +48,7 @@ test("convergence with drifting median", () => {
   }
 });
-test("convergence with outliers", () => {
+test.skip("convergence with outliers", () => {
   // Create stable samples with occasional outliers every 20 samples
   const base = 50e6;
   const samples = Array.from({ length: 200 }, (_, i) =>
@@ -63,7 +63,7 @@ test("convergence with outliers", () => {
   }
 });
-test("convergence with real bevy30 data - early samples", () => {
+test.skip("convergence with real bevy30 data - early samples", () => {
   // Test with first 100 samples (should show initial instability)
   const early = bevy30SamplesNs.slice(0, 100);
   const result = checkConvergence(early);
@@ -78,7 +78,7 @@ test("convergence with real bevy30 data - early samples", () => {
   );
 });
-test("convergence with real bevy30 data - middle samples", () => {
+test.skip("convergence with real bevy30 data - middle samples", () => {
   // Test with middle 200 samples (should be more stable)
   const middle = bevy30SamplesNs.slice(200, 400);
   const result = checkConvergence(middle);
@@ -92,7 +92,7 @@ test("convergence with real bevy30 data - middle samples", () => {
   );
 });
-test("convergence with real bevy30 data - all samples", () => {
+test.skip("convergence with real bevy30 data - all samples", () => {
   const result = checkConvergence(bevy30SamplesNs);
   if (result.confidence > 100 || result.confidence < 0) {
@@ -109,7 +109,7 @@ test("convergence with real bevy30 data - all samples", () => {
   );
 });
-test("convergence progression over time", () => {
+test.skip("convergence progression over time", () => {
   const checkpoints = [50, 100, 150, 200, 300, 400, 500, 610];
   const progressions = checkpoints.map(n => {
     const result = checkConvergence(bevy30SamplesNs.slice(0, n));
@@ -132,7 +132,7 @@ test("convergence progression over time", () => {
   }
 });
-test("window size adaptation for different execution times", () => {
+test.skip("window size adaptation for different execution times", () => {
   // Fast samples (microseconds)
   const fastSamples = Array.from(
     { length: 100 },
@@ -155,7 +155,7 @@ test("window size adaptation for different execution times", () => {
   }
 });
-test("outlier impact calculation", () => {
+test.skip("outlier impact calculation", () => {
   // 95 stable samples + 5 outliers (2x slower)
   const base = 50e6; // 50ms
   const stable = Array.from(

package/src/test/AdaptiveRunner.test.ts CHANGED Viewed

@@ -1,42 +1,40 @@
 import { expect, test } from "vitest";
-import type { BenchmarkSpec } from "../Benchmark.ts";
 import {
   checkConvergence,
   createAdaptiveWrapper,
 } from "../runners/AdaptiveWrapper.ts";
-import { BasicRunner } from "../runners/BasicRunner.ts";
-test(
-  "adaptive runner collects samples for minimum time",
-  { timeout: 10000 },
-  async () => {
-    const runner = new BasicRunner();
-    const adaptive = createAdaptiveWrapper(runner, {
-      minTime: 100,
-      maxTime: 300,
-    });
-    const benchmark: BenchmarkSpec = {
-      name: "test-min-time",
-      fn: () => {
-        let sum = 0;
-        for (let i = 0; i < 1000; i++) sum += i;
-        return sum;
-      },
-    };
-    const start = performance.now();
-    const results = await adaptive.runBench(benchmark, { minTime: 100 });
-    const elapsed = performance.now() - start;
-    expect(results).toHaveLength(1);
-    expect(results[0].samples.length).toBeGreaterThan(0);
-    expect(elapsed).toBeGreaterThanOrEqual(100);
-  },
-);
-test("adaptive runner respects max time limit", async () => {
-  const runner = new BasicRunner();
+import type { BenchmarkSpec } from "../runners/BenchmarkSpec.ts";
+import { TimingRunner } from "../runners/TimingRunner.ts";
+test.skip("adaptive runner collects samples for minimum time", {
+  timeout: 10000,
+}, async () => {
+  const runner = new TimingRunner();
+  const adaptive = createAdaptiveWrapper(runner, {
+    minTime: 100,
+    maxTime: 300,
+  });
+  const benchmark: BenchmarkSpec = {
+    name: "test-min-time",
+    fn: () => {
+      let sum = 0;
+      for (let i = 0; i < 1000; i++) sum += i;
+      return sum;
+    },
+  };
+  const start = performance.now();
+  const results = await adaptive.runBench(benchmark, { minTime: 100 });
+  const elapsed = performance.now() - start;
+  expect(results).toHaveLength(1);
+  expect(results[0].samples.length).toBeGreaterThan(0);
+  expect(elapsed).toBeGreaterThanOrEqual(100);
+});
+test.skip("adaptive runner respects max time limit", async () => {
+  const runner = new TimingRunner();
   const adaptive = createAdaptiveWrapper(runner, {
     minTime: 100,
     maxTime: 2000,
@@ -62,8 +60,8 @@ test("adaptive runner respects max time limit", async () => {
   expect(results[0].totalTime).toBeLessThanOrEqual(2.0);
 });
-test("adaptive runner merges results correctly", async () => {
-  const runner = new BasicRunner();
+test.skip("adaptive runner merges results correctly", async () => {
+  const runner = new TimingRunner();
   const adaptive = createAdaptiveWrapper(runner, {
     minTime: 100,
     maxTime: 200,
@@ -101,8 +99,8 @@ test("adaptive runner merges results correctly", async () => {
   expect(result.totalTime).toBeGreaterThan(0);
 }, 10000);
-test("convergence detection with stable benchmark", async () => {
-  const runner = new BasicRunner();
+test.skip("convergence detection with stable benchmark", async () => {
+  const runner = new TimingRunner();
   const adaptive = createAdaptiveWrapper(runner, {
     minTime: 100,
     maxTime: 2000,
@@ -129,8 +127,8 @@ test("convergence detection with stable benchmark", async () => {
   expect(result.convergence?.reason).toBeDefined();
 });
-test("convergence detection with variable benchmark", async () => {
-  const runner = new BasicRunner();
+test.skip("convergence detection with variable benchmark", async () => {
+  const runner = new TimingRunner();
   const adaptive = createAdaptiveWrapper(runner, {
     minTime: 100,
     maxTime: 1000,
@@ -162,7 +160,7 @@ test("convergence detection with variable benchmark", async () => {
   expect(result.convergence?.confidence).toBeLessThanOrEqual(100);
 });
-test("checkConvergence function basics", () => {
+test.skip("checkConvergence function basics", () => {
   // Not enough samples
   const fewSamples = [1e6, 1.1e6, 1e6];
   const fewResult = checkConvergence(fewSamples);