npm - benchforge - Versions diffs - 0.1.9 → 0.2.4 - Mend

benchforge 0.1.9 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (253) hide show

package/LICENSE +20 -0
package/README.md +99 -260
package/bin/benchforge +1 -2
package/dist/AnalyzeArchive-8NCJhmhS.mjs +145 -0
package/dist/AnalyzeArchive-8NCJhmhS.mjs.map +1 -0
package/dist/BenchMatrix-BZVrBB_h.mjs +1050 -0
package/dist/BenchMatrix-BZVrBB_h.mjs.map +1 -0
package/dist/BenchRunner-DglX1NOn.d.mts +302 -0
package/dist/CoverageSampler-D5T9DRqe.mjs +27 -0
package/dist/CoverageSampler-D5T9DRqe.mjs.map +1 -0
package/dist/Formatters-BWj3d4sv.mjs +95 -0
package/dist/Formatters-BWj3d4sv.mjs.map +1 -0
package/dist/{HeapSampler-B8dtKHn1.mjs → HeapSampler-Dq-hpXem.mjs} +4 -4
package/dist/HeapSampler-Dq-hpXem.mjs.map +1 -0
package/dist/RunBenchCLI-C17DrJz8.mjs +3075 -0
package/dist/RunBenchCLI-C17DrJz8.mjs.map +1 -0
package/dist/StatisticalUtils-BD92crgM.mjs +255 -0
package/dist/StatisticalUtils-BD92crgM.mjs.map +1 -0
package/dist/TimeSampler-Ds8n7l2B.mjs +29 -0
package/dist/TimeSampler-Ds8n7l2B.mjs.map +1 -0
package/dist/ViewerServer-BJhdnxlN.mjs +639 -0
package/dist/ViewerServer-BJhdnxlN.mjs.map +1 -0
package/dist/ViewerServer-CuMNdNBz.mjs +2 -0
package/dist/bin/benchforge.mjs +4 -5
package/dist/bin/benchforge.mjs.map +1 -1
package/dist/index.d.mts +731 -522
package/dist/index.mjs +98 -3
package/dist/index.mjs.map +1 -0
package/dist/runners/WorkerScript.d.mts +12 -4
package/dist/runners/WorkerScript.mjs +92 -120
package/dist/runners/WorkerScript.mjs.map +1 -1
package/dist/viewer/assets/CIPlot-BkOvMoMa.js +1 -0
package/dist/viewer/assets/HistogramKde-CmSyUFY0.js +1 -0
package/dist/viewer/assets/LegendUtils-BJpbn_jr.js +55 -0
package/dist/viewer/assets/SampleTimeSeries-C4VBhXr3.js +1 -0
package/dist/viewer/assets/index-Br9bp_cX.js +153 -0
package/dist/viewer/assets/index-NzXXe_CC.css +1 -0
package/dist/viewer/index.html +19 -0
package/dist/viewer/speedscope/LICENSE +21 -0
package/dist/viewer/speedscope/SourceCodePro-Regular.ttf-ILST5JV6.woff2 +0 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js +2 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js.map +7 -0
package/dist/viewer/speedscope/favicon-16x16-VSI62OPJ.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-3EB2YCUY.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js +2 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js.map +7 -0
package/dist/viewer/speedscope/favicon-FOKUP5Y5.ico +0 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js +2 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js.map +7 -0
package/dist/viewer/speedscope/file-format-schema.json +274 -0
package/dist/viewer/speedscope/index.html +19 -0
package/dist/viewer/speedscope/jfrview_bg-BLJXNNQB.wasm +0 -0
package/dist/viewer/speedscope/perf-vertx-stacks-01-collapsed-all-ZNUIGAJL.txt +199 -0
package/dist/viewer/speedscope/release.txt +3 -0
package/dist/viewer/speedscope/source-code-pro.LICENSE.md +93 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css +2 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css.map +7 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js +212 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js.map +7 -0
package/package.json +52 -26
package/src/bin/benchforge.ts +2 -2
package/src/cli/AnalyzeArchive.ts +232 -0
package/src/cli/BrowserBench.ts +322 -0
package/src/cli/CliArgs.ts +164 -48
package/src/cli/CliExport.ts +179 -0
package/src/cli/CliOptions.ts +147 -0
package/src/cli/CliReport.ts +197 -0
package/src/cli/FilterBenchmarks.ts +18 -30
package/src/cli/RunBenchCLI.ts +138 -844
package/src/cli/SuiteRunner.ts +160 -0
package/src/cli/ViewerServer.ts +282 -0
package/src/export/AllocExport.ts +121 -0
package/src/export/ArchiveExport.ts +146 -0
package/src/export/ArchiveFormat.ts +50 -0
package/src/export/CoverageExport.ts +148 -0
package/src/export/EditorUri.ts +10 -0
package/src/export/PerfettoExport.ts +91 -126
package/src/export/SpeedscopeTypes.ts +98 -0
package/src/export/TimeExport.ts +115 -0
package/src/index.ts +87 -62
package/src/matrix/BenchMatrix.ts +230 -0
package/src/matrix/CaseLoader.ts +8 -6
package/src/matrix/MatrixDirRunner.ts +153 -0
package/src/matrix/MatrixFilter.ts +55 -53
package/src/matrix/MatrixInlineRunner.ts +50 -0
package/src/matrix/MatrixReport.ts +94 -254
package/src/matrix/VariantLoader.ts +9 -9
package/src/profiling/browser/BenchLoop.ts +51 -0
package/src/profiling/browser/BrowserCDP.ts +133 -0
package/src/profiling/browser/BrowserGcStats.ts +33 -0
package/src/profiling/browser/BrowserProfiler.ts +160 -0
package/src/profiling/browser/CdpClient.ts +82 -0
package/src/profiling/browser/CdpPage.ts +138 -0
package/src/profiling/browser/ChromeLauncher.ts +158 -0
package/src/profiling/browser/ChromeTraceEvent.ts +28 -0
package/src/profiling/browser/PageLoadMode.ts +61 -0
package/src/profiling/node/CoverageSampler.ts +27 -0
package/src/profiling/node/CoverageTypes.ts +23 -0
package/src/profiling/node/HeapSampleReport.ts +261 -0
package/src/{heap-sample → profiling/node}/HeapSampler.ts +55 -13
package/src/profiling/node/ResolvedProfile.ts +98 -0
package/src/profiling/node/TimeSampler.ts +57 -0
package/src/report/BenchmarkReport.ts +146 -0
package/src/report/Colors.ts +9 -0
package/src/report/Formatters.ts +110 -0
package/src/report/GcSections.ts +151 -0
package/src/{GitUtils.ts → report/GitUtils.ts} +18 -19
package/src/report/HtmlReport.ts +223 -0
package/src/report/ParseStats.ts +73 -0
package/src/report/StandardSections.ts +147 -0
package/src/report/ViewerSections.ts +286 -0
package/src/report/text/TableReport.ts +253 -0
package/src/report/text/TextReport.ts +123 -0
package/src/runners/AdaptiveWrapper.ts +167 -287
package/src/runners/BenchRunner.ts +27 -22
package/src/{Benchmark.ts → runners/BenchmarkSpec.ts} +5 -6
package/src/runners/CreateRunner.ts +5 -7
package/src/runners/GcStats.ts +58 -61
package/src/{MeasuredResults.ts → runners/MeasuredResults.ts} +43 -37
package/src/runners/MergeBatches.ts +123 -0
package/src/{NodeGC.ts → runners/NodeGC.ts} +2 -3
package/src/runners/RunnerOrchestrator.ts +180 -296
package/src/runners/RunnerUtils.ts +75 -1
package/src/runners/SampleStats.ts +100 -0
package/src/runners/TimingRunner.ts +244 -0
package/src/runners/TimingUtils.ts +3 -2
package/src/runners/WorkerScript.ts +162 -178
package/src/stats/BootstrapDifference.ts +282 -0
package/src/{PermutationTest.ts → stats/PermutationTest.ts} +31 -40
package/src/stats/StatisticalUtils.ts +445 -0
package/src/{tests → test}/AdaptiveConvergence.test.ts +10 -10
package/src/test/AdaptiveRunner.test.ts +39 -41
package/src/{tests → test}/AdaptiveSampling.test.ts +9 -9
package/src/test/AdaptiveStatistics.integration.ts +9 -41
package/src/{tests → test}/BenchMatrix.test.ts +31 -28
package/src/test/BenchmarkReport.test.ts +63 -13
package/src/test/BrowserBench.e2e.test.ts +186 -17
package/src/test/BrowserBench.test.ts +10 -5
package/src/test/BuildTimeSection.test.ts +130 -0
package/src/test/CapSamples.test.ts +82 -0
package/src/test/CoverageExport.test.ts +115 -0
package/src/test/CoverageSampler.test.ts +33 -0
package/src/test/HeapAttribution.test.ts +51 -0
package/src/{tests → test}/MatrixFilter.test.ts +16 -16
package/src/{tests → test}/MatrixReport.test.ts +1 -1
package/src/test/PermutationTest.test.ts +1 -1
package/src/{tests → test}/RealDataValidation.test.ts +6 -6
package/src/test/RunBenchCLI.test.ts +57 -56
package/src/test/RunnerOrchestrator.test.ts +12 -12
package/src/test/StatisticalUtils.test.ts +48 -12
package/src/{table-util/test → test}/TableReport.test.ts +2 -2
package/src/test/TestUtils.ts +35 -30
package/src/test/TimeExport.test.ts +139 -0
package/src/test/TimeSampler.test.ts +37 -0
package/src/test/ViewerLive.e2e.test.ts +159 -0
package/src/test/ViewerStatic.static.e2e.test.ts +137 -0
package/src/{tests → test}/fixtures/baseline/impl.ts +1 -1
package/src/{tests → test}/fixtures/bevy30-samples.ts +3 -1
package/src/test/fixtures/cases/asyncCases.ts +9 -0
package/src/{tests → test}/fixtures/cases/cases.ts +5 -2
package/src/test/fixtures/cases/variants/product.ts +2 -0
package/src/test/fixtures/cases/variants/sum.ts +2 -0
package/src/test/fixtures/discover/fast.ts +1 -0
package/src/{tests → test}/fixtures/discover/slow.ts +1 -1
package/src/test/fixtures/invalid/bad.ts +1 -0
package/src/test/fixtures/loader/fast.ts +1 -0
package/src/{tests → test}/fixtures/loader/slow.ts +1 -1
package/src/test/fixtures/loader/stateful.ts +2 -0
package/src/test/fixtures/stateful/stateful.ts +2 -0
package/src/test/fixtures/variants/extra.ts +1 -0
package/src/test/fixtures/variants/impl.ts +1 -0
package/src/test/fixtures/worker/fast.ts +1 -0
package/src/{tests → test}/fixtures/worker/slow.ts +1 -1
package/src/viewer/DateFormat.ts +30 -0
package/src/viewer/Helpers.ts +23 -0
package/src/viewer/LineData.ts +120 -0
package/src/viewer/Providers.ts +191 -0
package/src/viewer/ReportData.ts +123 -0
package/src/viewer/State.ts +49 -0
package/src/viewer/Theme.ts +15 -0
package/src/viewer/components/App.tsx +73 -0
package/src/viewer/components/DropZone.tsx +71 -0
package/src/viewer/components/LazyPlot.ts +33 -0
package/src/viewer/components/SamplesPanel.tsx +214 -0
package/src/viewer/components/Shell.tsx +26 -0
package/src/viewer/components/SourcePanel.tsx +216 -0
package/src/viewer/components/SummaryPanel.tsx +332 -0
package/src/viewer/components/TabBar.tsx +131 -0
package/src/viewer/components/TabContent.tsx +46 -0
package/src/viewer/components/ThemeToggle.tsx +50 -0
package/src/viewer/index.html +20 -0
package/src/viewer/main.tsx +4 -0
package/src/viewer/plots/CIPlot.ts +313 -0
package/src/{html/browser → viewer/plots}/HistogramKde.ts +42 -47
package/src/viewer/plots/LegendUtils.ts +134 -0
package/src/viewer/plots/PlotTypes.ts +85 -0
package/src/viewer/plots/RenderPlots.ts +230 -0
package/src/viewer/plots/SampleTimeSeries.ts +306 -0
package/src/viewer/plots/SvgHelpers.ts +136 -0
package/src/viewer/plots/TimeSeriesMarks.ts +319 -0
package/src/viewer/report.css +427 -0
package/src/viewer/shell.css +357 -0
package/src/viewer/tsconfig.json +11 -0
package/dist/BenchRunner-CSKN9zPy.d.mts +0 -225
package/dist/BrowserHeapSampler-DCeL42RE.mjs +0 -202
package/dist/BrowserHeapSampler-DCeL42RE.mjs.map +0 -1
package/dist/GcStats-ByEovUi1.mjs +0 -77
package/dist/GcStats-ByEovUi1.mjs.map +0 -1
package/dist/HeapSampler-B8dtKHn1.mjs.map +0 -1
package/dist/TimingUtils-ClclVQ7E.mjs +0 -597
package/dist/TimingUtils-ClclVQ7E.mjs.map +0 -1
package/dist/browser/index.js +0 -914
package/dist/src-Cf_LXwlp.mjs +0 -2873
package/dist/src-Cf_LXwlp.mjs.map +0 -1
package/src/BenchMatrix.ts +0 -380
package/src/BenchmarkReport.ts +0 -156
package/src/HtmlDataPrep.ts +0 -148
package/src/StandardSections.ts +0 -261
package/src/StatisticalUtils.ts +0 -176
package/src/TypeUtil.ts +0 -8
package/src/browser/BrowserGcStats.ts +0 -44
package/src/browser/BrowserHeapSampler.ts +0 -271
package/src/export/JsonExport.ts +0 -103
package/src/export/JsonFormat.ts +0 -91
package/src/heap-sample/HeapSampleReport.ts +0 -196
package/src/html/HtmlReport.ts +0 -131
package/src/html/HtmlTemplate.ts +0 -284
package/src/html/Types.ts +0 -88
package/src/html/browser/CIPlot.ts +0 -287
package/src/html/browser/LegendUtils.ts +0 -163
package/src/html/browser/RenderPlots.ts +0 -263
package/src/html/browser/SampleTimeSeries.ts +0 -389
package/src/html/browser/Types.ts +0 -96
package/src/html/browser/index.ts +0 -1
package/src/html/index.ts +0 -17
package/src/runners/BasicRunner.ts +0 -364
package/src/table-util/ConvergenceFormatters.ts +0 -19
package/src/table-util/Formatters.ts +0 -152
package/src/table-util/README.md +0 -70
package/src/table-util/TableReport.ts +0 -293
package/src/tests/fixtures/cases/asyncCases.ts +0 -7
package/src/tests/fixtures/cases/variants/product.ts +0 -2
package/src/tests/fixtures/cases/variants/sum.ts +0 -2
package/src/tests/fixtures/discover/fast.ts +0 -1
package/src/tests/fixtures/invalid/bad.ts +0 -1
package/src/tests/fixtures/loader/fast.ts +0 -1
package/src/tests/fixtures/loader/stateful.ts +0 -2
package/src/tests/fixtures/stateful/stateful.ts +0 -2
package/src/tests/fixtures/variants/extra.ts +0 -1
package/src/tests/fixtures/variants/impl.ts +0 -1
package/src/tests/fixtures/worker/fast.ts +0 -1
package/src/{table-util/test → test}/TableValueExtractor.test.ts +0 -0
package/src/{table-util/test → test}/TableValueExtractor.ts +9 -9

package/src/stats/BootstrapDifference.ts ADDED Viewed

@@ -0,0 +1,282 @@
+import type {
+  BootstrapResult,
+  CIDirection,
+  DifferenceCI,
+  HistogramBin,
+  StatKind,
+} from "./StatisticalUtils.ts";
+import {
+  average,
+  bootstrapSamples,
+  computeInterval,
+  createResample,
+  defaultConfidence,
+  isBootstrappable,
+  maxBootstrapInput,
+  maxOf,
+  minOf,
+  percentile,
+  prepareBlocks,
+  quickSelect,
+  resampleInto,
+  statKindToFn,
+  subsample,
+} from "./StatisticalUtils.ts";
/** Options shared by every difference-CI function in this module. */
type DiffOptions = {
  /** Number of bootstrap resamples to draw (falls back to `bootstrapSamples` when omitted) */
  resamples?: number;
  /** Confidence level in the range 0-1 (falls back to `defaultConfidence` when omitted) */
  confidence?: number;
  /**
   * Equivalence margin in percent. Only a positive margin has any effect: when the
   * whole CI lies inside [-margin, +margin] the result is classified "equivalent".
   */
  equivMargin?: number;
};

/** Options for blockDifferenceCI: everything in DiffOptions plus block parameters. */
export type BlockDiffOptions = DiffOptions & {
  /** Block boundaries for the second sample array (blocksA is used when omitted) */
  blocksB?: number[];
  /** Forwarded to prepareBlocks to disable Tukey trimming of outlier batches */
  noBatchTrim?: boolean;
};

/** Point estimate and CI paired with a histogram of the bootstrap samples. */
type BinnedCI = {
  estimate: number;
  ci: [number, number];
  histogram: HistogramBin[];
};

/** One statistic to evaluate on every shared resample pair. */
interface DiffOp {
  /** Position of the statistic in the caller's `stats` array */
  origIndex: number;
  /** Position in execution order, assigned after the ops are sorted */
  execIndex: number;
  /** Statistic evaluated on the resampled baseline buffer */
  computeA: (buf: number[]) => number;
  /** Statistic evaluated on the resampled current buffer */
  computeB: (buf: number[]) => number;
  /** Statistic evaluated on the original samples for the observed value */
  pointEstimate: (s: number[]) => number;
}
/**
 * Sample-level bootstrap CI for the percentage difference of a statistic
 * between baseline samples (a) and current samples (b).
 *
 * The observed percentage comes from `statFn` applied to the full inputs. The
 * bootstrap itself resamples the arrays returned by
 * `subsample(…, maxBootstrapInput)`, drawing the baseline before the current
 * side on every iteration.
 *
 * @param a baseline samples
 * @param b current samples
 * @param statFn statistic evaluated on the inputs and on every resample
 * @param options resample count, confidence level and optional equivalence margin
 * @return difference CI tagged `ciLevel: "sample"`. `subsampled` (the larger input
 *   length) is present only when `subsample` handed back a different array for
 *   either side.
 */
export function sampleDifferenceCI(
  a: number[],
  b: number[],
  statFn: (s: number[]) => number,
  options: DiffOptions = {},
): DifferenceCI {
  const {
    resamples = bootstrapSamples,
    confidence = defaultConfidence,
    equivMargin,
  } = options;
  const pctChange = (base: number, curr: number): number =>
    ((curr - base) / base) * 100;

  // Observed difference is taken from the un-capped inputs.
  const baseline = statFn(a);
  const percent = pctChange(baseline, statFn(b));

  const poolA = subsample(a, maxBootstrapInput);
  const poolB = subsample(b, maxBootstrapInput);
  // Scratch buffers are reused by every resample to avoid reallocating.
  const scratchA = new Array(poolA.length);
  const scratchB = new Array(poolB.length);
  const drawDiff = (): number => {
    resampleInto(poolA, scratchA);
    resampleInto(poolB, scratchB);
    const base = statFn(scratchA);
    return pctChange(base, statFn(scratchB));
  };
  const diffs = Array.from({ length: resamples }, drawDiff);

  const ci = computeInterval(diffs, confidence);
  // A different array reference means subsample did not return the input as-is.
  const wasCapped = poolA !== a || poolB !== b;
  const direction = classifyDirection(ci, percent, equivMargin);
  const histogram = binValues(diffs);
  return {
    percent,
    ci,
    direction,
    histogram,
    ciLevel: "sample",
    ...(wasCapped ? { subsampled: Math.max(a.length, b.length) } : {}),
  };
}
/**
 * Shared-resample difference CI: each iteration draws ONE resample pair and
 * evaluates every requested statistic on it.
 *
 * Ops run in the order produced by buildDiffOps; results are written back at
 * each op's `origIndex`, so the output lines up with `stats`.
 *
 * @param a baseline samples
 * @param b current samples
 * @param stats statistics to compare
 * @param options resample count, confidence level and optional equivalence margin
 * @return DifferenceCI[] in the same order as `stats`, each tagged `ciLevel: "sample"`.
 *   `subsampled` (the larger input length) is present only when `subsample`
 *   handed back a different array for either side.
 */
export function multiSampleDifferenceCI(
  a: number[],
  b: number[],
  stats: StatKind[],
  options: DiffOptions = {},
): DifferenceCI[] {
  const {
    resamples = bootstrapSamples,
    confidence = defaultConfidence,
    equivMargin,
  } = options;
  const pctChange = (base: number, curr: number): number =>
    ((curr - base) / base) * 100;

  const poolA = subsample(a, maxBootstrapInput);
  const poolB = subsample(b, maxBootstrapInput);
  const scratchA = new Array(poolA.length);
  const scratchB = new Array(poolB.length);
  const ops = buildDiffOps(stats, poolA.length, poolB.length);
  const diffsByOp = ops.map(() => new Array<number>(resamples));

  // Observed values come from the original (un-capped) data.
  const baseline = ops.map(op => op.pointEstimate(a));
  const current = ops.map(op => op.pointEstimate(b));
  const observed = baseline.map((base, j) => pctChange(base, current[j]));

  for (let iter = 0; iter < resamples; iter++) {
    resampleInto(poolA, scratchA);
    resampleInto(poolB, scratchB);
    for (let j = 0; j < ops.length; j++) {
      const op = ops[j];
      const base = op.computeA(scratchA);
      diffsByOp[j][iter] = pctChange(base, op.computeB(scratchB));
    }
  }

  // A different array reference means subsample did not return the input as-is.
  const cappedInfo =
    poolA !== a || poolB !== b
      ? { subsampled: Math.max(a.length, b.length) }
      : {};
  const results = new Array<DifferenceCI>(stats.length);
  ops.forEach(({ execIndex, origIndex }) => {
    const diffs = diffsByOp[execIndex];
    const percent = observed[execIndex];
    const ci = computeInterval(diffs, confidence);
    results[origIndex] = {
      percent,
      ci,
      direction: classifyDirection(ci, percent, equivMargin),
      histogram: binValues(diffs),
      ciLevel: "sample",
      ...cappedInfo,
    };
  });
  return results;
}
/**
 * Difference CIs for several statistics, choosing block or sample bootstrap
 * automatically.
 *
 * The block bootstrap is used only when BOTH offset arrays hold at least two
 * entries; otherwise all bootstrappable stats share one sample-level bootstrap.
 *
 * @param a baseline samples
 * @param aOffsets block boundaries for `a`, if known
 * @param b current samples
 * @param bOffsets block boundaries for `b`, if known
 * @param stats statistics to compare
 * @param options forwarded to the chosen bootstrap (`blocksB` is replaced by
 *   `bOffsets` on the block path)
 * @return one entry per input stat, in input order; `undefined` wherever
 *   isBootstrappable rejects the stat
 */
export function diffCIs(
  a: number[],
  aOffsets: number[] | undefined,
  b: number[],
  bOffsets: number[] | undefined,
  stats: StatKind[],
  options: BlockDiffOptions = {},
): (DifferenceCI | undefined)[] {
  const bootstrappable = stats.filter(isBootstrappable);
  if (bootstrappable.length === 0) return stats.map(() => undefined);

  let computed: DifferenceCI[];
  if (
    aOffsets != null &&
    aOffsets.length >= 2 &&
    bOffsets != null &&
    bOffsets.length >= 2
  ) {
    // Const copies keep the narrowed (defined) types inside the callback.
    const blocksA = aOffsets;
    const blocksB = bOffsets;
    computed = bootstrappable.map(stat =>
      blockDifferenceCI(a, blocksA, b, statKindToFn(stat), {
        ...options,
        blocksB,
      }),
    );
  } else {
    computed = multiSampleDifferenceCI(a, b, bootstrappable, options);
  }

  // Re-expand to the caller's order, consuming computed results sequentially.
  let cursor = 0;
  return stats.map(stat =>
    isBootstrappable(stat) ? computed[cursor++] : undefined,
  );
}
/**
 * Block bootstrap CI for the percentage difference between baseline (a) and
 * current (b).
 *
 * Each side goes through prepareBlocks (which, per its use here, trims outlier
 * batches unless `noBatchTrim` is set). The observed percentage is `statFn`
 * over each side's `filtered` samples; every bootstrap draw is the average of
 * a resample of that side's per-block values. Callers are expected to supply
 * at least two blocks per side.
 *
 * @param a baseline samples
 * @param blocksA block boundaries for `a`
 * @param b current samples
 * @param statFn statistic handed to prepareBlocks and used for the observed value
 * @param options bootstrap options; `blocksB` falls back to `blocksA`
 * @return difference CI tagged `ciLevel: "block"`, with `trimmed` holding the
 *   trim counts reported for [a, b]
 */
export function blockDifferenceCI(
  a: number[],
  blocksA: number[],
  b: number[],
  statFn: (s: number[]) => number,
  options: BlockDiffOptions = {},
): DifferenceCI {
  const {
    resamples = bootstrapSamples,
    confidence = defaultConfidence,
    equivMargin,
    noBatchTrim,
  } = options;
  const blocksB = options.blocksB ?? blocksA;
  const pctChange = (base: number, curr: number): number =>
    ((curr - base) / base) * 100;

  const baseSide = prepareBlocks(a, blocksA, statFn, noBatchTrim);
  const currSide = prepareBlocks(b, blocksB, statFn, noBatchTrim);
  const baseline = statFn(baseSide.filtered);
  const percent = pctChange(baseline, statFn(currSide.filtered));

  // Baseline is drawn before current on every iteration.
  const drawDiff = (): number => {
    const base = average(createResample(baseSide.blockVals));
    return pctChange(base, average(createResample(currSide.blockVals)));
  };
  const diffs = Array.from({ length: resamples }, drawDiff);

  const ci = computeInterval(diffs, confidence);
  const direction = classifyDirection(ci, percent, equivMargin);
  const histogram = binValues(diffs);
  return {
    percent,
    ci,
    direction,
    histogram,
    trimmed: [baseSide.trimCount, currSide.trimCount],
    ciLevel: "block",
  };
}
/**
 * Convert a BootstrapResult into its compact, plottable form.
 *
 * @param result bootstrap output carrying `estimate`, `ci` and raw `samples`
 * @return the same estimate and CI, with the samples replaced by a histogram
 */
export function binBootstrapResult(result: BootstrapResult): BinnedCI {
  return {
    estimate: result.estimate,
    ci: result.ci,
    histogram: binValues(result.samples),
  };
}
/**
 * Classify a percentage-difference CI.
 *
 * @param ci [lower, upper] bounds of the difference, in percent
 * @param observed observed percentage difference; its sign picks faster vs slower
 * @param margin optional equivalence margin in percent; ignored unless positive
 * @return "equivalent" when the whole CI lies within [-margin, +margin];
 *   otherwise "faster" or "slower" when the CI excludes zero (negative observed
 *   means faster); otherwise "uncertain"
 */
function classifyDirection(
  ci: [number, number],
  observed: number,
  margin?: number,
): CIDirection {
  const [lower, upper] = ci;
  if (margin != null && margin > 0) {
    const insideBand = lower >= -margin && upper <= margin;
    if (insideBand) return "equivalent";
  }
  // Written as a negation so NaN bounds still land on "uncertain".
  const spansZero = !(lower > 0 || upper < 0);
  if (spansZero) return "uncertain";
  return observed < 0 ? "faster" : "slower";
}
/**
 * Bin values into equal-width histogram buckets for compact visualization.
 *
 * Non-finite entries (NaN, ±Infinity) are skipped: they cannot be placed in a
 * bin and would otherwise poison the min/max range. They can occur because
 * callers divide by a baseline statistic that may be zero.
 *
 * @param values numbers to bin (not modified)
 * @param binCount requested number of bins (default 30); fractions are
 *   truncated and anything below 1 is treated as 1
 * @return one `{ x, count }` per bin, with `x` at the bin centre; a single bin
 *   when every finite value is identical; an empty array when there are no
 *   finite values
 */
function binValues(values: number[], binCount = 30): HistogramBin[] {
  let min = Infinity;
  let max = -Infinity;
  let finiteCount = 0;
  for (const v of values) {
    if (!Number.isFinite(v)) continue;
    finiteCount++;
    if (v < min) min = v;
    if (v > max) max = v;
  }
  if (finiteCount === 0) return [];
  if (min === max) return [{ x: min, count: finiteCount }];

  const bins = Math.max(1, Math.floor(binCount));
  const step = (max - min) / bins;
  const counts = new Array<number>(bins).fill(0);
  for (const v of values) {
    if (!Number.isFinite(v)) continue;
    // The maximum lands exactly on the upper edge; clamp it into the last bin.
    const bin = Math.min(Math.floor((v - min) / step), bins - 1);
    counts[bin]++;
  }
  return counts.map((count, i) => ({ x: min + (i + 0.5) * step, count }));
}
/**
 * Build the per-statistic operations in execution order.
 *
 * mean, min and max are scheduled first, in that order (the original note
 * marks them as non-destructive); percentile ops follow in ascending
 * percentile order. Each side gets its own quickSelect rank because the two
 * sample sizes may differ.
 *
 * @param stats statistics requested by the caller
 * @param nA length of the baseline resample buffer
 * @param nB length of the current resample buffer
 * @return ops sorted into execution order, with `execIndex` equal to the array
 *   position and `origIndex` pointing back into `stats`
 */
function buildDiffOps(stats: StatKind[], nA: number, nB: number): DiffOp[] {
  // Negative sort keys place the fixed stats ahead of every percentile.
  const fixedStat = (
    rank: number,
    origIndex: number,
    fn: (s: number[]) => number,
  ) => ({
    order: rank,
    origIndex,
    execIndex: 0,
    computeA: fn,
    computeB: fn,
    pointEstimate: fn,
  });
  // Zero-based rank of percentile p within n samples, clamped at the first element.
  const rankOf = (n: number, p: number): number =>
    Math.max(0, Math.ceil(n * p) - 1);

  const pending = stats.map((stat, origIndex) => {
    switch (stat) {
      case "mean":
        return fixedStat(-3, origIndex, average);
      case "min":
        return fixedStat(-2, origIndex, minOf);
      case "max":
        return fixedStat(-1, origIndex, maxOf);
    }
    const p = stat.percentile;
    const rankA = rankOf(nA, p);
    const rankB = rankOf(nB, p);
    return {
      order: p,
      origIndex,
      execIndex: 0,
      computeA: (buf: number[]) => quickSelect(buf, rankA),
      computeB: (buf: number[]) => quickSelect(buf, rankB),
      pointEstimate: (v: number[]) => percentile(v, p),
    };
  });

  pending.sort((left, right) => left.order - right.order);
  pending.forEach((entry, position) => {
    entry.execIndex = position;
  });
  return pending;
}

package/src/{PermutationTest.ts → stats/PermutationTest.ts} RENAMED Viewed

@@ -1,19 +1,10 @@
 /**
  * Permutation-based hypothesis testing for benchmark comparisons.
- *
- * Currently unused - the main reporting pipeline uses bootstrapDifferenceCI()
- * from StatisticalUtils.ts instead, which provides confidence intervals on
- * the difference rather than p-values.
- *
- * Kept for potential future use cases where p-values are needed.
+ * Currently unused -- the reporting pipeline uses blockDifferenceCI() instead,
+ * which provides confidence intervals rather than p-values.
  */
-import { average, percentile } from "./StatisticalUtils.ts";
-const significanceThreshold = 0.05;
-const strongSignificance = 0.001;
-const goodSignificance = 0.01;
-const defaultBootstrapSamples = 10000;
+import { average, bootstrapSamples, median } from "./StatisticalUtils.ts";
 /** Statistical comparison between baseline and current benchmark samples */
 export interface ComparisonResult {
@@ -39,17 +30,20 @@ export interface ComparisonResult {
   };
 }
+const significanceThreshold = 0.05;
+const strongSignificance = 0.001;
+const goodSignificance = 0.01;
 /** @return statistical comparison between baseline and current samples */
 export function compareWithBaseline(
   baseline: number[],
   current: number[],
 ): ComparisonResult {
-  const baselineMedian = percentile(baseline, 0.5);
-  const currentMedian = percentile(current, 0.5);
+  const baselineMedian = median(baseline);
+  const currentMedian = median(current);
   const baselineMean = average(baseline);
   const currentMean = average(current);
-  const median = (s: number[]) => percentile(s, 0.5);
   const medianPValue = bootstrapDifferenceTest(baseline, current, median);
   const meanPValue = bootstrapDifferenceTest(baseline, current, average);
@@ -63,25 +57,6 @@ export function compareWithBaseline(
   };
 }
-/** @return change statistics for a current vs baseline comparison */
-function changeStats(current: number, base: number, pValue: number) {
-  return {
-    absolute: current - base,
-    percent: ((current - base) / base) * 100,
-    pValue,
-    significant: pValue < significanceThreshold,
-    significance: getSignificance(pValue),
-  };
-}
-/** @return significance level based on p-value thresholds */
-function getSignificance(pValue: number): "strong" | "good" | "weak" | "none" {
-  if (pValue < strongSignificance) return "strong";
-  if (pValue < goodSignificance) return "good";
-  if (pValue < significanceThreshold) return "weak";
-  return "none";
-}
 /** @return p-value from permutation test for difference in statistics */
 function bootstrapDifferenceTest(
   sample1: number[],
@@ -93,12 +68,23 @@ function bootstrapDifferenceTest(
   const n1 = sample1.length;
   let moreExtreme = 0;
-  for (let i = 0; i < defaultBootstrapSamples; i++) {
+  for (let i = 0; i < bootstrapSamples; i++) {
     const { resample1, resample2 } = shuffleAndSplit(combined, n1);
     const diff = statistic(resample2) - statistic(resample1);
     if (Math.abs(diff) >= Math.abs(observedDiff)) moreExtreme++;
   }
-  return moreExtreme / defaultBootstrapSamples;
+  return moreExtreme / bootstrapSamples;
+}
+/** @return change statistics for a current vs baseline comparison */
+function changeStats(current: number, base: number, pValue: number) {
+  return {
+    absolute: current - base,
+    percent: ((current - base) / base) * 100,
+    pValue,
+    significant: pValue < significanceThreshold,
+    significance: getSignificance(pValue),
+  };
 }
 /** @return randomly shuffled samples split at n1 (Fisher-Yates shuffle) */
@@ -108,8 +94,13 @@ function shuffleAndSplit(combined: number[], n1: number) {
     const j = Math.floor(Math.random() * (i + 1));
     [shuffled[i], shuffled[j]] = [shuffled[j], shuffled[i]];
   }
-  return {
-    resample1: shuffled.slice(0, n1),
-    resample2: shuffled.slice(n1),
-  };
+  return { resample1: shuffled.slice(0, n1), resample2: shuffled.slice(n1) };
+}
+/** @return significance level based on p-value thresholds */
+function getSignificance(pValue: number): "strong" | "good" | "weak" | "none" {
+  if (pValue < strongSignificance) return "strong";
+  if (pValue < goodSignificance) return "good";
+  if (pValue < significanceThreshold) return "weak";
+  return "none";
 }