npm - benchforge - Versions diffs - 0.1.11 → 0.2.4 - Mend

benchforge 0.1.11 → 0.2.4

This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (253)

package/LICENSE +20 -0
package/README.md +99 -294
package/bin/benchforge +1 -2
package/dist/AnalyzeArchive-8NCJhmhS.mjs +145 -0
package/dist/AnalyzeArchive-8NCJhmhS.mjs.map +1 -0
package/dist/BenchMatrix-BZVrBB_h.mjs +1050 -0
package/dist/BenchMatrix-BZVrBB_h.mjs.map +1 -0
package/dist/{BenchRunner-BzyUfiyB.d.mts → BenchRunner-DglX1NOn.d.mts} +119 -66
package/dist/CoverageSampler-D5T9DRqe.mjs +27 -0
package/dist/CoverageSampler-D5T9DRqe.mjs.map +1 -0
package/dist/Formatters-BWj3d4sv.mjs +95 -0
package/dist/Formatters-BWj3d4sv.mjs.map +1 -0
package/dist/{HeapSampler-B8dtKHn1.mjs → HeapSampler-Dq-hpXem.mjs} +4 -4
package/dist/HeapSampler-Dq-hpXem.mjs.map +1 -0
package/dist/RunBenchCLI-C17DrJz8.mjs +3075 -0
package/dist/RunBenchCLI-C17DrJz8.mjs.map +1 -0
package/dist/StatisticalUtils-BD92crgM.mjs +255 -0
package/dist/StatisticalUtils-BD92crgM.mjs.map +1 -0
package/dist/TimeSampler-Ds8n7l2B.mjs +29 -0
package/dist/TimeSampler-Ds8n7l2B.mjs.map +1 -0
package/dist/ViewerServer-BJhdnxlN.mjs +639 -0
package/dist/ViewerServer-BJhdnxlN.mjs.map +1 -0
package/dist/ViewerServer-CuMNdNBz.mjs +2 -0
package/dist/bin/benchforge.mjs +4 -5
package/dist/bin/benchforge.mjs.map +1 -1
package/dist/index.d.mts +711 -558
package/dist/index.mjs +98 -3
package/dist/index.mjs.map +1 -0
package/dist/runners/WorkerScript.d.mts +12 -4
package/dist/runners/WorkerScript.mjs +77 -105
package/dist/runners/WorkerScript.mjs.map +1 -1
package/dist/viewer/assets/CIPlot-BkOvMoMa.js +1 -0
package/dist/viewer/assets/HistogramKde-CmSyUFY0.js +1 -0
package/dist/viewer/assets/LegendUtils-BJpbn_jr.js +55 -0
package/dist/viewer/assets/SampleTimeSeries-C4VBhXr3.js +1 -0
package/dist/viewer/assets/index-Br9bp_cX.js +153 -0
package/dist/viewer/assets/index-NzXXe_CC.css +1 -0
package/dist/viewer/index.html +19 -0
package/dist/viewer/speedscope/LICENSE +21 -0
package/dist/viewer/speedscope/SourceCodePro-Regular.ttf-ILST5JV6.woff2 +0 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js +2 -0
package/dist/viewer/speedscope/favicon-16x16-V2DMIAZS.js.map +7 -0
package/dist/viewer/speedscope/favicon-16x16-VSI62OPJ.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-3EB2YCUY.png +0 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js +2 -0
package/dist/viewer/speedscope/favicon-32x32-THY3JDJL.js.map +7 -0
package/dist/viewer/speedscope/favicon-FOKUP5Y5.ico +0 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js +2 -0
package/dist/viewer/speedscope/favicon-M34RF7BI.js.map +7 -0
package/dist/viewer/speedscope/file-format-schema.json +274 -0
package/dist/viewer/speedscope/index.html +19 -0
package/dist/viewer/speedscope/jfrview_bg-BLJXNNQB.wasm +0 -0
package/dist/viewer/speedscope/perf-vertx-stacks-01-collapsed-all-ZNUIGAJL.txt +199 -0
package/dist/viewer/speedscope/release.txt +3 -0
package/dist/viewer/speedscope/source-code-pro.LICENSE.md +93 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css +2 -0
package/dist/viewer/speedscope/speedscope-GHPHNKXC.css.map +7 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js +212 -0
package/dist/viewer/speedscope/speedscope-QZFMJ7VP.js.map +7 -0
package/package.json +52 -27
package/src/bin/benchforge.ts +2 -2
package/src/cli/AnalyzeArchive.ts +232 -0
package/src/cli/BrowserBench.ts +322 -0
package/src/cli/CliArgs.ts +164 -51
package/src/cli/CliExport.ts +179 -0
package/src/cli/CliOptions.ts +147 -0
package/src/cli/CliReport.ts +197 -0
package/src/cli/FilterBenchmarks.ts +18 -30
package/src/cli/RunBenchCLI.ts +132 -866
package/src/cli/SuiteRunner.ts +160 -0
package/src/cli/ViewerServer.ts +282 -0
package/src/export/AllocExport.ts +121 -0
package/src/export/ArchiveExport.ts +146 -0
package/src/export/ArchiveFormat.ts +50 -0
package/src/export/CoverageExport.ts +148 -0
package/src/export/EditorUri.ts +10 -0
package/src/export/PerfettoExport.ts +64 -99
package/src/export/SpeedscopeTypes.ts +98 -0
package/src/export/TimeExport.ts +115 -0
package/src/index.ts +86 -67
package/src/matrix/BenchMatrix.ts +230 -0
package/src/matrix/CaseLoader.ts +8 -6
package/src/matrix/MatrixDirRunner.ts +153 -0
package/src/matrix/MatrixFilter.ts +49 -47
package/src/matrix/MatrixInlineRunner.ts +50 -0
package/src/matrix/MatrixReport.ts +90 -250
package/src/matrix/VariantLoader.ts +5 -5
package/src/profiling/browser/BenchLoop.ts +51 -0
package/src/profiling/browser/BrowserCDP.ts +133 -0
package/src/profiling/browser/BrowserGcStats.ts +33 -0
package/src/profiling/browser/BrowserProfiler.ts +160 -0
package/src/profiling/browser/CdpClient.ts +82 -0
package/src/profiling/browser/CdpPage.ts +138 -0
package/src/profiling/browser/ChromeLauncher.ts +158 -0
package/src/profiling/browser/ChromeTraceEvent.ts +28 -0
package/src/profiling/browser/PageLoadMode.ts +61 -0
package/src/profiling/node/CoverageSampler.ts +27 -0
package/src/profiling/node/CoverageTypes.ts +23 -0
package/src/profiling/node/HeapSampleReport.ts +261 -0
package/src/{heap-sample → profiling/node}/HeapSampler.ts +1 -2
package/src/{heap-sample → profiling/node}/ResolvedProfile.ts +18 -9
package/src/profiling/node/TimeSampler.ts +57 -0
package/src/report/BenchmarkReport.ts +146 -0
package/src/report/Colors.ts +9 -0
package/src/report/Formatters.ts +110 -0
package/src/report/GcSections.ts +151 -0
package/src/{GitUtils.ts → report/GitUtils.ts} +18 -19
package/src/report/HtmlReport.ts +223 -0
package/src/report/ParseStats.ts +73 -0
package/src/report/StandardSections.ts +147 -0
package/src/report/ViewerSections.ts +286 -0
package/src/report/text/TableReport.ts +253 -0
package/src/report/text/TextReport.ts +123 -0
package/src/runners/AdaptiveWrapper.ts +116 -236
package/src/runners/BenchRunner.ts +20 -15
package/src/{Benchmark.ts → runners/BenchmarkSpec.ts} +5 -6
package/src/runners/CreateRunner.ts +5 -7
package/src/runners/GcStats.ts +47 -50
package/src/{MeasuredResults.ts → runners/MeasuredResults.ts} +43 -37
package/src/runners/MergeBatches.ts +123 -0
package/src/{NodeGC.ts → runners/NodeGC.ts} +2 -3
package/src/runners/RunnerOrchestrator.ts +127 -243
package/src/runners/RunnerUtils.ts +75 -1
package/src/runners/SampleStats.ts +100 -0
package/src/runners/TimingRunner.ts +244 -0
package/src/runners/TimingUtils.ts +3 -2
package/src/runners/WorkerScript.ts +135 -151
package/src/stats/BootstrapDifference.ts +282 -0
package/src/{PermutationTest.ts → stats/PermutationTest.ts} +8 -17
package/src/stats/StatisticalUtils.ts +445 -0
package/src/{tests → test}/AdaptiveConvergence.test.ts +10 -10
package/src/test/AdaptiveRunner.test.ts +39 -41
package/src/{tests → test}/AdaptiveSampling.test.ts +9 -9
package/src/test/AdaptiveStatistics.integration.ts +2 -2
package/src/{tests → test}/BenchMatrix.test.ts +19 -16
package/src/test/BenchmarkReport.test.ts +63 -13
package/src/test/BrowserBench.e2e.test.ts +186 -17
package/src/test/BrowserBench.test.ts +10 -5
package/src/test/BuildTimeSection.test.ts +130 -0
package/src/test/CapSamples.test.ts +82 -0
package/src/test/CoverageExport.test.ts +115 -0
package/src/test/CoverageSampler.test.ts +33 -0
package/src/test/HeapAttribution.test.ts +14 -14
package/src/{tests → test}/MatrixFilter.test.ts +1 -1
package/src/{tests → test}/MatrixReport.test.ts +1 -1
package/src/test/PermutationTest.test.ts +1 -1
package/src/{tests → test}/RealDataValidation.test.ts +6 -6
package/src/test/RunBenchCLI.test.ts +39 -38
package/src/test/RunnerOrchestrator.test.ts +12 -12
package/src/test/StatisticalUtils.test.ts +48 -12
package/src/{table-util/test → test}/TableReport.test.ts +2 -2
package/src/test/TestUtils.ts +12 -7
package/src/test/TimeExport.test.ts +139 -0
package/src/test/TimeSampler.test.ts +37 -0
package/src/test/ViewerLive.e2e.test.ts +159 -0
package/src/test/ViewerStatic.static.e2e.test.ts +137 -0
package/src/{tests → test}/fixtures/baseline/impl.ts +1 -1
package/src/{tests → test}/fixtures/bevy30-samples.ts +3 -1
package/src/test/fixtures/cases/asyncCases.ts +9 -0
package/src/{tests → test}/fixtures/cases/cases.ts +5 -2
package/src/test/fixtures/cases/variants/product.ts +2 -0
package/src/test/fixtures/cases/variants/sum.ts +2 -0
package/src/test/fixtures/discover/fast.ts +1 -0
package/src/{tests → test}/fixtures/discover/slow.ts +1 -1
package/src/test/fixtures/invalid/bad.ts +1 -0
package/src/test/fixtures/loader/fast.ts +1 -0
package/src/{tests → test}/fixtures/loader/slow.ts +1 -1
package/src/test/fixtures/loader/stateful.ts +2 -0
package/src/test/fixtures/stateful/stateful.ts +2 -0
package/src/test/fixtures/variants/extra.ts +1 -0
package/src/test/fixtures/variants/impl.ts +1 -0
package/src/test/fixtures/worker/fast.ts +1 -0
package/src/{tests → test}/fixtures/worker/slow.ts +1 -1
package/src/viewer/DateFormat.ts +30 -0
package/src/viewer/Helpers.ts +23 -0
package/src/viewer/LineData.ts +120 -0
package/src/viewer/Providers.ts +191 -0
package/src/viewer/ReportData.ts +123 -0
package/src/viewer/State.ts +49 -0
package/src/viewer/Theme.ts +15 -0
package/src/viewer/components/App.tsx +73 -0
package/src/viewer/components/DropZone.tsx +71 -0
package/src/viewer/components/LazyPlot.ts +33 -0
package/src/viewer/components/SamplesPanel.tsx +214 -0
package/src/viewer/components/Shell.tsx +26 -0
package/src/viewer/components/SourcePanel.tsx +216 -0
package/src/viewer/components/SummaryPanel.tsx +332 -0
package/src/viewer/components/TabBar.tsx +131 -0
package/src/viewer/components/TabContent.tsx +46 -0
package/src/viewer/components/ThemeToggle.tsx +50 -0
package/src/viewer/index.html +20 -0
package/src/viewer/main.tsx +4 -0
package/src/viewer/plots/CIPlot.ts +313 -0
package/src/{html/browser → viewer/plots}/HistogramKde.ts +33 -38
package/src/viewer/plots/LegendUtils.ts +134 -0
package/src/viewer/plots/PlotTypes.ts +85 -0
package/src/viewer/plots/RenderPlots.ts +230 -0
package/src/viewer/plots/SampleTimeSeries.ts +306 -0
package/src/viewer/plots/SvgHelpers.ts +136 -0
package/src/viewer/plots/TimeSeriesMarks.ts +319 -0
package/src/viewer/report.css +427 -0
package/src/viewer/shell.css +357 -0
package/src/viewer/tsconfig.json +11 -0
package/dist/BrowserHeapSampler-B6asLKWQ.mjs +0 -202
package/dist/BrowserHeapSampler-B6asLKWQ.mjs.map +0 -1
package/dist/GcStats-wX7Xyblu.mjs +0 -77
package/dist/GcStats-wX7Xyblu.mjs.map +0 -1
package/dist/HeapSampler-B8dtKHn1.mjs.map +0 -1
package/dist/TimingUtils-DwOwkc8G.mjs +0 -597
package/dist/TimingUtils-DwOwkc8G.mjs.map +0 -1
package/dist/browser/index.js +0 -914
package/dist/src-B-DDaCa9.mjs +0 -3108
package/dist/src-B-DDaCa9.mjs.map +0 -1
package/src/BenchMatrix.ts +0 -380
package/src/BenchmarkReport.ts +0 -161
package/src/HtmlDataPrep.ts +0 -148
package/src/StandardSections.ts +0 -261
package/src/StatisticalUtils.ts +0 -175
package/src/TypeUtil.ts +0 -8
package/src/browser/BrowserGcStats.ts +0 -44
package/src/browser/BrowserHeapSampler.ts +0 -271
package/src/export/JsonExport.ts +0 -103
package/src/export/JsonFormat.ts +0 -91
package/src/export/SpeedscopeExport.ts +0 -202
package/src/heap-sample/HeapSampleReport.ts +0 -269
package/src/html/HtmlReport.ts +0 -131
package/src/html/HtmlTemplate.ts +0 -284
package/src/html/Types.ts +0 -88
package/src/html/browser/CIPlot.ts +0 -287
package/src/html/browser/LegendUtils.ts +0 -163
package/src/html/browser/RenderPlots.ts +0 -263
package/src/html/browser/SampleTimeSeries.ts +0 -389
package/src/html/browser/Types.ts +0 -96
package/src/html/browser/index.ts +0 -1
package/src/html/index.ts +0 -17
package/src/runners/BasicRunner.ts +0 -364
package/src/table-util/ConvergenceFormatters.ts +0 -19
package/src/table-util/Formatters.ts +0 -157
package/src/table-util/README.md +0 -70
package/src/table-util/TableReport.ts +0 -293
package/src/tests/fixtures/cases/asyncCases.ts +0 -7
package/src/tests/fixtures/cases/variants/product.ts +0 -2
package/src/tests/fixtures/cases/variants/sum.ts +0 -2
package/src/tests/fixtures/discover/fast.ts +0 -1
package/src/tests/fixtures/invalid/bad.ts +0 -1
package/src/tests/fixtures/loader/fast.ts +0 -1
package/src/tests/fixtures/loader/stateful.ts +0 -2
package/src/tests/fixtures/stateful/stateful.ts +0 -2
package/src/tests/fixtures/variants/extra.ts +0 -1
package/src/tests/fixtures/variants/impl.ts +0 -1
package/src/tests/fixtures/worker/fast.ts +0 -1
package/src/{table-util/test → test}/TableValueExtractor.test.ts +0 -0
package/src/{table-util/test → test}/TableValueExtractor.ts +0 -0

package/src/test/BuildTimeSection.test.ts ADDED Viewed

@@ -0,0 +1,130 @@
+import { expect, test } from "vitest";
+import type { BenchmarkReport } from "../report/BenchmarkReport.ts";
+import { computeColumnValues } from "../report/BenchmarkReport.ts";
+import { buildTimeSection } from "../report/StandardSections.ts";
+import { reportResults, valuesForReports } from "../report/text/TextReport.ts";
+import type { MeasuredResults } from "../runners/MeasuredResults.ts";
+/** @return minimal MeasuredResults with the given samples (time fields derived trivially). */
+function measured(samples: number[]): MeasuredResults {
+  const sorted = [...samples].sort((a, b) => a - b);
+  return {
+    name: "t",
+    samples,
+    time: {
+      min: sorted[0],
+      max: sorted[sorted.length - 1],
+      avg: samples.reduce((a, b) => a + b, 0) / samples.length,
+      p50: sorted[Math.floor(sorted.length * 0.5)],
+      p75: sorted[Math.floor(sorted.length * 0.75)],
+      p99: sorted[Math.floor(sorted.length * 0.99)],
+      p999: sorted[Math.floor(sorted.length * 0.999)],
+    },
+  };
+}
+function report(name: string, samples: number[]): BenchmarkReport {
+  return { name, measuredResults: measured(samples) };
+}
+function range(n: number): number[] {
+  return Array.from({ length: n }, (_, i) => i + 1);
+}
+test("default buildTimeSection produces mean, p50, p99 columns", () => {
+  const section = buildTimeSection();
+  expect(section.columns.map(c => c.key ?? c.title)).toEqual([
+    "mean",
+    "p50",
+    "p99",
+  ]);
+});
+test("computeColumnValues computes values from samples", () => {
+  const section = buildTimeSection("mean,p50,max,min");
+  const row = computeColumnValues(section, measured([10, 20, 30, 40, 50]));
+  expect(row.mean).toBe(30);
+  expect(row.min).toBe(10);
+  expect(row.max).toBe(50);
+  expect(row.p50).toBeGreaterThanOrEqual(20);
+  expect(row.p50).toBeLessThanOrEqual(40);
+});
+test("p70 returns value near 70th percentile of [1..100]", () => {
+  const section = buildTimeSection("p70");
+  const row = computeColumnValues(section, measured(range(100)));
+  expect(row.p70).toBeGreaterThanOrEqual(69);
+  expect(row.p70).toBeLessThanOrEqual(71);
+});
+test("p999 uses divide-by-1000 convention", () => {
+  const section = buildTimeSection("p999");
+  const row = computeColumnValues(section, measured(range(1000)));
+  expect(row.p999).toBeGreaterThanOrEqual(999);
+});
+test("p9999 uses divide-by-10000 convention", () => {
+  const section = buildTimeSection("p9999");
+  const row = computeColumnValues(section, measured(range(10000)));
+  expect(row.p9999).toBeGreaterThanOrEqual(9999);
+});
+test("median and p50 produce the same value", () => {
+  const a = computeColumnValues(
+    buildTimeSection("median"),
+    measured(range(100)),
+  );
+  const b = computeColumnValues(buildTimeSection("p50"), measured(range(100)));
+  expect(a.p50).toBe(b.p50);
+});
+test("mean and avg dedupe to a single column", () => {
+  const section = buildTimeSection("mean,avg");
+  expect(section.columns.length).toBe(1);
+});
+test("min and max return exact values", () => {
+  const section = buildTimeSection("min,max");
+  const row = computeColumnValues(section, measured([5, 1, 9, 3, 7]));
+  expect(row.min).toBe(1);
+  expect(row.max).toBe(9);
+});
+test("empty stats string throws", () => {
+  expect(() => buildTimeSection("")).toThrow(/at least one column/);
+  expect(() => buildTimeSection("  ,  ")).toThrow(/at least one column/);
+});
+test("unknown token throws with vocabulary hint", () => {
+  expect(() => buildTimeSection("wat")).toThrow(
+    /expected mean, median, min, max, or p<N>/,
+  );
+});
+test("single-digit percentile token is rejected", () => {
+  expect(() => buildTimeSection("p5")).toThrow(/at least 2 digits/);
+});
+test("3+ digit percentile tokens not starting with 9 are rejected", () => {
+  expect(() => buildTimeSection("p100")).toThrow(/must start with 9/);
+  expect(() => buildTimeSection("p500")).toThrow(/must start with 9/);
+  expect(() => buildTimeSection("p1000")).toThrow(/must start with 9/);
+});
+test("reportResults renders user-chosen columns as table headers", () => {
+  const groups = [{ name: "g", reports: [report("bench", range(100))] }];
+  const table = reportResults(groups, [buildTimeSection("p70,p95")]);
+  expect(table).toContain("p70");
+  expect(table).toContain("p95");
+});
+test("valuesForReports extracts user-chosen keys", () => {
+  const rows = valuesForReports(
+    [report("bench", range(100))],
+    [buildTimeSection("p70,p95")],
+  );
+  expect(rows[0].p70).toBeGreaterThanOrEqual(69);
+  expect(rows[0].p70).toBeLessThanOrEqual(71);
+  expect(rows[0].p95).toBeGreaterThanOrEqual(94);
+  expect(rows[0].p95).toBeLessThanOrEqual(96);
+});

package/src/test/CapSamples.test.ts ADDED Viewed

@@ -0,0 +1,82 @@
+import { expect, test } from "vitest";
+import { sampleDifferenceCI } from "../stats/BootstrapDifference.ts";
+import {
+  average,
+  maxBootstrapInput,
+  percentile,
+  sampleBootstrap,
+} from "../stats/StatisticalUtils.ts";
+test("sampleBootstrap uses full samples for point estimate", () => {
+  const samples = Array.from({ length: 5000 }, (_, i) => i);
+  const result = sampleBootstrap(samples, average, { resamples: 100 });
+  expect(result.estimate).toBe(average(samples));
+});
+test("sampleDifferenceCI preserves point estimate", () => {
+  const a = Array.from({ length: 5000 }, () => 50 + Math.random() * 10);
+  const b = a.map(v => v * 1.1);
+  const result = sampleDifferenceCI(a, b, average, { resamples: 100 });
+  const expected = ((average(b) - average(a)) / average(a)) * 100;
+  expect(result.percent).toBeCloseTo(expected, 10);
+});
+test("sampleBootstrap point estimate uses full array when capped", () => {
+  const n = maxBootstrapInput + 5000;
+  const samples = Array.from({ length: n }, (_, i) => i);
+  const result = sampleBootstrap(samples, average, { resamples: 50 });
+  expect(result.estimate).toBe(average(samples));
+  expect(result.subsampled).toBe(n);
+});
+test("sampleBootstrap does not set subsampled when under cap", () => {
+  const samples = Array.from({ length: 100 }, (_, i) => i);
+  const result = sampleBootstrap(samples, average, { resamples: 50 });
+  expect(result.subsampled).toBeUndefined();
+});
+test("sampleDifferenceCI sets subsampled when inputs exceed cap", () => {
+  const n = maxBootstrapInput + 1000;
+  const a = Array.from({ length: n }, () => 50 + Math.random() * 10);
+  const b = a.map(v => v * 1.1);
+  const result = sampleDifferenceCI(a, b, average, { resamples: 50 });
+  expect(result.percent).toBeCloseTo(10, 0);
+  expect(result.subsampled).toBe(n);
+});
+test("sampleDifferenceCI no subsampled flag when under cap", () => {
+  const a = Array.from({ length: 100 }, () => 50 + Math.random() * 10);
+  const b = a.map(v => v * 1.1);
+  const result = sampleDifferenceCI(a, b, average, { resamples: 50 });
+  expect(result.subsampled).toBeUndefined();
+});
+test("quickselect-based percentile matches sorted percentile", () => {
+  const data = Array.from({ length: 1000 }, () => Math.random() * 100);
+  const sorted = [...data].sort((a, b) => a - b);
+  for (const p of [0.25, 0.5, 0.75, 0.99]) {
+    const k = Math.max(0, Math.ceil(sorted.length * p) - 1);
+    expect(percentile(data, p)).toBe(sorted[k]);
+  }
+});
+test("quickselect handles small arrays", () => {
+  expect(percentile([42], 0.5)).toBe(42);
+  expect(percentile([1, 2], 0.5)).toBe(1);
+  expect(percentile([1, 2], 1.0)).toBe(2);
+});
+test("quickselect handles duplicate values", () => {
+  const data = [5, 5, 5, 5, 5, 10, 10, 10, 10, 10];
+  expect(percentile(data, 0.5)).toBe(5);
+  expect(percentile(data, 0.99)).toBe(10);
+});
+test("sampleBootstrap reuses buffer (no per-iteration allocation)", () => {
+  const samples = [10, 20, 30, 40, 50];
+  const result = sampleBootstrap(samples, average, { resamples: 50 });
+  expect(result.estimate).toBe(average(samples));
+  expect(result.samples).toHaveLength(50);
+  expect(result.ci[0]).toBeLessThanOrEqual(result.estimate);
+  expect(result.ci[1]).toBeGreaterThanOrEqual(result.estimate);
+});

package/src/test/CoverageExport.test.ts ADDED Viewed

@@ -0,0 +1,115 @@
+import { expect, test } from "vitest";
+import {
+  annotateFramesWithCounts,
+  buildCoverageMap,
+} from "../export/CoverageExport.ts";
+import type { CoverageData } from "../profiling/node/CoverageTypes.ts";
+const source = `function foo() {
+  return 1;
+}
+function bar() {
+  return 2;
+}
+const baz = () => 3;
+`;
+const coverage: CoverageData = {
+  scripts: [
+    {
+      url: "file:///test.js",
+      functions: [
+        {
+          functionName: "foo",
+          ranges: [{ startOffset: 0, endOffset: 30, count: 10 }],
+        },
+        {
+          functionName: "bar",
+          ranges: [{ startOffset: 31, endOffset: 60, count: 5 }],
+        },
+        {
+          functionName: "",
+          ranges: [{ startOffset: 61, endOffset: 80, count: 3 }],
+        },
+      ],
+    },
+  ],
+};
+test("buildCoverageMap resolves offsets to lines", () => {
+  const result = buildCoverageMap(coverage, { "file:///test.js": source });
+  expect(result.map.has("file:///test.js")).toBe(true);
+  const entries = result.map.get("file:///test.js")!;
+  expect(entries).toHaveLength(3);
+  const foo = entries.find(e => e.functionName === "foo");
+  expect(foo).toBeDefined();
+  expect(foo!.startLine).toBe(1);
+  expect(foo!.count).toBe(10);
+  const bar = entries.find(e => e.functionName === "bar");
+  expect(bar).toBeDefined();
+  expect(bar!.startLine).toBe(4);
+  expect(bar!.count).toBe(5);
+  // byName aggregates across all scripts
+  expect(result.byName.get("foo")).toBe(10);
+  expect(result.byName.get("bar")).toBe(5);
+});
+test("annotateFramesWithCounts appends [N] to matched frames", () => {
+  const result = buildCoverageMap(coverage, { "file:///test.js": source });
+  const frames = [
+    { name: "foo", file: "file:///test.js", line: 1 },
+    { name: "bar", file: "file:///test.js", line: 4 },
+    { name: "unmatched", file: "file:///other.js", line: 1 },
+  ];
+  annotateFramesWithCounts(frames, result);
+  expect(frames[0].name).toBe("foo [10]");
+  expect(frames[1].name).toBe("bar [5]");
+  expect(frames[2].name).toBe("unmatched"); // no coverage data for this file
+});
+test("annotateFramesWithCounts falls back to name-only for frames without file", () => {
+  const result = buildCoverageMap(coverage, { "file:///test.js": source });
+  const frames = [
+    { name: "foo" }, // no file — should match by name
+    { name: "bar" },
+    { name: "(anonymous)" }, // anonymous — should not match by name
+  ];
+  annotateFramesWithCounts(frames, result);
+  expect(frames[0].name).toBe("foo [10]");
+  expect(frames[1].name).toBe("bar [5]");
+  expect(frames[2].name).toBe("(anonymous)");
+});
+test("annotateFramesWithCounts formats large counts", () => {
+  const bigCoverage: CoverageData = {
+    scripts: [
+      {
+        url: "file:///big.js",
+        functions: [
+          {
+            functionName: "hot",
+            ranges: [{ startOffset: 0, endOffset: 10, count: 1_500_000 }],
+          },
+        ],
+      },
+    ],
+  };
+  const result = buildCoverageMap(bigCoverage, {
+    "file:///big.js": "function hot() {}",
+  });
+  const frames = [{ name: "hot", file: "file:///big.js", line: 1 }];
+  annotateFramesWithCounts(frames, result);
+  expect(frames[0].name).toBe("hot [1.5M]");
+});

package/src/test/CoverageSampler.test.ts ADDED Viewed

@@ -0,0 +1,33 @@
+import { expect, test } from "vitest";
+import { withCoverageProfiling } from "../profiling/node/CoverageSampler.ts";
+test("withCoverageProfiling returns function execution counts", async () => {
+  function hotFunction() {
+    let sum = 0;
+    for (let i = 0; i < 100; i++) sum += i;
+    return sum;
+  }
+  const { result, coverage } = await withCoverageProfiling(_session => {
+    for (let i = 0; i < 10; i++) hotFunction();
+    return 42;
+  });
+  expect(result).toBe(42);
+  expect(coverage.scripts.length).toBeGreaterThan(0);
+  // Find our test file in the coverage data
+  const thisScript = coverage.scripts.find(s =>
+    s.url.includes("CoverageSampler.test"),
+  );
+  expect(thisScript).toBeDefined();
+  expect(thisScript!.functions.length).toBeGreaterThan(0);
+  // Find hotFunction and verify its count
+  const hotFn = thisScript!.functions.find(
+    f => f.functionName === "hotFunction",
+  );
+  expect(hotFn).toBeDefined();
+  const count = hotFn!.ranges[0].count;
+  expect(count).toBe(10);
+});

package/src/test/HeapAttribution.test.ts CHANGED Viewed

@@ -2,12 +2,12 @@ import { expect, test } from "vitest";
 import {
   aggregateSites,
   type HeapSite,
-} from "../heap-sample/HeapSampleReport.ts";
+} from "../profiling/node/HeapSampleReport.ts";
 test("unknown column does not merge distinct functions on same line", () => {
   const sites: HeapSite[] = [
-    { fn: "Foo", url: "test.ts", line: 10, col: undefined, bytes: 100 },
-    { fn: "Bar", url: "test.ts", line: 10, col: undefined, bytes: 200 },
+    { name: "Foo", url: "test.ts", line: 10, col: undefined, bytes: 100 },
+    { name: "Bar", url: "test.ts", line: 10, col: undefined, bytes: 200 },
   ];
   const aggregated = aggregateSites(sites);
   expect(aggregated).toHaveLength(2);
@@ -15,8 +15,8 @@ test("unknown column does not merge distinct functions on same line", () => {
 test("same column merges regardless of function name", () => {
   const sites: HeapSite[] = [
-    { fn: "Foo", url: "test.ts", line: 10, col: 5, bytes: 100 },
-    { fn: "Foo", url: "test.ts", line: 10, col: 5, bytes: 200 },
+    { name: "Foo", url: "test.ts", line: 10, col: 5, bytes: 100 },
+    { name: "Foo", url: "test.ts", line: 10, col: 5, bytes: 200 },
   ];
   const aggregated = aggregateSites(sites);
   expect(aggregated).toHaveLength(1);
@@ -25,18 +25,18 @@ test("same column merges regardless of function name", () => {
 test("aggregation preserves distinct caller stacks", () => {
   const stackA = [
-    { fn: "root", url: "a.ts", line: 1, col: 0 },
-    { fn: "foo", url: "a.ts", line: 10, col: 0 },
-    { fn: "alloc", url: "a.ts", line: 20, col: 5 },
+    { name: "root", url: "a.ts", line: 1, col: 0 },
+    { name: "foo", url: "a.ts", line: 10, col: 0 },
+    { name: "alloc", url: "a.ts", line: 20, col: 5 },
   ];
   const stackB = [
-    { fn: "root", url: "a.ts", line: 1, col: 0 },
-    { fn: "bar", url: "a.ts", line: 15, col: 0 },
-    { fn: "alloc", url: "a.ts", line: 20, col: 5 },
+    { name: "root", url: "a.ts", line: 1, col: 0 },
+    { name: "bar", url: "a.ts", line: 15, col: 0 },
+    { name: "alloc", url: "a.ts", line: 20, col: 5 },
   ];
   const sites: HeapSite[] = [
-    { fn: "alloc", url: "a.ts", line: 20, col: 5, bytes: 800, stack: stackA },
-    { fn: "alloc", url: "a.ts", line: 20, col: 5, bytes: 200, stack: stackB },
+    { name: "alloc", url: "a.ts", line: 20, col: 5, bytes: 800, stack: stackA },
+    { name: "alloc", url: "a.ts", line: 20, col: 5, bytes: 200, stack: stackB },
   ];
   const aggregated = aggregateSites(sites);
@@ -44,7 +44,7 @@ test("aggregation preserves distinct caller stacks", () => {
   expect(aggregated[0].bytes).toBe(1000);
   expect(aggregated[0].callers).toHaveLength(2);
   // Primary stack should be the highest-bytes path (foo)
-  expect(aggregated[0].stack![1].fn).toBe("foo");
+  expect(aggregated[0].stack![1].name).toBe("foo");
   // Callers sorted by bytes descending
   expect(aggregated[0].callers![0].bytes).toBe(800);
   expect(aggregated[0].callers![1].bytes).toBe(200);

package/src/{tests → test}/MatrixFilter.test.ts RENAMED Viewed

@@ -1,5 +1,5 @@
 import { expect, test } from "vitest";
-import type { BenchMatrix } from "../BenchMatrix.ts";
+import type { BenchMatrix } from "../matrix/BenchMatrix.ts";
 import { filterMatrix, parseMatrixFilter } from "../matrix/MatrixFilter.ts";
 const inlineMatrix: BenchMatrix<string> = {

package/src/{tests → test}/MatrixReport.test.ts RENAMED Viewed

@@ -1,5 +1,5 @@
 import { expect, test } from "vitest";
-import type { CaseResult, MatrixResults } from "../BenchMatrix.ts";
+import type { CaseResult, MatrixResults } from "../matrix/BenchMatrix.ts";
 import { reportMatrixResults } from "../matrix/MatrixReport.ts";
 /** Create simple measured results for testing */

package/src/test/PermutationTest.test.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import { expect, test } from "vitest";
-import { compareWithBaseline } from "../PermutationTest.ts";
+import { compareWithBaseline } from "../stats/PermutationTest.ts";
 import { assertValid, getSampleData } from "./TestUtils.ts";
 test("detects 20% performance improvement", () => {

package/src/{tests → test}/RealDataValidation.test.ts RENAMED Viewed

@@ -4,10 +4,10 @@ import {
   coefficientOfVariation,
   medianAbsoluteDeviation,
   percentile,
-} from "../StatisticalUtils.ts";
+} from "../stats/StatisticalUtils.ts";
 import { bevy30SamplesMs, bevy30SamplesNs } from "./fixtures/bevy30-samples.ts";
-test("bevy30 data characteristics", () => {
+test.skip("bevy30 data characteristics", () => {
   const sortedMs = [...bevy30SamplesMs].sort((a, b) => a - b);
   const stats = {
@@ -48,7 +48,7 @@ test("bevy30 data characteristics", () => {
   if (stats.cv > 0.5) console.warn("Very high variation - may be unstable");
 });
-test("convergence at different time points matches CLI behavior", () => {
+test.skip("convergence at different time points matches CLI behavior", () => {
   // Simulate 5-second run (approximately 100 samples at ~50ms each)
   const samples5s = bevy30SamplesNs.slice(0, 100);
   const result5s = checkConvergence(samples5s);
@@ -76,7 +76,7 @@ test("convergence at different time points matches CLI behavior", () => {
     );
 });
-test("warm-up detection in real data", () => {
+test.skip("warm-up detection in real data", () => {
   const windowSize = 20;
   const windows: Array<{ start: number; median: number }> = [];
@@ -104,7 +104,7 @@ test("warm-up detection in real data", () => {
   }
 });
-test("convergence stability over sliding windows", () => {
+test.skip("convergence stability over sliding windows", () => {
   const windowSize = 100;
   const step = 50;
   const history: Array<{ start: number; confidence: number }> = [];
@@ -132,7 +132,7 @@ test("convergence stability over sliding windows", () => {
   }
 });
-test("adaptive algorithm would stop at correct time", () => {
+test.skip("adaptive algorithm would stop at correct time", () => {
   const target = 95;
   const fallback = 80;
   const minSamples = 50;

package/src/test/RunBenchCLI.test.ts CHANGED Viewed

@@ -1,8 +1,8 @@
 import { execSync } from "node:child_process";
 import path from "node:path";
 import { expect, test } from "vitest";
-import type { BenchSuite } from "../Benchmark.ts";
 import { filterBenchmarks } from "../cli/FilterBenchmarks.ts";
+import type { BenchSuite } from "../runners/BenchmarkSpec.ts";
 import { runBenchCLITest } from "./TestUtils.ts";
 const testSuite: BenchSuite = {
@@ -68,7 +68,7 @@ function executeBenchforgeFile(file: string, args = ""): string {
 }
 test("runs all benchmarks", { timeout: 30000 }, async () => {
-  const output = await runBenchCLITest(testSuite, "--time 0.1");
+  const output = await runBenchCLITest(testSuite, "--duration 0.1");
   expect(output).toContain("concatenation");
   expect(output).toContain("template literal");
@@ -79,7 +79,10 @@ test("runs all benchmarks", { timeout: 30000 }, async () => {
 });
 test("filters by substring", { timeout: 15000 }, async () => {
-  const output = await runBenchCLITest(testSuite, "--filter concat --time 0.1");
+  const output = await runBenchCLITest(
+    testSuite,
+    "--filter concat --duration 0.1",
+  );
   expect(output).toContain("concatenation");
   expect(output).not.toContain("addition");
@@ -88,7 +91,7 @@ test("filters by substring", { timeout: 15000 }, async () => {
 test("filters by regex", { timeout: 15000 }, async () => {
   const output = await runBenchCLITest(
     testSuite,
-    "--filter ^template --time 0.1",
+    "--filter ^template --duration 0.1",
   );
   expect(output).toContain("template literal");
   expect(output).not.toContain("addition");
@@ -106,7 +109,7 @@ test("filter preserves suite structure", () => {
 });
 test("e2e: runs user script", { timeout: 30000 }, () => {
-  const output = executeTestScript("--time 0.1");
+  const output = executeTestScript("--duration 0.1");
   expect(output).toContain("plus");
   expect(output).toContain("multiply");
@@ -122,14 +125,14 @@ test("e2e: runs user script", { timeout: 30000 }, () => {
 });
 test("e2e: filter flag", { timeout: 30000 }, () => {
-  const output = executeTestScript('--filter "plus" --time 0.1');
+  const output = executeTestScript('--filter "plus" --duration 0.1');
   expect(output).toContain("plus");
   expect(output).not.toContain("multiply");
 });
 test("runs benchmarks with setup function", { timeout: 30000 }, async () => {
-  const output = await runBenchCLITest(suiteWithSetup, "--time 0.1");
+  const output = await runBenchCLITest(suiteWithSetup, "--duration 0.1");
   expect(output).toContain("sum numbers");
   expect(output).toContain("join strings");
@@ -137,40 +140,38 @@ test("runs benchmarks with setup function", { timeout: 30000 }, async () => {
   expect(output).toContain("runs");
 });
-test(
-  "runs benchmarks with baseline comparison",
-  { timeout: 30000 },
-  async () => {
-    const suiteWithBaseline: BenchSuite = {
-      name: "Baseline Test",
-      groups: [
-        {
-          name: "Sort Comparison",
-          setup: () => ({
-            data: Array.from({ length: 10 }, () => Math.random()),
-          }),
-          baseline: {
-            name: "baseline sort",
-            fn: ({ data }: any) => [...data].sort(),
-          },
-          benchmarks: [
-            {
-              name: "optimized sort",
-              fn: ({ data }: any) => [...data].sort((a, b) => a - b),
-            },
-          ],
+test("runs benchmarks with baseline comparison", {
+  timeout: 30000,
+}, async () => {
+  const suiteWithBaseline: BenchSuite = {
+    name: "Baseline Test",
+    groups: [
+      {
+        name: "Sort Comparison",
+        setup: () => ({
+          data: Array.from({ length: 10 }, () => Math.random()),
+        }),
+        baseline: {
+          name: "baseline sort",
+          fn: ({ data }: any) => [...data].sort(),
         },
-      ],
-    };
+        benchmarks: [
+          {
+            name: "optimized sort",
+            fn: ({ data }: any) => [...data].sort((a, b) => a - b),
+          },
+        ],
+      },
+    ],
+  };
-    const output = await runBenchCLITest(suiteWithBaseline, "--time 0.01");
+  const output = await runBenchCLITest(suiteWithBaseline, "--iterations 20");
-    expect(output).toContain("baseline sort");
-    expect(output).toContain("optimized sort");
-    expect(output).toContain("Δ%"); // Diff column should appear
-    expect(output).toContain("mean");
-  },
-);
+  expect(output).toContain("baseline sort");
+  expect(output).toContain("optimized sort");
+  expect(output).toContain("Δ%"); // Diff column should appear
+  expect(output).toContain("mean");
+});
 test("file mode: BenchSuite export", { timeout: 30000 }, () => {
   const output = executeBenchforgeFile(